diff --git "a/wandb/run-20220503_172048-zotxt8wa/files/wandb-summary.json" "b/wandb/run-20220503_172048-zotxt8wa/files/wandb-summary.json" --- "a/wandb/run-20220503_172048-zotxt8wa/files/wandb-summary.json" +++ "b/wandb/run-20220503_172048-zotxt8wa/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.5646, "train/learning_rate": 0.00028133557762064176, "train/epoch": 0.69, "train/global_step": 4500, "_runtime": 48456, "_timestamp": 1651646904, "_step": 4508, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1021.0], "bins": [-515.541015625, -507.42926025390625, -499.3175048828125, -491.20574951171875, -483.093994140625, -474.98223876953125, -466.8704833984375, -458.75872802734375, -450.64697265625, -442.53521728515625, -434.4234619140625, -426.31170654296875, -418.199951171875, -410.08819580078125, -401.9764404296875, -393.86468505859375, -385.7528991699219, -377.6411437988281, -369.5293884277344, -361.4176330566406, -353.3058776855469, -345.1941223144531, -337.0823669433594, -328.9705810546875, -320.85882568359375, -312.7470703125, -304.63531494140625, -296.5235595703125, -288.41180419921875, -280.300048828125, -272.18829345703125, -264.0765380859375, -255.96478271484375, -247.85302734375, -239.74127197265625, -231.6295166015625, -223.51776123046875, -215.406005859375, -207.2942352294922, -199.18247985839844, -191.0707244873047, -182.95896911621094, -174.8472137451172, -166.73545837402344, -158.62368774414062, -150.51193237304688, -142.40017700195312, -134.28842163085938, -126.17666625976562, -118.06491088867188, -109.95315551757812, -101.84139251708984, -93.7296371459961, -85.61788177490234, -77.50611877441406, -69.39436340332031, -61.28260803222656, -53.17085266113281, -45.0590934753418, -36.94733428955078, -28.83557891845703, -20.72382354736328, -12.612064361572266, -4.50030517578125, 3.6114518642425537]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 8.0, 9.0, 16.0, 13.0, 25.0, 37.0, 68.0, 48.0, 69.0, 84.0, 90.0, 79.0, 74.0, 51.0, 57.0, 66.0, 45.0, 38.0, 29.0, 28.0, 23.0, 17.0, 10.0, 6.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.99260139465332, -19.24203872680664, -18.491474151611328, -17.74091148376465, -16.990346908569336, -16.239784240722656, -15.48922061920166, -14.738656997680664, -13.988093376159668, -13.237529754638672, -12.486966133117676, -11.73640251159668, -10.98583984375, -10.235275268554688, -9.484712600708008, -8.734148979187012, -7.983585357666016, -7.2330217361450195, -6.482458114624023, -5.7318949699401855, -4.9813313484191895, -4.230767726898193, -3.4802045822143555, -2.7296409606933594, -1.9790773391723633, -1.2285138368606567, -0.4779503345489502, 0.2726130485534668, 1.023176670074463, 1.773740291595459, 2.524303436279297, 3.274867057800293, 4.025428771972656, 4.775992393493652, 5.526556015014648, 6.277119159698486, 7.027682781219482, 7.7782464027404785, 8.528809547424316, 9.279373168945312, 10.029936790466309, 10.780500411987305, 11.5310640335083, 12.281627655029297, 13.032190322875977, 13.782754898071289, 14.533317565917969, 15.283881187438965, 16.03444480895996, 16.78500747680664, 17.535572052001953, 18.286134719848633, 19.036699295043945, 19.787261962890625, 20.537826538085938, 21.288389205932617, 22.038951873779297, 22.789514541625977, 23.54007911682129, 24.29064178466797, 25.04120635986328, 25.79176902770996, 26.54233169555664, 27.292896270751953, 28.043460845947266]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 21.0, 21.0, 27.0, 53.0, 82.0, 147.0, 218.0, 399.0, 683.0, 1220.0, 2648.0, 8169.0, 43969.0, 4114583.0, 14210.0, 3987.0, 1744.0, 962.0, 489.0, 253.0, 158.0, 87.0, 62.0, 29.0, 21.0, 10.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0078125, -7.6768798828125, -7.345947265625, -7.0150146484375, -6.68408203125, -6.3531494140625, -6.022216796875, -5.6912841796875, -5.3603515625, -5.0294189453125, -4.698486328125, -4.3675537109375, -4.03662109375, -3.7056884765625, -3.374755859375, -3.0438232421875, -2.712890625, -2.3819580078125, -2.051025390625, -1.7200927734375, -1.38916015625, -1.0582275390625, -0.727294921875, -0.3963623046875, -0.0654296875, 0.2655029296875, 0.596435546875, 0.9273681640625, 1.25830078125, 1.5892333984375, 1.920166015625, 2.2510986328125, 2.58203125, 2.9129638671875, 3.243896484375, 3.5748291015625, 3.90576171875, 4.2366943359375, 4.567626953125, 4.8985595703125, 5.2294921875, 5.5604248046875, 5.891357421875, 6.2222900390625, 6.55322265625, 6.8841552734375, 7.215087890625, 7.5460205078125, 7.876953125, 8.2078857421875, 8.538818359375, 8.8697509765625, 9.20068359375, 9.5316162109375, 9.862548828125, 10.1934814453125, 10.5244140625, 10.8553466796875, 11.186279296875, 11.5172119140625, 11.84814453125, 12.1790771484375, 12.510009765625, 12.8409423828125, 13.171875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 2.0, 15.0, 13.0, 15.0, 32.0, 49.0, 56.0, 59.0, 89.0, 86.0, 92.0, 72.0, 73.0, 61.0, 67.0, 49.0, 45.0, 32.0, 27.0, 19.0, 12.0, 15.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.1844482421875, -11.736083984375, -11.2877197265625, -10.83935546875, -10.3909912109375, -9.942626953125, -9.4942626953125, -9.0458984375, -8.5975341796875, -8.149169921875, -7.7008056640625, -7.25244140625, -6.8040771484375, -6.355712890625, -5.9073486328125, -5.458984375, -5.0106201171875, -4.562255859375, -4.1138916015625, -3.66552734375, -3.2171630859375, -2.768798828125, -2.3204345703125, -1.8720703125, -1.4237060546875, -0.975341796875, -0.5269775390625, -0.07861328125, 0.3697509765625, 0.818115234375, 1.2664794921875, 1.71484375, 2.1632080078125, 2.611572265625, 3.0599365234375, 3.50830078125, 3.9566650390625, 4.405029296875, 4.8533935546875, 5.3017578125, 5.7501220703125, 6.198486328125, 6.6468505859375, 7.09521484375, 7.5435791015625, 7.991943359375, 8.4403076171875, 8.888671875, 9.3370361328125, 9.785400390625, 10.2337646484375, 10.68212890625, 11.1304931640625, 11.578857421875, 12.0272216796875, 12.4755859375, 12.9239501953125, 13.372314453125, 13.8206787109375, 14.26904296875, 14.7174072265625, 15.165771484375, 15.6141357421875, 16.0625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 4.0, 17.0, 26.0, 4193633.0, 541.0, 20.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.25, -261.72265625, -249.1953125, -236.66796875, -224.140625, -211.61328125, -199.0859375, -186.55859375, -174.03125, -161.50390625, -148.9765625, -136.44921875, -123.921875, -111.39453125, -98.8671875, -86.33984375, -73.8125, -61.28515625, -48.7578125, -36.23046875, -23.703125, -11.17578125, 1.3515625, 13.87890625, 26.40625, 38.93359375, 51.4609375, 63.98828125, 76.515625, 89.04296875, 101.5703125, 114.09765625, 126.625, 139.15234375, 151.6796875, 164.20703125, 176.734375, 189.26171875, 201.7890625, 214.31640625, 226.84375, 239.37109375, 251.8984375, 264.42578125, 276.953125, 289.48046875, 302.0078125, 314.53515625, 327.0625, 339.58984375, 352.1171875, 364.64453125, 377.171875, 389.69921875, 402.2265625, 414.75390625, 427.28125, 439.80859375, 452.3359375, 464.86328125, 477.390625, 489.91796875, 502.4453125, 514.97265625, 527.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 9.0, 16.0, 47.0, 3942.0, 16.0, 7.0, 4.0, 8.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6015625, -3.44085693359375, -3.2801513671875, -3.11944580078125, -2.958740234375, -2.79803466796875, -2.6373291015625, -2.47662353515625, -2.31591796875, -2.15521240234375, -1.9945068359375, -1.83380126953125, -1.673095703125, -1.51239013671875, -1.3516845703125, -1.19097900390625, -1.0302734375, -0.86956787109375, -0.7088623046875, -0.54815673828125, -0.387451171875, -0.22674560546875, -0.0660400390625, 0.09466552734375, 0.25537109375, 0.41607666015625, 0.5767822265625, 0.73748779296875, 0.898193359375, 1.05889892578125, 1.2196044921875, 1.38031005859375, 1.541015625, 1.70172119140625, 1.8624267578125, 2.02313232421875, 2.183837890625, 2.34454345703125, 2.5052490234375, 2.66595458984375, 2.82666015625, 2.98736572265625, 3.1480712890625, 3.30877685546875, 3.469482421875, 3.63018798828125, 3.7908935546875, 3.95159912109375, 4.1123046875, 4.27301025390625, 4.4337158203125, 4.59442138671875, 4.755126953125, 4.91583251953125, 5.0765380859375, 5.23724365234375, 5.39794921875, 5.55865478515625, 5.7193603515625, 5.88006591796875, 6.040771484375, 6.20147705078125, 6.3621826171875, 6.52288818359375, 6.68359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 12.0, 29.0, 110.0, 448.0, 296.0, 83.0, 24.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.157729148864746, -12.425065040588379, -11.692399978637695, -10.959735870361328, -10.227071762084961, -9.494406700134277, -8.76174259185791, -8.029077529907227, -7.296413421630859, -6.563748836517334, -5.831084251403809, -5.098420143127441, -4.365755558013916, -3.6330909729003906, -2.9004268646240234, -2.167762279510498, -1.4350976943969727, -0.7024332284927368, 0.030231237411499023, 0.7628955841064453, 1.4955601692199707, 2.228224754333496, 2.9608888626098633, 3.6935534477233887, 4.426218032836914, 5.1588826179504395, 5.891547203063965, 6.624211311340332, 7.356875896453857, 8.089540481567383, 8.82220458984375, 9.554868698120117, 10.287532806396484, 11.020196914672852, 11.752861976623535, 12.485526084899902, 13.218191146850586, 13.950855255126953, 14.68351936340332, 15.416183471679688, 16.148849487304688, 16.881513595581055, 17.614177703857422, 18.346843719482422, 19.07950782775879, 19.812171936035156, 20.544836044311523, 21.27750015258789, 22.010164260864258, 22.742828369140625, 23.475492477416992, 24.20815658569336, 24.94082260131836, 25.673486709594727, 26.406150817871094, 27.13881492614746, 27.871479034423828, 28.604143142700195, 29.336807250976562, 30.069473266601562, 30.80213737487793, 31.534801483154297, 32.26746368408203, 33.00012969970703, 33.73279571533203]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 5.0, 22.0, 22.0, 21.0, 28.0, 35.0, 38.0, 57.0, 47.0, 61.0, 58.0, 65.0, 58.0, 77.0, 53.0, 46.0, 47.0, 38.0, 47.0, 41.0, 27.0, 24.0, 17.0, 21.0, 11.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.512107849121094, -15.050027847290039, -14.587947845458984, -14.12586784362793, -13.663787841796875, -13.20170783996582, -12.739627838134766, -12.277547836303711, -11.815467834472656, -11.353387832641602, -10.891307830810547, -10.429227828979492, -9.967147827148438, -9.505067825317383, -9.042987823486328, -8.580907821655273, -8.118828773498535, -7.6567487716674805, -7.194668769836426, -6.732588768005371, -6.270508766174316, -5.808428764343262, -5.346349239349365, -4.8842692375183105, -4.422189235687256, -3.960109233856201, -3.4980292320251465, -3.035949468612671, -2.573869466781616, -2.1117894649505615, -1.649709701538086, -1.1876296997070312, -0.7255487442016602, -0.26346880197525024, 0.19861114025115967, 0.6606910228729248, 1.1227710247039795, 1.5848510265350342, 2.0469307899475098, 2.5090107917785645, 2.971090793609619, 3.433170795440674, 3.8952507972717285, 4.357330322265625, 4.81941032409668, 5.281490325927734, 5.743570327758789, 6.205650329589844, 6.667730331420898, 7.129810333251953, 7.591890335083008, 8.053970336914062, 8.516050338745117, 8.978130340576172, 9.440210342407227, 9.902290344238281, 10.364370346069336, 10.82645034790039, 11.288530349731445, 11.7506103515625, 12.212690353393555, 12.67477035522461, 13.136850357055664, 13.598930358886719, 14.061009407043457]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 7.0, 4.0, 7.0, 15.0, 11.0, 21.0, 30.0, 38.0, 56.0, 78.0, 121.0, 195.0, 249.0, 468.0, 841.0, 1448.0, 2821.0, 6002.0, 16022.0, 110107.0, 860862.0, 31313.0, 9170.0, 3895.0, 2007.0, 1096.0, 595.0, 365.0, 231.0, 149.0, 97.0, 60.0, 50.0, 30.0, 26.0, 13.0, 11.0, 6.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.783203125, -1.7242279052734375, -1.665252685546875, -1.6062774658203125, -1.54730224609375, -1.4883270263671875, -1.429351806640625, -1.3703765869140625, -1.3114013671875, -1.2524261474609375, -1.193450927734375, -1.1344757080078125, -1.07550048828125, -1.0165252685546875, -0.957550048828125, -0.8985748291015625, -0.839599609375, -0.7806243896484375, -0.721649169921875, -0.6626739501953125, -0.60369873046875, -0.5447235107421875, -0.485748291015625, -0.4267730712890625, -0.3677978515625, -0.3088226318359375, -0.249847412109375, -0.1908721923828125, -0.13189697265625, -0.0729217529296875, -0.013946533203125, 0.0450286865234375, 0.10400390625, 0.1629791259765625, 0.221954345703125, 0.2809295654296875, 0.33990478515625, 0.3988800048828125, 0.457855224609375, 0.5168304443359375, 0.5758056640625, 0.6347808837890625, 0.693756103515625, 0.7527313232421875, 0.81170654296875, 0.8706817626953125, 0.929656982421875, 0.9886322021484375, 1.047607421875, 1.1065826416015625, 1.165557861328125, 1.2245330810546875, 1.28350830078125, 1.3424835205078125, 1.401458740234375, 1.4604339599609375, 1.5194091796875, 1.5783843994140625, 1.637359619140625, 1.6963348388671875, 1.75531005859375, 1.8142852783203125, 1.873260498046875, 1.9322357177734375, 1.9912109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 8.0, 9.0, 16.0, 20.0, 26.0, 48.0, 47.0, 57.0, 71.0, 83.0, 78.0, 103.0, 85.0, 67.0, 52.0, 60.0, 41.0, 39.0, 24.0, 17.0, 16.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.70703125, -7.475830078125, -7.24462890625, -7.013427734375, -6.7822265625, -6.551025390625, -6.31982421875, -6.088623046875, -5.857421875, -5.626220703125, -5.39501953125, -5.163818359375, -4.9326171875, -4.701416015625, -4.47021484375, -4.239013671875, -4.0078125, -3.776611328125, -3.54541015625, -3.314208984375, -3.0830078125, -2.851806640625, -2.62060546875, -2.389404296875, -2.158203125, -1.927001953125, -1.69580078125, -1.464599609375, -1.2333984375, -1.002197265625, -0.77099609375, -0.539794921875, -0.30859375, -0.077392578125, 0.15380859375, 0.385009765625, 0.6162109375, 0.847412109375, 1.07861328125, 1.309814453125, 1.541015625, 1.772216796875, 2.00341796875, 2.234619140625, 2.4658203125, 2.697021484375, 2.92822265625, 3.159423828125, 3.390625, 3.621826171875, 3.85302734375, 4.084228515625, 4.3154296875, 4.546630859375, 4.77783203125, 5.009033203125, 5.240234375, 5.471435546875, 5.70263671875, 5.933837890625, 6.1650390625, 6.396240234375, 6.62744140625, 6.858642578125, 7.08984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 13.0, 9.0, 15.0, 24.0, 32.0, 43.0, 53.0, 68.0, 104.0, 137.0, 243.0, 501.0, 1464.0, 5865.0, 35007.0, 682510.0, 293268.0, 22630.0, 4133.0, 1217.0, 447.0, 243.0, 142.0, 90.0, 68.0, 47.0, 43.0, 27.0, 15.0, 24.0, 11.0, 12.0, 7.0, 8.0, 3.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.25768280029296875, -0.2487640380859375, -0.23984527587890625, -0.230926513671875, -0.22200775146484375, -0.2130889892578125, -0.20417022705078125, -0.19525146484375, -0.18633270263671875, -0.1774139404296875, -0.16849517822265625, -0.159576416015625, -0.15065765380859375, -0.1417388916015625, -0.13282012939453125, -0.1239013671875, -0.11498260498046875, -0.1060638427734375, -0.09714508056640625, -0.088226318359375, -0.07930755615234375, -0.0703887939453125, -0.06147003173828125, -0.05255126953125, -0.04363250732421875, -0.0347137451171875, -0.02579498291015625, -0.016876220703125, -0.00795745849609375, 0.0009613037109375, 0.00988006591796875, 0.018798828125, 0.02771759033203125, 0.0366363525390625, 0.04555511474609375, 0.054473876953125, 0.06339263916015625, 0.0723114013671875, 0.08123016357421875, 0.09014892578125, 0.09906768798828125, 0.1079864501953125, 0.11690521240234375, 0.125823974609375, 0.13474273681640625, 0.1436614990234375, 0.15258026123046875, 0.1614990234375, 0.17041778564453125, 0.1793365478515625, 0.18825531005859375, 0.197174072265625, 0.20609283447265625, 0.2150115966796875, 0.22393035888671875, 0.23284912109375, 0.24176788330078125, 0.2506866455078125, 0.25960540771484375, 0.268524169921875, 0.27744293212890625, 0.2863616943359375, 0.29528045654296875, 0.30419921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 11.0, 7.0, 11.0, 14.0, 18.0, 17.0, 20.0, 28.0, 38.0, 37.0, 40.0, 53.0, 49.0, 46.0, 47.0, 49.0, 44.0, 44.0, 62.0, 43.0, 48.0, 43.0, 37.0, 31.0, 33.0, 26.0, 27.0, 14.0, 8.0, 10.0, 6.0, 5.0, 5.0, 6.0, 1.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.78125, -6.55499267578125, -6.3287353515625, -6.10247802734375, -5.876220703125, -5.64996337890625, -5.4237060546875, -5.19744873046875, -4.97119140625, -4.74493408203125, -4.5186767578125, -4.29241943359375, -4.066162109375, -3.83990478515625, -3.6136474609375, -3.38739013671875, -3.1611328125, -2.93487548828125, -2.7086181640625, -2.48236083984375, -2.256103515625, -2.02984619140625, -1.8035888671875, -1.57733154296875, -1.35107421875, -1.12481689453125, -0.8985595703125, -0.67230224609375, -0.446044921875, -0.21978759765625, 0.0064697265625, 0.23272705078125, 0.458984375, 0.68524169921875, 0.9114990234375, 1.13775634765625, 1.364013671875, 1.59027099609375, 1.8165283203125, 2.04278564453125, 2.26904296875, 2.49530029296875, 2.7215576171875, 2.94781494140625, 3.174072265625, 3.40032958984375, 3.6265869140625, 3.85284423828125, 4.0791015625, 4.30535888671875, 4.5316162109375, 4.75787353515625, 4.984130859375, 5.21038818359375, 5.4366455078125, 5.66290283203125, 5.88916015625, 6.11541748046875, 6.3416748046875, 6.56793212890625, 6.794189453125, 7.02044677734375, 7.2467041015625, 7.47296142578125, 7.69921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 5.0, 13.0, 10.0, 13.0, 18.0, 21.0, 39.0, 44.0, 77.0, 102.0, 128.0, 192.0, 267.0, 374.0, 492.0, 726.0, 1076.0, 1539.0, 2441.0, 3780.0, 6575.0, 13297.0, 35763.0, 148426.0, 639370.0, 132206.0, 32585.0, 12321.0, 6191.0, 3557.0, 2156.0, 1491.0, 955.0, 647.0, 511.0, 313.0, 214.0, 188.0, 115.0, 74.0, 77.0, 46.0, 33.0, 24.0, 21.0, 13.0, 6.0, 8.0, 8.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0015239715576171875, -0.001478433609008789, -0.0014328956604003906, -0.0013873577117919922, -0.0013418197631835938, -0.0012962818145751953, -0.0012507438659667969, -0.0012052059173583984, -0.00115966796875, -0.0011141300201416016, -0.0010685920715332031, -0.0010230541229248047, -0.0009775161743164062, -0.0009319782257080078, -0.0008864402770996094, -0.0008409023284912109, -0.0007953643798828125, -0.0007498264312744141, -0.0007042884826660156, -0.0006587505340576172, -0.0006132125854492188, -0.0005676746368408203, -0.0005221366882324219, -0.00047659873962402344, -0.000431060791015625, -0.00038552284240722656, -0.0003399848937988281, -0.0002944469451904297, -0.00024890899658203125, -0.0002033710479736328, -0.00015783309936523438, -0.00011229515075683594, -6.67572021484375e-05, -2.1219253540039062e-05, 2.4318695068359375e-05, 6.985664367675781e-05, 0.00011539459228515625, 0.0001609325408935547, 0.00020647048950195312, 0.00025200843811035156, 0.00029754638671875, 0.00034308433532714844, 0.0003886222839355469, 0.0004341602325439453, 0.00047969818115234375, 0.0005252361297607422, 0.0005707740783691406, 0.0006163120269775391, 0.0006618499755859375, 0.0007073879241943359, 0.0007529258728027344, 0.0007984638214111328, 0.0008440017700195312, 0.0008895397186279297, 0.0009350776672363281, 0.0009806156158447266, 0.001026153564453125, 0.0010716915130615234, 0.0011172294616699219, 0.0011627674102783203, 0.0012083053588867188, 0.0012538433074951172, 0.0012993812561035156, 0.001344919204711914, 0.0013904571533203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 2.0, 8.0, 13.0, 24.0, 38.0, 95.0, 287.0, 315.0, 93.0, 45.0, 33.0, 18.0, 8.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000186920166015625, -0.00018173456192016602, -0.00017654895782470703, -0.00017136335372924805, -0.00016617774963378906, -0.00016099214553833008, -0.0001558065414428711, -0.0001506209373474121, -0.00014543533325195312, -0.00014024972915649414, -0.00013506412506103516, -0.00012987852096557617, -0.0001246929168701172, -0.0001195073127746582, -0.00011432170867919922, -0.00010913610458374023, -0.00010395050048828125, -9.876489639282227e-05, -9.357929229736328e-05, -8.83936882019043e-05, -8.320808410644531e-05, -7.802248001098633e-05, -7.283687591552734e-05, -6.765127182006836e-05, -6.246566772460938e-05, -5.728006362915039e-05, -5.2094459533691406e-05, -4.690885543823242e-05, -4.172325134277344e-05, -3.653764724731445e-05, -3.135204315185547e-05, -2.6166439056396484e-05, -2.09808349609375e-05, -1.5795230865478516e-05, -1.0609626770019531e-05, -5.424022674560547e-06, -2.384185791015625e-07, 4.947185516357422e-06, 1.0132789611816406e-05, 1.531839370727539e-05, 2.0503997802734375e-05, 2.568960189819336e-05, 3.0875205993652344e-05, 3.606081008911133e-05, 4.124641418457031e-05, 4.64320182800293e-05, 5.161762237548828e-05, 5.6803226470947266e-05, 6.198883056640625e-05, 6.717443466186523e-05, 7.236003875732422e-05, 7.75456428527832e-05, 8.273124694824219e-05, 8.791685104370117e-05, 9.310245513916016e-05, 9.828805923461914e-05, 0.00010347366333007812, 0.00010865926742553711, 0.0001138448715209961, 0.00011903047561645508, 0.00012421607971191406, 0.00012940168380737305, 0.00013458728790283203, 0.00013977289199829102, 0.00014495849609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 3.0, 7.0, 14.0, 17.0, 23.0, 39.0, 83.0, 334.0, 983491.0, 64038.0, 264.0, 74.0, 42.0, 32.0, 10.0, 11.0, 10.0, 6.0, 7.0, 4.0, 2.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0157928466796875, -0.015365362167358398, -0.014937877655029297, -0.014510393142700195, -0.014082908630371094, -0.013655424118041992, -0.01322793960571289, -0.012800455093383789, -0.012372970581054688, -0.011945486068725586, -0.011518001556396484, -0.011090517044067383, -0.010663032531738281, -0.01023554801940918, -0.009808063507080078, -0.009380578994750977, -0.008953094482421875, -0.008525609970092773, -0.008098125457763672, -0.00767064094543457, -0.007243156433105469, -0.006815671920776367, -0.006388187408447266, -0.005960702896118164, -0.0055332183837890625, -0.005105733871459961, -0.004678249359130859, -0.004250764846801758, -0.0038232803344726562, -0.0033957958221435547, -0.002968311309814453, -0.0025408267974853516, -0.00211334228515625, -0.0016858577728271484, -0.0012583732604980469, -0.0008308887481689453, -0.00040340423583984375, 2.4080276489257812e-05, 0.0004515647888183594, 0.0008790493011474609, 0.0013065338134765625, 0.001734018325805664, 0.0021615028381347656, 0.002588987350463867, 0.0030164718627929688, 0.0034439563751220703, 0.003871440887451172, 0.0042989253997802734, 0.004726409912109375, 0.0051538944244384766, 0.005581378936767578, 0.00600886344909668, 0.006436347961425781, 0.006863832473754883, 0.007291316986083984, 0.007718801498413086, 0.008146286010742188, 0.008573770523071289, 0.00900125503540039, 0.009428739547729492, 0.009856224060058594, 0.010283708572387695, 0.010711193084716797, 0.011138677597045898, 0.011566162109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 1.0, 10.0, 8.0, 7.0, 12.0, 16.0, 22.0, 20.0, 48.0, 78.0, 119.0, 191.0, 149.0, 94.0, 58.0, 43.0, 31.0, 20.0, 11.0, 15.0, 7.0, 7.0, 3.0, 6.0, 3.0, 4.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004715919494628906, -0.00045880675315856934, -0.00044602155685424805, -0.00043323636054992676, -0.00042045116424560547, -0.0004076659679412842, -0.0003948807716369629, -0.0003820955753326416, -0.0003693103790283203, -0.000356525182723999, -0.00034373998641967773, -0.00033095479011535645, -0.00031816959381103516, -0.00030538439750671387, -0.0002925992012023926, -0.0002798140048980713, -0.00026702880859375, -0.0002542436122894287, -0.00024145841598510742, -0.00022867321968078613, -0.00021588802337646484, -0.00020310282707214355, -0.00019031763076782227, -0.00017753243446350098, -0.0001647472381591797, -0.0001519620418548584, -0.0001391768455505371, -0.00012639164924621582, -0.00011360645294189453, -0.00010082125663757324, -8.803606033325195e-05, -7.525086402893066e-05, -6.246566772460938e-05, -4.9680471420288086e-05, -3.68952751159668e-05, -2.4110078811645508e-05, -1.1324882507324219e-05, 1.4603137969970703e-06, 1.424551010131836e-05, 2.703070640563965e-05, 3.981590270996094e-05, 5.2601099014282227e-05, 6.538629531860352e-05, 7.81714916229248e-05, 9.09566879272461e-05, 0.00010374188423156738, 0.00011652708053588867, 0.00012931227684020996, 0.00014209747314453125, 0.00015488266944885254, 0.00016766786575317383, 0.00018045306205749512, 0.0001932382583618164, 0.0002060234546661377, 0.00021880865097045898, 0.00023159384727478027, 0.00024437904357910156, 0.00025716423988342285, 0.00026994943618774414, 0.00028273463249206543, 0.0002955198287963867, 0.000308305025100708, 0.0003210902214050293, 0.0003338754177093506, 0.0003466606140136719]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 46.0, 339.0, 524.0, 68.0, 14.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.316783905029297, -6.601988315582275, -5.887192726135254, -5.172397613525391, -4.457601547241211, -3.7428061962127686, -3.028010845184326, -2.3132152557373047, -1.5984196662902832, -0.8836241364479065, -0.16882860660552979, 0.5459668636322021, 1.2607624530792236, 1.9755580425262451, 2.6903533935546875, 3.405148983001709, 4.1199445724487305, 4.834740161895752, 5.549535751342773, 6.264330863952637, 6.979126930236816, 7.69392204284668, 8.40871810913086, 9.123513221740723, 9.838308334350586, 10.55310344696045, 11.267899513244629, 11.982694625854492, 12.697490692138672, 13.412285804748535, 14.127080917358398, 14.841876983642578, 15.556673049926758, 16.271469116210938, 16.986263275146484, 17.701059341430664, 18.415855407714844, 19.130651473999023, 19.84544563293457, 20.56024169921875, 21.27503776550293, 21.98983383178711, 22.704627990722656, 23.419424057006836, 24.134220123291016, 24.849016189575195, 25.563810348510742, 26.278606414794922, 26.99340057373047, 27.70819664001465, 28.422990798950195, 29.137786865234375, 29.852582931518555, 30.567378997802734, 31.28217315673828, 31.99696922302246, 32.71176528930664, 33.42655944824219, 34.141357421875, 34.85615158081055, 35.570945739746094, 36.285743713378906, 37.00053787231445, 37.71533203125, 38.43013000488281]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 10.0, 21.0, 19.0, 28.0, 61.0, 47.0, 64.0, 68.0, 86.0, 79.0, 89.0, 78.0, 53.0, 57.0, 60.0, 47.0, 32.0, 25.0, 20.0, 10.0, 9.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.200119495391846, -6.987898349761963, -6.775676727294922, -6.563455581665039, -6.351234436035156, -6.139013290405273, -5.926792144775391, -5.71457052230835, -5.502349376678467, -5.290128231048584, -5.077906608581543, -4.86568546295166, -4.653464317321777, -4.4412431716918945, -4.229022026062012, -4.016800403594971, -3.804579257965088, -3.592358112335205, -3.380136728286743, -3.1679153442382812, -2.9556941986083984, -2.7434730529785156, -2.5312516689300537, -2.319030284881592, -2.106809139251709, -1.8945878744125366, -1.6823666095733643, -1.470145344734192, -1.2579240798950195, -1.0457028150558472, -0.8334815502166748, -0.6212602853775024, -0.4090390205383301, -0.19681775569915771, 0.015403509140014648, 0.227624773979187, 0.4398460388183594, 0.6520673036575317, 0.8642885684967041, 1.0765098333358765, 1.2887310981750488, 1.5009523630142212, 1.7131736278533936, 1.925394892692566, 2.1376161575317383, 2.349837303161621, 2.562058687210083, 2.774280071258545, 2.9865012168884277, 3.1987223625183105, 3.4109437465667725, 3.6231651306152344, 3.835386276245117, 4.047607421875, 4.259828567504883, 4.472050189971924, 4.684271335601807, 4.8964924812316895, 5.1087141036987305, 5.320935249328613, 5.533156394958496, 5.745377540588379, 5.957598686218262, 6.169820308685303, 6.3820414543151855]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 3.0, 6.0, 11.0, 15.0, 21.0, 22.0, 41.0, 66.0, 82.0, 173.0, 328.0, 590.0, 1396.0, 3977.0, 17501.0, 258075.0, 724500.0, 32381.0, 5845.0, 1836.0, 777.0, 374.0, 228.0, 111.0, 62.0, 43.0, 16.0, 29.0, 12.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.45941162109375, -7.2274169921875, -6.99542236328125, -6.763427734375, -6.53143310546875, -6.2994384765625, -6.06744384765625, -5.83544921875, -5.60345458984375, -5.3714599609375, -5.13946533203125, -4.907470703125, -4.67547607421875, -4.4434814453125, -4.21148681640625, -3.9794921875, -3.74749755859375, -3.5155029296875, -3.28350830078125, -3.051513671875, -2.81951904296875, -2.5875244140625, -2.35552978515625, -2.12353515625, -1.89154052734375, -1.6595458984375, -1.42755126953125, -1.195556640625, -0.96356201171875, -0.7315673828125, -0.49957275390625, -0.267578125, -0.03558349609375, 0.1964111328125, 0.42840576171875, 0.660400390625, 0.89239501953125, 1.1243896484375, 1.35638427734375, 1.58837890625, 1.82037353515625, 2.0523681640625, 2.28436279296875, 2.516357421875, 2.74835205078125, 2.9803466796875, 3.21234130859375, 3.4443359375, 3.67633056640625, 3.9083251953125, 4.14031982421875, 4.372314453125, 4.60430908203125, 4.8363037109375, 5.06829833984375, 5.30029296875, 5.53228759765625, 5.7642822265625, 5.99627685546875, 6.228271484375, 6.46026611328125, 6.6922607421875, 6.92425537109375, 7.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 9.0, 11.0, 11.0, 18.0, 17.0, 32.0, 44.0, 51.0, 50.0, 82.0, 94.0, 86.0, 88.0, 102.0, 50.0, 66.0, 50.0, 51.0, 23.0, 22.0, 17.0, 10.0, 5.0, 0.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71875, -5.56365966796875, -5.4085693359375, -5.25347900390625, -5.098388671875, -4.94329833984375, -4.7882080078125, -4.63311767578125, -4.47802734375, -4.32293701171875, -4.1678466796875, -4.01275634765625, -3.857666015625, -3.70257568359375, -3.5474853515625, -3.39239501953125, -3.2373046875, -3.08221435546875, -2.9271240234375, -2.77203369140625, -2.616943359375, -2.46185302734375, -2.3067626953125, -2.15167236328125, -1.99658203125, -1.84149169921875, -1.6864013671875, -1.53131103515625, -1.376220703125, -1.22113037109375, -1.0660400390625, -0.91094970703125, -0.755859375, -0.60076904296875, -0.4456787109375, -0.29058837890625, -0.135498046875, 0.01959228515625, 0.1746826171875, 0.32977294921875, 0.48486328125, 0.63995361328125, 0.7950439453125, 0.95013427734375, 1.105224609375, 1.26031494140625, 1.4154052734375, 1.57049560546875, 1.7255859375, 1.88067626953125, 2.0357666015625, 2.19085693359375, 2.345947265625, 2.50103759765625, 2.6561279296875, 2.81121826171875, 2.96630859375, 3.12139892578125, 3.2764892578125, 3.43157958984375, 3.586669921875, 3.74176025390625, 3.8968505859375, 4.05194091796875, 4.20703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 10.0, 9.0, 16.0, 23.0, 25.0, 26.0, 35.0, 54.0, 70.0, 195.0, 860.0, 1046242.0, 504.0, 161.0, 64.0, 49.0, 31.0, 36.0, 15.0, 22.0, 15.0, 8.0, 8.0, 7.0, 11.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.3125, -120.3505859375, -116.388671875, -112.4267578125, -108.46484375, -104.5029296875, -100.541015625, -96.5791015625, -92.6171875, -88.6552734375, -84.693359375, -80.7314453125, -76.76953125, -72.8076171875, -68.845703125, -64.8837890625, -60.921875, -56.9599609375, -52.998046875, -49.0361328125, -45.07421875, -41.1123046875, -37.150390625, -33.1884765625, -29.2265625, -25.2646484375, -21.302734375, -17.3408203125, -13.37890625, -9.4169921875, -5.455078125, -1.4931640625, 2.46875, 6.4306640625, 10.392578125, 14.3544921875, 18.31640625, 22.2783203125, 26.240234375, 30.2021484375, 34.1640625, 38.1259765625, 42.087890625, 46.0498046875, 50.01171875, 53.9736328125, 57.935546875, 61.8974609375, 65.859375, 69.8212890625, 73.783203125, 77.7451171875, 81.70703125, 85.6689453125, 89.630859375, 93.5927734375, 97.5546875, 101.5166015625, 105.478515625, 109.4404296875, 113.40234375, 117.3642578125, 121.326171875, 125.2880859375, 129.25]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 11.0, 10.0, 10.0, 11.0, 19.0, 20.0, 21.0, 27.0, 33.0, 36.0, 41.0, 66.0, 69.0, 78.0, 80.0, 85.0, 61.0, 70.0, 37.0, 34.0, 33.0, 26.0, 19.0, 9.0, 15.0, 9.0, 7.0, 14.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3203125, -10.9776611328125, -10.635009765625, -10.2923583984375, -9.94970703125, -9.6070556640625, -9.264404296875, -8.9217529296875, -8.5791015625, -8.2364501953125, -7.893798828125, -7.5511474609375, -7.20849609375, -6.8658447265625, -6.523193359375, -6.1805419921875, -5.837890625, -5.4952392578125, -5.152587890625, -4.8099365234375, -4.46728515625, -4.1246337890625, -3.781982421875, -3.4393310546875, -3.0966796875, -2.7540283203125, -2.411376953125, -2.0687255859375, -1.72607421875, -1.3834228515625, -1.040771484375, -0.6981201171875, -0.35546875, -0.0128173828125, 0.329833984375, 0.6724853515625, 1.01513671875, 1.3577880859375, 1.700439453125, 2.0430908203125, 2.3857421875, 2.7283935546875, 3.071044921875, 3.4136962890625, 3.75634765625, 4.0989990234375, 4.441650390625, 4.7843017578125, 5.126953125, 5.4696044921875, 5.812255859375, 6.1549072265625, 6.49755859375, 6.8402099609375, 7.182861328125, 7.5255126953125, 7.8681640625, 8.2108154296875, 8.553466796875, 8.8961181640625, 9.23876953125, 9.5814208984375, 9.924072265625, 10.2667236328125, 10.609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 16.0, 30.0, 85.0, 1047118.0, 1216.0, 41.0, 17.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.375, -117.306640625, -113.23828125, -109.169921875, -105.1015625, -101.033203125, -96.96484375, -92.896484375, -88.828125, -84.759765625, -80.69140625, -76.623046875, -72.5546875, -68.486328125, -64.41796875, -60.349609375, -56.28125, -52.212890625, -48.14453125, -44.076171875, -40.0078125, -35.939453125, -31.87109375, -27.802734375, -23.734375, -19.666015625, -15.59765625, -11.529296875, -7.4609375, -3.392578125, 0.67578125, 4.744140625, 8.8125, 12.880859375, 16.94921875, 21.017578125, 25.0859375, 29.154296875, 33.22265625, 37.291015625, 41.359375, 45.427734375, 49.49609375, 53.564453125, 57.6328125, 61.701171875, 65.76953125, 69.837890625, 73.90625, 77.974609375, 82.04296875, 86.111328125, 90.1796875, 94.248046875, 98.31640625, 102.384765625, 106.453125, 110.521484375, 114.58984375, 118.658203125, 122.7265625, 126.794921875, 130.86328125, 134.931640625, 139.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 3.0, 3.0, 10.0, 17.0, 10.0, 16.0, 25.0, 41.0, 95.0, 564.0, 90.0, 38.0, 18.0, 16.0, 14.0, 8.0, 7.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001708984375, -0.0016697198152542114, -0.0016304552555084229, -0.0015911906957626343, -0.0015519261360168457, -0.0015126615762710571, -0.0014733970165252686, -0.00143413245677948, -0.0013948678970336914, -0.0013556033372879028, -0.0013163387775421143, -0.0012770742177963257, -0.0012378096580505371, -0.0011985450983047485, -0.00115928053855896, -0.0011200159788131714, -0.0010807514190673828, -0.0010414868593215942, -0.0010022222995758057, -0.0009629577398300171, -0.0009236931800842285, -0.0008844286203384399, -0.0008451640605926514, -0.0008058995008468628, -0.0007666349411010742, -0.0007273703813552856, -0.0006881058216094971, -0.0006488412618637085, -0.0006095767021179199, -0.0005703121423721313, -0.0005310475826263428, -0.0004917830228805542, -0.0004525184631347656, -0.00041325390338897705, -0.0003739893436431885, -0.0003347247838973999, -0.00029546022415161133, -0.00025619566440582275, -0.00021693110466003418, -0.0001776665449142456, -0.00013840198516845703, -9.913742542266846e-05, -5.987286567687988e-05, -2.060830593109131e-05, 1.8656253814697266e-05, 5.792081356048584e-05, 9.718537330627441e-05, 0.000136449933052063, 0.00017571449279785156, 0.00021497905254364014, 0.0002542436122894287, 0.0002935081720352173, 0.00033277273178100586, 0.00037203729152679443, 0.000411301851272583, 0.0004505664110183716, 0.0004898309707641602, 0.0005290955305099487, 0.0005683600902557373, 0.0006076246500015259, 0.0006468892097473145, 0.000686153769493103, 0.0007254183292388916, 0.0007646828889846802, 0.0008039474487304688]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 8.0, 8.0, 21.0, 42.0, 335.0, 1047986.0, 74.0, 30.0, 13.0, 11.0, 8.0, 6.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.625, -185.0546875, -179.484375, -173.9140625, -168.34375, -162.7734375, -157.203125, -151.6328125, -146.0625, -140.4921875, -134.921875, -129.3515625, -123.78125, -118.2109375, -112.640625, -107.0703125, -101.5, -95.9296875, -90.359375, -84.7890625, -79.21875, -73.6484375, -68.078125, -62.5078125, -56.9375, -51.3671875, -45.796875, -40.2265625, -34.65625, -29.0859375, -23.515625, -17.9453125, -12.375, -6.8046875, -1.234375, 4.3359375, 9.90625, 15.4765625, 21.046875, 26.6171875, 32.1875, 37.7578125, 43.328125, 48.8984375, 54.46875, 60.0390625, 65.609375, 71.1796875, 76.75, 82.3203125, 87.890625, 93.4609375, 99.03125, 104.6015625, 110.171875, 115.7421875, 121.3125, 126.8828125, 132.453125, 138.0234375, 143.59375, 149.1640625, 154.734375, 160.3046875, 165.875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 7.0, 6.0, 17.0, 45.0, 55.0, 728.0, 49.0, 31.0, 24.0, 10.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6328125, -9.3526611328125, -9.072509765625, -8.7923583984375, -8.51220703125, -8.2320556640625, -7.951904296875, -7.6717529296875, -7.3916015625, -7.1114501953125, -6.831298828125, -6.5511474609375, -6.27099609375, -5.9908447265625, -5.710693359375, -5.4305419921875, -5.150390625, -4.8702392578125, -4.590087890625, -4.3099365234375, -4.02978515625, -3.7496337890625, -3.469482421875, -3.1893310546875, -2.9091796875, -2.6290283203125, -2.348876953125, -2.0687255859375, -1.78857421875, -1.5084228515625, -1.228271484375, -0.9481201171875, -0.66796875, -0.3878173828125, -0.107666015625, 0.1724853515625, 0.45263671875, 0.7327880859375, 1.012939453125, 1.2930908203125, 1.5732421875, 1.8533935546875, 2.133544921875, 2.4136962890625, 2.69384765625, 2.9739990234375, 3.254150390625, 3.5343017578125, 3.814453125, 4.0946044921875, 4.374755859375, 4.6549072265625, 4.93505859375, 5.2152099609375, 5.495361328125, 5.7755126953125, 6.0556640625, 6.3358154296875, 6.615966796875, 6.8961181640625, 7.17626953125, 7.4564208984375, 7.736572265625, 8.0167236328125, 8.296875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1020.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.030845642089844, 13.232248306274414, 37.49534225463867, 61.75843811035156, 86.02153015136719, 110.28462219238281, 134.5477294921875, 158.81082153320312, 183.07391357421875, 207.33700561523438, 231.60009765625, 255.86318969726562, 280.12628173828125, 304.3893737792969, 328.6524658203125, 352.91558837890625, 377.17864990234375, 401.4417419433594, 425.704833984375, 449.9679260253906, 474.23101806640625, 498.4941101074219, 522.7572021484375, 547.0203247070312, 571.2833862304688, 595.5465087890625, 619.8095703125, 644.0726928710938, 668.3357543945312, 692.598876953125, 716.8619384765625, 741.1250610351562, 765.3881225585938, 789.6512451171875, 813.914306640625, 838.1774291992188, 862.4404907226562, 886.70361328125, 910.9666748046875, 935.2297973632812, 959.4928588867188, 983.7559814453125, 1008.01904296875, 1032.2821044921875, 1056.5452880859375, 1080.808349609375, 1105.0714111328125, 1129.33447265625, 1153.59765625, 1177.8607177734375, 1202.1239013671875, 1226.386962890625, 1250.6500244140625, 1274.9130859375, 1299.17626953125, 1323.4393310546875, 1347.702392578125, 1371.9654541015625, 1396.2286376953125, 1420.49169921875, 1444.7547607421875, 1469.017822265625, 1493.281005859375, 1517.5440673828125, 1541.80712890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 11.0, 12.0, 25.0, 57.0, 69.0, 95.0, 123.0, 149.0, 139.0, 115.0, 90.0, 63.0, 23.0, 25.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.71484375, -11.561805725097656, -10.408768653869629, -9.255731582641602, -8.102693557739258, -6.949656009674072, -5.796618461608887, -4.643581390380859, -3.4905433654785156, -2.33750581741333, -1.1844682693481445, -0.031430721282958984, 1.1216068267822266, 2.274644374847412, 3.4276819229125977, 4.580718994140625, 5.733757019042969, 6.886794567108154, 8.03983211517334, 9.192869186401367, 10.345907211303711, 11.498945236206055, 12.651982307434082, 13.80501937866211, 14.958057403564453, 16.111095428466797, 17.26413345336914, 18.41716957092285, 19.570207595825195, 20.72324562072754, 21.87628173828125, 23.029319763183594, 24.182353973388672, 25.335391998291016, 26.48843002319336, 27.64146614074707, 28.794504165649414, 29.947542190551758, 31.10057830810547, 32.25361633300781, 33.406654357910156, 34.5596923828125, 35.712730407714844, 36.86576843261719, 38.01880645751953, 39.17184066772461, 40.32487869262695, 41.4779167175293, 42.63095474243164, 43.783992767333984, 44.93703079223633, 46.09006881713867, 47.24310302734375, 48.396141052246094, 49.54917907714844, 50.70221710205078, 51.855255126953125, 53.00829315185547, 54.16133117675781, 55.314369201660156, 56.4674072265625, 57.62044143676758, 58.77347946166992, 59.926517486572266, 61.07955551147461]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 13.0, 7.0, 11.0, 26.0, 59.0, 90.0, 209.0, 415.0, 1211.0, 3748201.0, 441830.0, 1256.0, 462.0, 227.0, 99.0, 80.0, 39.0, 20.0, 13.0, 6.0, 4.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0], "bins": [-67.8125, -66.36962890625, -64.9267578125, -63.48388671875, -62.041015625, -60.59814453125, -59.1552734375, -57.71240234375, -56.26953125, -54.82666015625, -53.3837890625, -51.94091796875, -50.498046875, -49.05517578125, -47.6123046875, -46.16943359375, -44.7265625, -43.28369140625, -41.8408203125, -40.39794921875, -38.955078125, -37.51220703125, -36.0693359375, -34.62646484375, -33.18359375, -31.74072265625, -30.2978515625, -28.85498046875, -27.412109375, -25.96923828125, -24.5263671875, -23.08349609375, -21.640625, -20.19775390625, -18.7548828125, -17.31201171875, -15.869140625, -14.42626953125, -12.9833984375, -11.54052734375, -10.09765625, -8.65478515625, -7.2119140625, -5.76904296875, -4.326171875, -2.88330078125, -1.4404296875, 0.00244140625, 1.4453125, 2.88818359375, 4.3310546875, 5.77392578125, 7.216796875, 8.65966796875, 10.1025390625, 11.54541015625, 12.98828125, 14.43115234375, 15.8740234375, 17.31689453125, 18.759765625, 20.20263671875, 21.6455078125, 23.08837890625, 24.53125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 12.0, 25.0, 55.0, 81.0, 106.0, 130.0, 153.0, 137.0, 119.0, 72.0, 53.0, 25.0, 14.0, 13.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27734375, -6.118255615234375, -5.95916748046875, -5.800079345703125, -5.6409912109375, -5.481903076171875, -5.32281494140625, -5.163726806640625, -5.004638671875, -4.845550537109375, -4.68646240234375, -4.527374267578125, -4.3682861328125, -4.209197998046875, -4.05010986328125, -3.891021728515625, -3.73193359375, -3.572845458984375, -3.41375732421875, -3.254669189453125, -3.0955810546875, -2.936492919921875, -2.77740478515625, -2.618316650390625, -2.459228515625, -2.300140380859375, -2.14105224609375, -1.981964111328125, -1.8228759765625, -1.663787841796875, -1.50469970703125, -1.345611572265625, -1.1865234375, -1.027435302734375, -0.86834716796875, -0.709259033203125, -0.5501708984375, -0.391082763671875, -0.23199462890625, -0.072906494140625, 0.086181640625, 0.245269775390625, 0.40435791015625, 0.563446044921875, 0.7225341796875, 0.881622314453125, 1.04071044921875, 1.199798583984375, 1.35888671875, 1.517974853515625, 1.67706298828125, 1.836151123046875, 1.9952392578125, 2.154327392578125, 2.31341552734375, 2.472503662109375, 2.631591796875, 2.790679931640625, 2.94976806640625, 3.108856201171875, 3.2679443359375, 3.427032470703125, 3.58612060546875, 3.745208740234375, 3.904296875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 2.0, 2.0, 5.0, 3.0, 10.0, 11.0, 35.0, 95.0, 4188755.0, 5237.0, 68.0, 11.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-110.3125, -106.4951171875, -102.677734375, -98.8603515625, -95.04296875, -91.2255859375, -87.408203125, -83.5908203125, -79.7734375, -75.9560546875, -72.138671875, -68.3212890625, -64.50390625, -60.6865234375, -56.869140625, -53.0517578125, -49.234375, -45.4169921875, -41.599609375, -37.7822265625, -33.96484375, -30.1474609375, -26.330078125, -22.5126953125, -18.6953125, -14.8779296875, -11.060546875, -7.2431640625, -3.42578125, 0.3916015625, 4.208984375, 8.0263671875, 11.84375, 15.6611328125, 19.478515625, 23.2958984375, 27.11328125, 30.9306640625, 34.748046875, 38.5654296875, 42.3828125, 46.2001953125, 50.017578125, 53.8349609375, 57.65234375, 61.4697265625, 65.287109375, 69.1044921875, 72.921875, 76.7392578125, 80.556640625, 84.3740234375, 88.19140625, 92.0087890625, 95.826171875, 99.6435546875, 103.4609375, 107.2783203125, 111.095703125, 114.9130859375, 118.73046875, 122.5478515625, 126.365234375, 130.1826171875, 134.0]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 3.0, 8.0, 20.0, 3621.0, 371.0, 20.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.494659423828125, -2.38580322265625, -2.276947021484375, -2.1680908203125, -2.059234619140625, -1.95037841796875, -1.841522216796875, -1.732666015625, -1.623809814453125, -1.51495361328125, -1.406097412109375, -1.2972412109375, -1.188385009765625, -1.07952880859375, -0.970672607421875, -0.86181640625, -0.752960205078125, -0.64410400390625, -0.535247802734375, -0.4263916015625, -0.317535400390625, -0.20867919921875, -0.099822998046875, 0.009033203125, 0.117889404296875, 0.22674560546875, 0.335601806640625, 0.4444580078125, 0.553314208984375, 0.66217041015625, 0.771026611328125, 0.8798828125, 0.988739013671875, 1.09759521484375, 1.206451416015625, 1.3153076171875, 1.424163818359375, 1.53302001953125, 1.641876220703125, 1.750732421875, 1.859588623046875, 1.96844482421875, 2.077301025390625, 2.1861572265625, 2.295013427734375, 2.40386962890625, 2.512725830078125, 2.62158203125, 2.730438232421875, 2.83929443359375, 2.948150634765625, 3.0570068359375, 3.165863037109375, 3.27471923828125, 3.383575439453125, 3.492431640625, 3.601287841796875, 3.71014404296875, 3.819000244140625, 3.9278564453125, 4.036712646484375, 4.14556884765625, 4.254425048828125, 4.36328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 11.0, 18.0, 37.0, 67.0, 166.0, 306.0, 277.0, 77.0, 25.0, 13.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5056376457214355, -2.227318525314331, -1.9489991664886475, -1.670680046081543, -1.392360806465149, -1.1140415668487549, -0.8357224464416504, -0.5574032068252563, -0.2790839672088623, -0.0007647573947906494, 0.277554452419281, 0.5558736324310303, 0.8341928720474243, 1.1125121116638184, 1.3908312320709229, 1.669150471687317, 1.947469711303711, 2.2257888317108154, 2.504108190536499, 2.7824273109436035, 3.060746669769287, 3.3390657901763916, 3.617384910583496, 3.8957042694091797, 4.174023628234863, 4.452342987060547, 4.730661869049072, 5.008981227874756, 5.2873005867004395, 5.565619468688965, 5.843938827514648, 6.122258186340332, 6.400576591491699, 6.678895950317383, 6.957214832305908, 7.235534191131592, 7.513853549957275, 7.792172431945801, 8.070491790771484, 8.348811149597168, 8.627130508422852, 8.905449867248535, 9.183769226074219, 9.462087631225586, 9.74040699005127, 10.018726348876953, 10.297045707702637, 10.57536506652832, 10.853683471679688, 11.132002830505371, 11.410322189331055, 11.688640594482422, 11.966959953308105, 12.245279312133789, 12.523598670959473, 12.801918029785156, 13.08023738861084, 13.358556747436523, 13.636876106262207, 13.91519546508789, 14.193513870239258, 14.471833229064941, 14.750152587890625, 15.028471946716309, 15.306791305541992]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 12.0, 13.0, 23.0, 43.0, 63.0, 62.0, 107.0, 115.0, 123.0, 109.0, 107.0, 77.0, 53.0, 38.0, 28.0, 17.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.378300189971924, -7.221693992614746, -7.065087795257568, -6.908481597900391, -6.751875400543213, -6.595269203186035, -6.438663005828857, -6.28205680847168, -6.12545108795166, -5.968844890594482, -5.812238693237305, -5.655632495880127, -5.499026298522949, -5.3424201011657715, -5.185813903808594, -5.029208183288574, -4.872601509094238, -4.7159953117370605, -4.559389114379883, -4.402782917022705, -4.246176719665527, -4.08957052230835, -3.932964563369751, -3.7763583660125732, -3.6197521686553955, -3.4631459712982178, -3.30653977394104, -3.1499335765838623, -2.9933276176452637, -2.836721420288086, -2.680115222930908, -2.5235090255737305, -2.3669028282165527, -2.210296630859375, -2.0536904335021973, -1.897084355354309, -1.7404781579971313, -1.5838719606399536, -1.4272658824920654, -1.2706596851348877, -1.11405348777771, -0.9574472904205322, -0.8008411526679993, -0.6442350149154663, -0.4876288175582886, -0.33102262020111084, -0.17441648244857788, -0.017810344696044922, 0.1387958526611328, 0.29540202021598816, 0.4520081877708435, 0.6086143255233765, 0.7652205228805542, 0.9218267202377319, 1.0784327983856201, 1.2350389957427979, 1.3916451930999756, 1.5482513904571533, 1.704857587814331, 1.8614636659622192, 2.0180697441101074, 2.174675941467285, 2.331282138824463, 2.4878883361816406, 2.6444945335388184]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 9.0, 13.0, 21.0, 42.0, 92.0, 212.0, 725.0, 2464.0, 19643.0, 997112.0, 24250.0, 2755.0, 725.0, 243.0, 104.0, 54.0, 29.0, 14.0, 7.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8818359375, -1.8239898681640625, -1.766143798828125, -1.7082977294921875, -1.65045166015625, -1.5926055908203125, -1.534759521484375, -1.4769134521484375, -1.4190673828125, -1.3612213134765625, -1.303375244140625, -1.2455291748046875, -1.18768310546875, -1.1298370361328125, -1.071990966796875, -1.0141448974609375, -0.956298828125, -0.8984527587890625, -0.840606689453125, -0.7827606201171875, -0.72491455078125, -0.6670684814453125, -0.609222412109375, -0.5513763427734375, -0.4935302734375, -0.4356842041015625, -0.377838134765625, -0.3199920654296875, -0.26214599609375, -0.2042999267578125, -0.146453857421875, -0.0886077880859375, -0.03076171875, 0.0270843505859375, 0.084930419921875, 0.1427764892578125, 0.20062255859375, 0.2584686279296875, 0.316314697265625, 0.3741607666015625, 0.4320068359375, 0.4898529052734375, 0.547698974609375, 0.6055450439453125, 0.66339111328125, 0.7212371826171875, 0.779083251953125, 0.8369293212890625, 0.894775390625, 0.9526214599609375, 1.010467529296875, 1.0683135986328125, 1.12615966796875, 1.1840057373046875, 1.241851806640625, 1.2996978759765625, 1.3575439453125, 1.4153900146484375, 1.473236083984375, 1.5310821533203125, 1.58892822265625, 1.6467742919921875, 1.704620361328125, 1.7624664306640625, 1.8203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 7.0, 20.0, 34.0, 55.0, 96.0, 107.0, 161.0, 150.0, 121.0, 102.0, 64.0, 37.0, 26.0, 12.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.16796875, -6.039825439453125, -5.91168212890625, -5.783538818359375, -5.6553955078125, -5.527252197265625, -5.39910888671875, -5.270965576171875, -5.142822265625, -5.014678955078125, -4.88653564453125, -4.758392333984375, -4.6302490234375, -4.502105712890625, -4.37396240234375, -4.245819091796875, -4.11767578125, -3.989532470703125, -3.86138916015625, -3.733245849609375, -3.6051025390625, -3.476959228515625, -3.34881591796875, -3.220672607421875, -3.092529296875, -2.964385986328125, -2.83624267578125, -2.708099365234375, -2.5799560546875, -2.451812744140625, -2.32366943359375, -2.195526123046875, -2.0673828125, -1.939239501953125, -1.81109619140625, -1.682952880859375, -1.5548095703125, -1.426666259765625, -1.29852294921875, -1.170379638671875, -1.042236328125, -0.914093017578125, -0.78594970703125, -0.657806396484375, -0.5296630859375, -0.401519775390625, -0.27337646484375, -0.145233154296875, -0.01708984375, 0.111053466796875, 0.23919677734375, 0.367340087890625, 0.4954833984375, 0.623626708984375, 0.75177001953125, 0.879913330078125, 1.008056640625, 1.136199951171875, 1.26434326171875, 1.392486572265625, 1.5206298828125, 1.648773193359375, 1.77691650390625, 1.905059814453125, 2.033203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 4.0, 6.0, 9.0, 15.0, 22.0, 21.0, 29.0, 37.0, 44.0, 70.0, 79.0, 104.0, 148.0, 224.0, 451.0, 1136.0, 3995.0, 18030.0, 132800.0, 794864.0, 79154.0, 12327.0, 2960.0, 901.0, 377.0, 195.0, 118.0, 89.0, 72.0, 62.0, 45.0, 31.0, 24.0, 25.0, 21.0, 17.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12200927734375, -0.11824226379394531, -0.11447525024414062, -0.11070823669433594, -0.10694122314453125, -0.10317420959472656, -0.09940719604492188, -0.09564018249511719, -0.0918731689453125, -0.08810615539550781, -0.08433914184570312, -0.08057212829589844, -0.07680511474609375, -0.07303810119628906, -0.06927108764648438, -0.06550407409667969, -0.061737060546875, -0.05797004699707031, -0.054203033447265625, -0.05043601989746094, -0.04666900634765625, -0.04290199279785156, -0.039134979248046875, -0.03536796569824219, -0.0316009521484375, -0.027833938598632812, -0.024066925048828125, -0.020299911499023438, -0.01653289794921875, -0.012765884399414062, -0.008998870849609375, -0.0052318572998046875, -0.00146484375, 0.0023021697998046875, 0.006069183349609375, 0.009836196899414062, 0.01360321044921875, 0.017370223999023438, 0.021137237548828125, 0.024904251098632812, 0.0286712646484375, 0.03243827819824219, 0.036205291748046875, 0.03997230529785156, 0.04373931884765625, 0.04750633239746094, 0.051273345947265625, 0.05504035949707031, 0.058807373046875, 0.06257438659667969, 0.06634140014648438, 0.07010841369628906, 0.07387542724609375, 0.07764244079589844, 0.08140945434570312, 0.08517646789550781, 0.0889434814453125, 0.09271049499511719, 0.09647750854492188, 0.10024452209472656, 0.10401153564453125, 0.10777854919433594, 0.11154556274414062, 0.11531257629394531, 0.11907958984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 1.0, 4.0, 6.0, 11.0, 13.0, 13.0, 24.0, 21.0, 18.0, 25.0, 30.0, 30.0, 40.0, 40.0, 34.0, 46.0, 42.0, 41.0, 53.0, 45.0, 45.0, 33.0, 33.0, 43.0, 34.0, 38.0, 27.0, 33.0, 28.0, 33.0, 15.0, 14.0, 15.0, 12.0, 14.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.119140625, -3.023162841796875, -2.92718505859375, -2.831207275390625, -2.7352294921875, -2.639251708984375, -2.54327392578125, -2.447296142578125, -2.351318359375, -2.255340576171875, -2.15936279296875, -2.063385009765625, -1.9674072265625, -1.871429443359375, -1.77545166015625, -1.679473876953125, -1.58349609375, -1.487518310546875, -1.39154052734375, -1.295562744140625, -1.1995849609375, -1.103607177734375, -1.00762939453125, -0.911651611328125, -0.815673828125, -0.719696044921875, -0.62371826171875, -0.527740478515625, -0.4317626953125, -0.335784912109375, -0.23980712890625, -0.143829345703125, -0.0478515625, 0.048126220703125, 0.14410400390625, 0.240081787109375, 0.3360595703125, 0.432037353515625, 0.52801513671875, 0.623992919921875, 0.719970703125, 0.815948486328125, 0.91192626953125, 1.007904052734375, 1.1038818359375, 1.199859619140625, 1.29583740234375, 1.391815185546875, 1.48779296875, 1.583770751953125, 1.67974853515625, 1.775726318359375, 1.8717041015625, 1.967681884765625, 2.06365966796875, 2.159637451171875, 2.255615234375, 2.351593017578125, 2.44757080078125, 2.543548583984375, 2.6395263671875, 2.735504150390625, 2.83148193359375, 2.927459716796875, 3.0234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 13.0, 20.0, 26.0, 34.0, 47.0, 70.0, 90.0, 128.0, 183.0, 246.0, 352.0, 478.0, 768.0, 1073.0, 1723.0, 2756.0, 4723.0, 7952.0, 14584.0, 27998.0, 61766.0, 198077.0, 537064.0, 100732.0, 40584.0, 19881.0, 10751.0, 6212.0, 3524.0, 2273.0, 1359.0, 909.0, 616.0, 432.0, 307.0, 206.0, 150.0, 125.0, 79.0, 60.0, 40.0, 41.0, 15.0, 21.0, 13.0, 11.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0010852813720703125, -0.0010494142770767212, -0.0010135471820831299, -0.0009776800870895386, -0.0009418129920959473, -0.000905945897102356, -0.0008700788021087646, -0.0008342117071151733, -0.000798344612121582, -0.0007624775171279907, -0.0007266104221343994, -0.0006907433271408081, -0.0006548762321472168, -0.0006190091371536255, -0.0005831420421600342, -0.0005472749471664429, -0.0005114078521728516, -0.00047554075717926025, -0.00043967366218566895, -0.00040380656719207764, -0.00036793947219848633, -0.000332072377204895, -0.0002962052822113037, -0.0002603381872177124, -0.0002244710922241211, -0.00018860399723052979, -0.00015273690223693848, -0.00011686980724334717, -8.100271224975586e-05, -4.513561725616455e-05, -9.268522262573242e-06, 2.6598572731018066e-05, 6.246566772460938e-05, 9.833276271820068e-05, 0.000134199857711792, 0.0001700669527053833, 0.0002059340476989746, 0.00024180114269256592, 0.0002776682376861572, 0.00031353533267974854, 0.00034940242767333984, 0.00038526952266693115, 0.00042113661766052246, 0.00045700371265411377, 0.0004928708076477051, 0.0005287379026412964, 0.0005646049976348877, 0.000600472092628479, 0.0006363391876220703, 0.0006722062826156616, 0.0007080733776092529, 0.0007439404726028442, 0.0007798075675964355, 0.0008156746625900269, 0.0008515417575836182, 0.0008874088525772095, 0.0009232759475708008, 0.0009591430425643921, 0.0009950101375579834, 0.0010308772325515747, 0.001066744327545166, 0.0011026114225387573, 0.0011384785175323486, 0.00117434561252594, 0.0012102127075195312]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 6.0, 16.0, 13.0, 19.0, 14.0, 28.0, 40.0, 78.0, 141.0, 191.0, 158.0, 100.0, 52.0, 41.0, 21.0, 22.0, 11.0, 9.0, 10.0, 6.0, 7.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000133514404296875, -0.0001292973756790161, -0.00012508034706115723, -0.00012086331844329834, -0.00011664628982543945, -0.00011242926120758057, -0.00010821223258972168, -0.00010399520397186279, -9.97781753540039e-05, -9.556114673614502e-05, -9.134411811828613e-05, -8.712708950042725e-05, -8.291006088256836e-05, -7.869303226470947e-05, -7.447600364685059e-05, -7.02589750289917e-05, -6.604194641113281e-05, -6.182491779327393e-05, -5.760788917541504e-05, -5.339086055755615e-05, -4.9173831939697266e-05, -4.495680332183838e-05, -4.073977470397949e-05, -3.6522746086120605e-05, -3.230571746826172e-05, -2.8088688850402832e-05, -2.3871660232543945e-05, -1.965463161468506e-05, -1.5437602996826172e-05, -1.1220574378967285e-05, -7.0035457611083984e-06, -2.7865171432495117e-06, 1.430511474609375e-06, 5.647540092468262e-06, 9.864568710327148e-06, 1.4081597328186035e-05, 1.8298625946044922e-05, 2.251565456390381e-05, 2.6732683181762695e-05, 3.094971179962158e-05, 3.516674041748047e-05, 3.9383769035339355e-05, 4.360079765319824e-05, 4.781782627105713e-05, 5.2034854888916016e-05, 5.62518835067749e-05, 6.046891212463379e-05, 6.468594074249268e-05, 6.890296936035156e-05, 7.311999797821045e-05, 7.733702659606934e-05, 8.155405521392822e-05, 8.577108383178711e-05, 8.9988112449646e-05, 9.420514106750488e-05, 9.842216968536377e-05, 0.00010263919830322266, 0.00010685622692108154, 0.00011107325553894043, 0.00011529028415679932, 0.0001195073127746582, 0.0001237243413925171, 0.00012794137001037598, 0.00013215839862823486, 0.00013637542724609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 4.0, 6.0, 1.0, 7.0, 7.0, 4.0, 14.0, 12.0, 22.0, 31.0, 39.0, 37.0, 59.0, 83.0, 129.0, 241.0, 1167.0, 14781.0, 917602.0, 109138.0, 4165.0, 511.0, 145.0, 95.0, 47.0, 44.0, 40.0, 28.0, 16.0, 16.0, 16.0, 11.0, 7.0, 9.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0036106109619140625, -0.003500431776046753, -0.0033902525901794434, -0.003280073404312134, -0.0031698942184448242, -0.0030597150325775146, -0.002949535846710205, -0.0028393566608428955, -0.002729177474975586, -0.0026189982891082764, -0.002508819103240967, -0.0023986399173736572, -0.0022884607315063477, -0.002178281545639038, -0.0020681023597717285, -0.001957923173904419, -0.0018477439880371094, -0.0017375648021697998, -0.0016273856163024902, -0.0015172064304351807, -0.001407027244567871, -0.0012968480587005615, -0.001186668872833252, -0.0010764896869659424, -0.0009663105010986328, -0.0008561313152313232, -0.0007459521293640137, -0.0006357729434967041, -0.0005255937576293945, -0.00041541457176208496, -0.0003052353858947754, -0.00019505620002746582, -8.487701416015625e-05, 2.530217170715332e-05, 0.0001354813575744629, 0.00024566054344177246, 0.00035583972930908203, 0.0004660189151763916, 0.0005761981010437012, 0.0006863772869110107, 0.0007965564727783203, 0.0009067356586456299, 0.0010169148445129395, 0.001127094030380249, 0.0012372732162475586, 0.0013474524021148682, 0.0014576315879821777, 0.0015678107738494873, 0.0016779899597167969, 0.0017881691455841064, 0.001898348331451416, 0.0020085275173187256, 0.002118706703186035, 0.0022288858890533447, 0.0023390650749206543, 0.002449244260787964, 0.0025594234466552734, 0.002669602632522583, 0.0027797818183898926, 0.002889961004257202, 0.0030001401901245117, 0.0031103193759918213, 0.003220498561859131, 0.0033306777477264404, 0.00344085693359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 3.0, 8.0, 9.0, 12.0, 11.0, 20.0, 22.0, 18.0, 21.0, 19.0, 39.0, 28.0, 35.0, 56.0, 72.0, 147.0, 110.0, 63.0, 52.0, 36.0, 45.0, 31.0, 20.0, 14.0, 15.0, 13.0, 12.0, 5.0, 11.0, 10.0, 4.0, 5.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.00025653839111328125, -0.00024893879890441895, -0.00024133920669555664, -0.00023373961448669434, -0.00022614002227783203, -0.00021854043006896973, -0.00021094083786010742, -0.00020334124565124512, -0.0001957416534423828, -0.0001881420612335205, -0.0001805424690246582, -0.0001729428768157959, -0.0001653432846069336, -0.0001577436923980713, -0.00015014410018920898, -0.00014254450798034668, -0.00013494491577148438, -0.00012734532356262207, -0.00011974573135375977, -0.00011214613914489746, -0.00010454654693603516, -9.694695472717285e-05, -8.934736251831055e-05, -8.174777030944824e-05, -7.414817810058594e-05, -6.654858589172363e-05, -5.894899368286133e-05, -5.1349401473999023e-05, -4.374980926513672e-05, -3.6150217056274414e-05, -2.855062484741211e-05, -2.0951032638549805e-05, -1.33514404296875e-05, -5.751848220825195e-06, 1.8477439880371094e-06, 9.447336196899414e-06, 1.704692840576172e-05, 2.4646520614624023e-05, 3.224611282348633e-05, 3.984570503234863e-05, 4.744529724121094e-05, 5.504488945007324e-05, 6.264448165893555e-05, 7.024407386779785e-05, 7.784366607666016e-05, 8.544325828552246e-05, 9.304285049438477e-05, 0.00010064244270324707, 0.00010824203491210938, 0.00011584162712097168, 0.00012344121932983398, 0.0001310408115386963, 0.0001386404037475586, 0.0001462399959564209, 0.0001538395881652832, 0.0001614391803741455, 0.0001690387725830078, 0.00017663836479187012, 0.00018423795700073242, 0.00019183754920959473, 0.00019943714141845703, 0.00020703673362731934, 0.00021463632583618164, 0.00022223591804504395, 0.00022983551025390625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [6.0, 21.0, 71.0, 312.0, 535.0, 58.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6109589338302612, -1.232051134109497, -0.8531434535980225, -0.4742356538772583, -0.09532797336578369, 0.2835797071456909, 0.6624876260757446, 1.0413953065872192, 1.4203029870986938, 1.799210786819458, 2.1781184673309326, 2.5570263862609863, 2.935934066772461, 3.3148417472839355, 3.69374942779541, 4.072657108306885, 4.451564788818359, 4.830472469329834, 5.209380149841309, 5.588288307189941, 5.967195510864258, 6.346103668212891, 6.725011348724365, 7.10391902923584, 7.4828267097473145, 7.861734390258789, 8.240642547607422, 8.619549751281738, 8.998457908630371, 9.377365112304688, 9.75627326965332, 10.135181427001953, 10.514089584350586, 10.892997741699219, 11.271904945373535, 11.650813102722168, 12.029720306396484, 12.408628463745117, 12.78753662109375, 13.166443824768066, 13.545351028442383, 13.924259185791016, 14.303166389465332, 14.682074546813965, 15.060981750488281, 15.439889907836914, 15.818798065185547, 16.197704315185547, 16.576614379882812, 16.955522537231445, 17.334430694580078, 17.713336944580078, 18.09224510192871, 18.471153259277344, 18.850061416625977, 19.22896957397461, 19.60787582397461, 19.986783981323242, 20.365692138671875, 20.744598388671875, 21.123506546020508, 21.50241470336914, 21.881322860717773, 22.260231018066406, 22.639137268066406]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 13.0, 23.0, 58.0, 123.0, 165.0, 225.0, 184.0, 112.0, 61.0, 29.0, 11.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671836853027344, -5.502560138702393, -5.333282947540283, -5.164006233215332, -4.994729042053223, -4.8254523277282715, -4.656175136566162, -4.486898422241211, -4.317621231079102, -4.14834451675415, -3.979067325592041, -3.8097903728485107, -3.6405134201049805, -3.47123646736145, -3.30195951461792, -3.1326828002929688, -2.9634058475494385, -2.794128894805908, -2.624851942062378, -2.4555749893188477, -2.2862980365753174, -2.117021083831787, -1.9477442502975464, -1.7784672975540161, -1.6091903448104858, -1.4399133920669556, -1.2706364393234253, -1.1013596057891846, -0.9320825934410095, -0.7628056406974792, -0.5935287475585938, -0.4242517948150635, -0.2549748420715332, -0.08569790422916412, 0.08357903361320496, 0.25285595655441284, 0.4221329092979431, 0.5914098620414734, 0.7606867551803589, 0.9299637079238892, 1.0992406606674194, 1.2685176134109497, 1.43779456615448, 1.6070713996887207, 1.776348352432251, 1.9456253051757812, 2.1149022579193115, 2.284179210662842, 2.453456163406372, 2.6227331161499023, 2.7920100688934326, 2.961287021636963, 3.130563974380493, 3.2998409271240234, 3.4691176414489746, 3.638394832611084, 3.807671546936035, 3.9769484996795654, 4.146225452423096, 4.315502166748047, 4.484779357910156, 4.654056072235107, 4.823333263397217, 4.992609977722168, 5.161887168884277]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 6.0, 9.0, 11.0, 10.0, 13.0, 15.0, 23.0, 35.0, 75.0, 204.0, 676.0, 3003.0, 21600.0, 888544.0, 124168.0, 7990.0, 1446.0, 347.0, 145.0, 77.0, 29.0, 11.0, 13.0, 15.0, 11.0, 13.0, 12.0, 5.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.318115234375, -6.11279296875, -5.907470703125, -5.7021484375, -5.496826171875, -5.29150390625, -5.086181640625, -4.880859375, -4.675537109375, -4.47021484375, -4.264892578125, -4.0595703125, -3.854248046875, -3.64892578125, -3.443603515625, -3.23828125, -3.032958984375, -2.82763671875, -2.622314453125, -2.4169921875, -2.211669921875, -2.00634765625, -1.801025390625, -1.595703125, -1.390380859375, -1.18505859375, -0.979736328125, -0.7744140625, -0.569091796875, -0.36376953125, -0.158447265625, 0.046875, 0.252197265625, 0.45751953125, 0.662841796875, 0.8681640625, 1.073486328125, 1.27880859375, 1.484130859375, 1.689453125, 1.894775390625, 2.10009765625, 2.305419921875, 2.5107421875, 2.716064453125, 2.92138671875, 3.126708984375, 3.33203125, 3.537353515625, 3.74267578125, 3.947998046875, 4.1533203125, 4.358642578125, 4.56396484375, 4.769287109375, 4.974609375, 5.179931640625, 5.38525390625, 5.590576171875, 5.7958984375, 6.001220703125, 6.20654296875, 6.411865234375, 6.6171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 13.0, 25.0, 50.0, 120.0, 186.0, 213.0, 179.0, 105.0, 61.0, 28.0, 18.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.8686294555664062, -0.8217315673828125, -0.7748336791992188, -0.727935791015625, -0.6810379028320312, -0.6341400146484375, -0.5872421264648438, -0.54034423828125, -0.49344635009765625, -0.4465484619140625, -0.39965057373046875, -0.352752685546875, -0.30585479736328125, -0.2589569091796875, -0.21205902099609375, -0.1651611328125, -0.11826324462890625, -0.0713653564453125, -0.02446746826171875, 0.022430419921875, 0.06932830810546875, 0.1162261962890625, 0.16312408447265625, 0.21002197265625, 0.25691986083984375, 0.3038177490234375, 0.35071563720703125, 0.397613525390625, 0.44451141357421875, 0.4914093017578125, 0.5383071899414062, 0.585205078125, 0.6321029663085938, 0.6790008544921875, 0.7258987426757812, 0.772796630859375, 0.8196945190429688, 0.8665924072265625, 0.9134902954101562, 0.96038818359375, 1.0072860717773438, 1.0541839599609375, 1.1010818481445312, 1.147979736328125, 1.1948776245117188, 1.2417755126953125, 1.2886734008789062, 1.3355712890625, 1.3824691772460938, 1.4293670654296875, 1.4762649536132812, 1.523162841796875, 1.5700607299804688, 1.6169586181640625, 1.6638565063476562, 1.71075439453125, 1.7576522827148438, 1.8045501708984375, 1.8514480590820312, 1.898345947265625, 1.9452438354492188, 1.9921417236328125, 2.0390396118164062, 2.0859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 13.0, 12.0, 14.0, 15.0, 29.0, 26.0, 35.0, 43.0, 68.0, 81.0, 98.0, 224.0, 1080.0, 40045.0, 998697.0, 7029.0, 454.0, 138.0, 90.0, 70.0, 48.0, 41.0, 44.0, 22.0, 19.0, 23.0, 13.0, 7.0, 9.0, 9.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.4375, -11.12255859375, -10.8076171875, -10.49267578125, -10.177734375, -9.86279296875, -9.5478515625, -9.23291015625, -8.91796875, -8.60302734375, -8.2880859375, -7.97314453125, -7.658203125, -7.34326171875, -7.0283203125, -6.71337890625, -6.3984375, -6.08349609375, -5.7685546875, -5.45361328125, -5.138671875, -4.82373046875, -4.5087890625, -4.19384765625, -3.87890625, -3.56396484375, -3.2490234375, -2.93408203125, -2.619140625, -2.30419921875, -1.9892578125, -1.67431640625, -1.359375, -1.04443359375, -0.7294921875, -0.41455078125, -0.099609375, 0.21533203125, 0.5302734375, 0.84521484375, 1.16015625, 1.47509765625, 1.7900390625, 2.10498046875, 2.419921875, 2.73486328125, 3.0498046875, 3.36474609375, 3.6796875, 3.99462890625, 4.3095703125, 4.62451171875, 4.939453125, 5.25439453125, 5.5693359375, 5.88427734375, 6.19921875, 6.51416015625, 6.8291015625, 7.14404296875, 7.458984375, 7.77392578125, 8.0888671875, 8.40380859375, 8.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 1.0, 8.0, 5.0, 9.0, 11.0, 14.0, 7.0, 11.0, 24.0, 16.0, 15.0, 26.0, 33.0, 50.0, 43.0, 57.0, 56.0, 66.0, 91.0, 63.0, 62.0, 42.0, 47.0, 36.0, 28.0, 31.0, 23.0, 24.0, 15.0, 15.0, 16.0, 6.0, 12.0, 3.0, 8.0, 9.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6962890625, -1.6487579345703125, -1.601226806640625, -1.5536956787109375, -1.50616455078125, -1.4586334228515625, -1.411102294921875, -1.3635711669921875, -1.3160400390625, -1.2685089111328125, -1.220977783203125, -1.1734466552734375, -1.12591552734375, -1.0783843994140625, -1.030853271484375, -0.9833221435546875, -0.935791015625, -0.8882598876953125, -0.840728759765625, -0.7931976318359375, -0.74566650390625, -0.6981353759765625, -0.650604248046875, -0.6030731201171875, -0.5555419921875, -0.5080108642578125, -0.460479736328125, -0.4129486083984375, -0.36541748046875, -0.3178863525390625, -0.270355224609375, -0.2228240966796875, -0.17529296875, -0.1277618408203125, -0.080230712890625, -0.0326995849609375, 0.01483154296875, 0.0623626708984375, 0.109893798828125, 0.1574249267578125, 0.2049560546875, 0.2524871826171875, 0.300018310546875, 0.3475494384765625, 0.39508056640625, 0.4426116943359375, 0.490142822265625, 0.5376739501953125, 0.585205078125, 0.6327362060546875, 0.680267333984375, 0.7277984619140625, 0.77532958984375, 0.8228607177734375, 0.870391845703125, 0.9179229736328125, 0.9654541015625, 1.0129852294921875, 1.060516357421875, 1.1080474853515625, 1.15557861328125, 1.2031097412109375, 1.250640869140625, 1.2981719970703125, 1.345703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 6.0, 6.0, 11.0, 11.0, 13.0, 34.0, 39.0, 49.0, 107.0, 175.0, 413.0, 1046.0, 3310.0, 13879.0, 74566.0, 865592.0, 70859.0, 13437.0, 3144.0, 1025.0, 393.0, 167.0, 90.0, 54.0, 32.0, 22.0, 23.0, 13.0, 10.0, 6.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.411865234375, -0.3987846374511719, -0.38570404052734375, -0.3726234436035156, -0.3595428466796875, -0.3464622497558594, -0.33338165283203125, -0.3203010559082031, -0.307220458984375, -0.2941398620605469, -0.28105926513671875, -0.2679786682128906, -0.2548980712890625, -0.24181747436523438, -0.22873687744140625, -0.21565628051757812, -0.20257568359375, -0.18949508666992188, -0.17641448974609375, -0.16333389282226562, -0.1502532958984375, -0.13717269897460938, -0.12409210205078125, -0.11101150512695312, -0.097930908203125, -0.08485031127929688, -0.07176971435546875, -0.058689117431640625, -0.0456085205078125, -0.032527923583984375, -0.01944732666015625, -0.006366729736328125, 0.0067138671875, 0.019794464111328125, 0.03287506103515625, 0.045955657958984375, 0.0590362548828125, 0.07211685180664062, 0.08519744873046875, 0.09827804565429688, 0.111358642578125, 0.12443923950195312, 0.13751983642578125, 0.15060043334960938, 0.1636810302734375, 0.17676162719726562, 0.18984222412109375, 0.20292282104492188, 0.21600341796875, 0.22908401489257812, 0.24216461181640625, 0.2552452087402344, 0.2683258056640625, 0.2814064025878906, 0.29448699951171875, 0.3075675964355469, 0.320648193359375, 0.3337287902832031, 0.34680938720703125, 0.3598899841308594, 0.3729705810546875, 0.3860511779785156, 0.39913177490234375, 0.4122123718261719, 0.42529296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 8.0, 7.0, 17.0, 21.0, 29.0, 53.0, 134.0, 543.0, 67.0, 30.0, 19.0, 19.0, 14.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011426210403442383, -0.00011100620031356812, -0.0001077502965927124, -0.00010449439287185669, -0.00010123848915100098, -9.798258543014526e-05, -9.472668170928955e-05, -9.147077798843384e-05, -8.821487426757812e-05, -8.495897054672241e-05, -8.17030668258667e-05, -7.844716310501099e-05, -7.519125938415527e-05, -7.193535566329956e-05, -6.867945194244385e-05, -6.542354822158813e-05, -6.216764450073242e-05, -5.891174077987671e-05, -5.5655837059020996e-05, -5.239993333816528e-05, -4.914402961730957e-05, -4.588812589645386e-05, -4.2632222175598145e-05, -3.937631845474243e-05, -3.612041473388672e-05, -3.2864511013031006e-05, -2.9608607292175293e-05, -2.635270357131958e-05, -2.3096799850463867e-05, -1.9840896129608154e-05, -1.658499240875244e-05, -1.3329088687896729e-05, -1.0073184967041016e-05, -6.817281246185303e-06, -3.56137752532959e-06, -3.0547380447387695e-07, 2.950429916381836e-06, 6.206333637237549e-06, 9.462237358093262e-06, 1.2718141078948975e-05, 1.5974044799804688e-05, 1.92299485206604e-05, 2.2485852241516113e-05, 2.5741755962371826e-05, 2.899765968322754e-05, 3.225356340408325e-05, 3.5509467124938965e-05, 3.876537084579468e-05, 4.202127456665039e-05, 4.5277178287506104e-05, 4.8533082008361816e-05, 5.178898572921753e-05, 5.504488945007324e-05, 5.8300793170928955e-05, 6.155669689178467e-05, 6.481260061264038e-05, 6.80685043334961e-05, 7.13244080543518e-05, 7.458031177520752e-05, 7.783621549606323e-05, 8.109211921691895e-05, 8.434802293777466e-05, 8.760392665863037e-05, 9.085983037948608e-05, 9.41157341003418e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 5.0, 6.0, 1.0, 11.0, 3.0, 6.0, 12.0, 18.0, 15.0, 22.0, 24.0, 30.0, 41.0, 73.0, 125.0, 368.0, 3706.0, 937204.0, 104064.0, 2203.0, 271.0, 108.0, 54.0, 37.0, 29.0, 14.0, 28.0, 16.0, 3.0, 10.0, 14.0, 12.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5226936340332031, -0.5068130493164062, -0.4909324645996094, -0.4750518798828125, -0.4591712951660156, -0.44329071044921875, -0.4274101257324219, -0.411529541015625, -0.3956489562988281, -0.37976837158203125, -0.3638877868652344, -0.3480072021484375, -0.3321266174316406, -0.31624603271484375, -0.3003654479980469, -0.28448486328125, -0.2686042785644531, -0.25272369384765625, -0.23684310913085938, -0.2209625244140625, -0.20508193969726562, -0.18920135498046875, -0.17332077026367188, -0.157440185546875, -0.14155960083007812, -0.12567901611328125, -0.10979843139648438, -0.0939178466796875, -0.07803726196289062, -0.06215667724609375, -0.046276092529296875, -0.0303955078125, -0.014514923095703125, 0.00136566162109375, 0.017246246337890625, 0.0331268310546875, 0.049007415771484375, 0.06488800048828125, 0.08076858520507812, 0.096649169921875, 0.11252975463867188, 0.12841033935546875, 0.14429092407226562, 0.1601715087890625, 0.17605209350585938, 0.19193267822265625, 0.20781326293945312, 0.22369384765625, 0.23957443237304688, 0.25545501708984375, 0.2713356018066406, 0.2872161865234375, 0.3030967712402344, 0.31897735595703125, 0.3348579406738281, 0.350738525390625, 0.3666191101074219, 0.38249969482421875, 0.3983802795410156, 0.4142608642578125, 0.4301414489746094, 0.44602203369140625, 0.4619026184082031, 0.477783203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 4.0, 8.0, 20.0, 17.0, 15.0, 8.0, 19.0, 18.0, 29.0, 32.0, 64.0, 495.0, 59.0, 39.0, 21.0, 20.0, 23.0, 14.0, 15.0, 13.0, 10.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09175968170166016, -0.08909797668457031, -0.08643627166748047, -0.08377456665039062, -0.08111286163330078, -0.07845115661621094, -0.0757894515991211, -0.07312774658203125, -0.0704660415649414, -0.06780433654785156, -0.06514263153076172, -0.062480926513671875, -0.05981922149658203, -0.05715751647949219, -0.054495811462402344, -0.0518341064453125, -0.049172401428222656, -0.04651069641113281, -0.04384899139404297, -0.041187286376953125, -0.03852558135986328, -0.03586387634277344, -0.033202171325683594, -0.03054046630859375, -0.027878761291503906, -0.025217056274414062, -0.02255535125732422, -0.019893646240234375, -0.01723194122314453, -0.014570236206054688, -0.011908531188964844, -0.009246826171875, -0.006585121154785156, -0.0039234161376953125, -0.0012617111206054688, 0.001399993896484375, 0.004061698913574219, 0.0067234039306640625, 0.009385108947753906, 0.01204681396484375, 0.014708518981933594, 0.017370223999023438, 0.02003192901611328, 0.022693634033203125, 0.02535533905029297, 0.028017044067382812, 0.030678749084472656, 0.0333404541015625, 0.036002159118652344, 0.03866386413574219, 0.04132556915283203, 0.043987274169921875, 0.04664897918701172, 0.04931068420410156, 0.051972389221191406, 0.05463409423828125, 0.057295799255371094, 0.05995750427246094, 0.06261920928955078, 0.06528091430664062, 0.06794261932373047, 0.07060432434082031, 0.07326602935791016, 0.075927734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [180.0, 794.0, 40.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1559242010116577, -0.28599655628204346, 0.5839310884475708, 1.453858733177185, 2.3237862586975098, 3.193713665008545, 4.063641548156738, 4.933569431304932, 5.803496837615967, 6.67342472076416, 7.543352127075195, 8.41327953338623, 9.283206939697266, 10.153135299682617, 11.023062705993652, 11.892990112304688, 12.762918472290039, 13.632845878601074, 14.50277328491211, 15.372701644897461, 16.242630004882812, 17.11255645751953, 17.982484817504883, 18.852413177490234, 19.722339630126953, 20.592267990112305, 21.462194442749023, 22.332122802734375, 23.202049255371094, 24.071977615356445, 24.941905975341797, 25.811832427978516, 26.681758880615234, 27.551687240600586, 28.421613693237305, 29.291542053222656, 30.161468505859375, 31.031396865844727, 31.901325225830078, 32.7712516784668, 33.64118194580078, 34.5111083984375, 35.381038665771484, 36.2509651184082, 37.12089157104492, 37.990821838378906, 38.860748291015625, 39.730674743652344, 40.60060119628906, 41.47052764892578, 42.340457916259766, 43.210384368896484, 44.0803108215332, 44.95024108886719, 45.820167541503906, 46.690093994140625, 47.560020446777344, 48.42994689941406, 49.29987716674805, 50.169803619384766, 51.039730072021484, 51.90966033935547, 52.77958679199219, 53.649513244628906, 54.51944351196289]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 6.0, 6.0, 10.0, 10.0, 18.0, 19.0, 18.0, 20.0, 15.0, 26.0, 23.0, 19.0, 39.0, 32.0, 37.0, 31.0, 45.0, 43.0, 33.0, 37.0, 48.0, 32.0, 38.0, 35.0, 45.0, 38.0, 36.0, 32.0, 29.0, 14.0, 21.0, 15.0, 23.0, 24.0, 20.0, 11.0, 12.0, 10.0, 5.0, 4.0, 7.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.132634162902832, -2.0637855529785156, -1.9949368238449097, -1.9260882139205933, -1.8572394847869873, -1.788390874862671, -1.7195422649383545, -1.6506935358047485, -1.5818448066711426, -1.5129961967468262, -1.4441474676132202, -1.3752988576889038, -1.3064501285552979, -1.2376015186309814, -1.168752908706665, -1.099904179573059, -1.0310555696487427, -0.9622069001197815, -0.8933582305908203, -0.8245096206665039, -0.755660891532898, -0.6868122816085815, -0.6179636120796204, -0.5491149425506592, -0.480266273021698, -0.4114176034927368, -0.34256893396377563, -0.27372029423713684, -0.20487162470817566, -0.13602295517921448, -0.06717431545257568, 0.001674354076385498, 0.07052302360534668, 0.13937169313430786, 0.20822034776210785, 0.27706900238990784, 0.345917671918869, 0.4147663414478302, 0.483614981174469, 0.5524636507034302, 0.6213123202323914, 0.6901609897613525, 0.7590096592903137, 0.8278583288192749, 0.8967069387435913, 0.9655556678771973, 1.0344042778015137, 1.10325288772583, 1.172101616859436, 1.2409502267837524, 1.3097989559173584, 1.3786475658416748, 1.4474962949752808, 1.5163449048995972, 1.5851936340332031, 1.6540422439575195, 1.722890853881836, 1.7917394638061523, 1.8605881929397583, 1.9294368028640747, 1.9982855319976807, 2.067134141921997, 2.1359827518463135, 2.204831600189209, 2.2736802101135254]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 2.0, 6.0, 9.0, 11.0, 20.0, 28.0, 43.0, 75.0, 83.0, 101.0, 162.0, 259.0, 375.0, 510.0, 761.0, 1146.0, 1620.0, 2613.0, 5623.0, 4166044.0, 6397.0, 2844.0, 1793.0, 1143.0, 805.0, 614.0, 356.0, 240.0, 179.0, 112.0, 90.0, 54.0, 54.0, 27.0, 20.0, 13.0, 11.0, 15.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.23046875, -6.01953125, -5.80859375, -5.59765625, -5.38671875, -5.17578125, -4.96484375, -4.75390625, -4.54296875, -4.33203125, -4.12109375, -3.91015625, -3.69921875, -3.48828125, -3.27734375, -3.06640625, -2.85546875, -2.64453125, -2.43359375, -2.22265625, -2.01171875, -1.80078125, -1.58984375, -1.37890625, -1.16796875, -0.95703125, -0.74609375, -0.53515625, -0.32421875, -0.11328125, 0.09765625, 0.30859375, 0.51953125, 0.73046875, 0.94140625, 1.15234375, 1.36328125, 1.57421875, 1.78515625, 1.99609375, 2.20703125, 2.41796875, 2.62890625, 2.83984375, 3.05078125, 3.26171875, 3.47265625, 3.68359375, 3.89453125, 4.10546875, 4.31640625, 4.52734375, 4.73828125, 4.94921875, 5.16015625, 5.37109375, 5.58203125, 5.79296875, 6.00390625, 6.21484375, 6.42578125, 6.63671875, 6.84765625, 7.05859375, 7.26953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 11.0, 11.0, 10.0, 9.0, 15.0, 20.0, 26.0, 27.0, 32.0, 43.0, 32.0, 29.0, 46.0, 58.0, 54.0, 59.0, 58.0, 38.0, 64.0, 44.0, 51.0, 28.0, 42.0, 26.0, 40.0, 31.0, 19.0, 23.0, 13.0, 9.0, 6.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.29443359375, -0.2857780456542969, -0.27712249755859375, -0.2684669494628906, -0.2598114013671875, -0.2511558532714844, -0.24250030517578125, -0.23384475708007812, -0.225189208984375, -0.21653366088867188, -0.20787811279296875, -0.19922256469726562, -0.1905670166015625, -0.18191146850585938, -0.17325592041015625, -0.16460037231445312, -0.15594482421875, -0.14728927612304688, -0.13863372802734375, -0.12997817993164062, -0.1213226318359375, -0.11266708374023438, -0.10401153564453125, -0.09535598754882812, -0.086700439453125, -0.07804489135742188, -0.06938934326171875, -0.060733795166015625, -0.0520782470703125, -0.043422698974609375, -0.03476715087890625, -0.026111602783203125, -0.0174560546875, -0.008800506591796875, -0.00014495849609375, 0.008510589599609375, 0.0171661376953125, 0.025821685791015625, 0.03447723388671875, 0.043132781982421875, 0.051788330078125, 0.060443878173828125, 0.06909942626953125, 0.07775497436523438, 0.0864105224609375, 0.09506607055664062, 0.10372161865234375, 0.11237716674804688, 0.12103271484375, 0.12968826293945312, 0.13834381103515625, 0.14699935913085938, 0.1556549072265625, 0.16431045532226562, 0.17296600341796875, 0.18162155151367188, 0.190277099609375, 0.19893264770507812, 0.20758819580078125, 0.21624374389648438, 0.2248992919921875, 0.23355484008789062, 0.24221038818359375, 0.2508659362792969, 0.259521484375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 24.0, 372.0, 4185991.0, 7684.0, 172.0, 23.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.78125, -19.78515625, -18.7890625, -17.79296875, -16.796875, -15.80078125, -14.8046875, -13.80859375, -12.8125, -11.81640625, -10.8203125, -9.82421875, -8.828125, -7.83203125, -6.8359375, -5.83984375, -4.84375, -3.84765625, -2.8515625, -1.85546875, -0.859375, 0.13671875, 1.1328125, 2.12890625, 3.125, 4.12109375, 5.1171875, 6.11328125, 7.109375, 8.10546875, 9.1015625, 10.09765625, 11.09375, 12.08984375, 13.0859375, 14.08203125, 15.078125, 16.07421875, 17.0703125, 18.06640625, 19.0625, 20.05859375, 21.0546875, 22.05078125, 23.046875, 24.04296875, 25.0390625, 26.03515625, 27.03125, 28.02734375, 29.0234375, 30.01953125, 31.015625, 32.01171875, 33.0078125, 34.00390625, 35.0, 35.99609375, 36.9921875, 37.98828125, 38.984375, 39.98046875, 40.9765625, 41.97265625, 42.96875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 8.0, 7.0, 311.0, 3715.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82470703125, -0.7930374145507812, -0.7613677978515625, -0.7296981811523438, -0.698028564453125, -0.6663589477539062, -0.6346893310546875, -0.6030197143554688, -0.57135009765625, -0.5396804809570312, -0.5080108642578125, -0.47634124755859375, -0.444671630859375, -0.41300201416015625, -0.3813323974609375, -0.34966278076171875, -0.3179931640625, -0.28632354736328125, -0.2546539306640625, -0.22298431396484375, -0.191314697265625, -0.15964508056640625, -0.1279754638671875, -0.09630584716796875, -0.06463623046875, -0.03296661376953125, -0.0012969970703125, 0.03037261962890625, 0.062042236328125, 0.09371185302734375, 0.1253814697265625, 0.15705108642578125, 0.188720703125, 0.22039031982421875, 0.2520599365234375, 0.28372955322265625, 0.315399169921875, 0.34706878662109375, 0.3787384033203125, 0.41040802001953125, 0.44207763671875, 0.47374725341796875, 0.5054168701171875, 0.5370864868164062, 0.568756103515625, 0.6004257202148438, 0.6320953369140625, 0.6637649536132812, 0.6954345703125, 0.7271041870117188, 0.7587738037109375, 0.7904434204101562, 0.822113037109375, 0.8537826538085938, 0.8854522705078125, 0.9171218872070312, 0.94879150390625, 0.9804611206054688, 1.0121307373046875, 1.0438003540039062, 1.075469970703125, 1.1071395874023438, 1.1388092041015625, 1.1704788208007812, 1.2021484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 8.0, 9.0, 17.0, 19.0, 28.0, 28.0, 40.0, 56.0, 81.0, 117.0, 141.0, 138.0, 105.0, 57.0, 32.0, 33.0, 21.0, 17.0, 13.0, 5.0, 8.0, 2.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2838313579559326, -1.2446240186691284, -1.2054166793823242, -1.16620934009552, -1.1270020008087158, -1.087794542312622, -1.0485872030258179, -1.0093798637390137, -0.9701725244522095, -0.9309651851654053, -0.8917578458786011, -0.8525504469871521, -0.8133431077003479, -0.7741357684135437, -0.7349283695220947, -0.6957210302352905, -0.6565136909484863, -0.6173063516616821, -0.5780990123748779, -0.538891613483429, -0.49968427419662476, -0.46047693490982056, -0.42126956582069397, -0.3820621967315674, -0.3428548574447632, -0.303647518157959, -0.2644401490688324, -0.225232794880867, -0.1860254406929016, -0.14681808650493622, -0.10761073231697083, -0.06840336322784424, -0.02919602394104004, 0.010011330246925354, 0.04921868443489075, 0.08842603862285614, 0.12763339281082153, 0.16684074699878693, 0.20604810118675232, 0.2452554702758789, 0.2844628095626831, 0.3236701488494873, 0.3628775179386139, 0.4020848870277405, 0.4412922263145447, 0.4804995656013489, 0.5197069644927979, 0.558914303779602, 0.5981216430664062, 0.6373289823532104, 0.6765363216400146, 0.7157437205314636, 0.7549510598182678, 0.794158399105072, 0.833365797996521, 0.8725731372833252, 0.9117804765701294, 0.9509878158569336, 0.9901951551437378, 1.029402494430542, 1.0686099529266357, 1.10781729221344, 1.1470246315002441, 1.1862319707870483, 1.2254393100738525]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 9.0, 5.0, 12.0, 13.0, 13.0, 14.0, 16.0, 18.0, 21.0, 19.0, 33.0, 30.0, 30.0, 39.0, 38.0, 38.0, 53.0, 39.0, 44.0, 43.0, 28.0, 44.0, 37.0, 40.0, 41.0, 30.0, 40.0, 29.0, 19.0, 20.0, 20.0, 13.0, 22.0, 18.0, 13.0, 9.0, 7.0, 9.0, 2.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.4533398449420929, -0.43930524587631226, -0.42527061700820923, -0.4112360179424286, -0.39720141887664795, -0.3831667900085449, -0.3691321909427643, -0.35509759187698364, -0.3410629630088806, -0.3270283639431, -0.31299373507499695, -0.2989591360092163, -0.2849245071411133, -0.27088990807533264, -0.256855309009552, -0.24282069504261017, -0.22878608107566833, -0.2147514671087265, -0.20071685314178467, -0.18668225407600403, -0.1726476401090622, -0.15861302614212036, -0.14457842707633972, -0.1305438131093979, -0.11650919914245605, -0.10247458517551422, -0.08843997865915298, -0.07440537214279175, -0.060370758175849915, -0.04633614420890808, -0.032301537692546844, -0.018266931176185608, -0.004232317209243774, 0.00980229303240776, 0.023836903274059296, 0.03787151351571083, 0.051906123757362366, 0.0659407377243042, 0.07997534424066544, 0.09400995075702667, 0.1080445647239685, 0.12207917869091034, 0.13611379265785217, 0.1501483917236328, 0.16418300569057465, 0.17821761965751648, 0.19225221872329712, 0.20628683269023895, 0.2203214466571808, 0.23435606062412262, 0.24839067459106445, 0.2624252736568451, 0.27645987272262573, 0.29049450159072876, 0.3045291006565094, 0.31856369972229004, 0.33259832859039307, 0.3466329276561737, 0.36066755652427673, 0.3747021555900574, 0.3887367844581604, 0.40277138352394104, 0.4168059825897217, 0.4308406114578247, 0.44487521052360535]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 18.0, 39.0, 53.0, 180.0, 943.0, 8779.0, 1012438.0, 24129.0, 1556.0, 265.0, 61.0, 30.0, 6.0, 13.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5920028686523438, -0.5726776123046875, -0.5533523559570312, -0.534027099609375, -0.5147018432617188, -0.4953765869140625, -0.47605133056640625, -0.45672607421875, -0.43740081787109375, -0.4180755615234375, -0.39875030517578125, -0.379425048828125, -0.36009979248046875, -0.3407745361328125, -0.32144927978515625, -0.3021240234375, -0.28279876708984375, -0.2634735107421875, -0.24414825439453125, -0.224822998046875, -0.20549774169921875, -0.1861724853515625, -0.16684722900390625, -0.14752197265625, -0.12819671630859375, -0.1088714599609375, -0.08954620361328125, -0.070220947265625, -0.05089569091796875, -0.0315704345703125, -0.01224517822265625, 0.007080078125, 0.02640533447265625, 0.0457305908203125, 0.06505584716796875, 0.084381103515625, 0.10370635986328125, 0.1230316162109375, 0.14235687255859375, 0.16168212890625, 0.18100738525390625, 0.2003326416015625, 0.21965789794921875, 0.238983154296875, 0.25830841064453125, 0.2776336669921875, 0.29695892333984375, 0.3162841796875, 0.33560943603515625, 0.3549346923828125, 0.37425994873046875, 0.393585205078125, 0.41291046142578125, 0.4322357177734375, 0.45156097412109375, 0.47088623046875, 0.49021148681640625, 0.5095367431640625, 0.5288619995117188, 0.548187255859375, 0.5675125122070312, 0.5868377685546875, 0.6061630249023438, 0.62548828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 26.0, 46.0, 89.0, 151.0, 168.0, 181.0, 134.0, 91.0, 55.0, 28.0, 18.0, 7.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46240234375, -0.42719268798828125, -0.3919830322265625, -0.35677337646484375, -0.321563720703125, -0.28635406494140625, -0.2511444091796875, -0.21593475341796875, -0.18072509765625, -0.14551544189453125, -0.1103057861328125, -0.07509613037109375, -0.039886474609375, -0.00467681884765625, 0.0305328369140625, 0.06574249267578125, 0.1009521484375, 0.13616180419921875, 0.1713714599609375, 0.20658111572265625, 0.241790771484375, 0.27700042724609375, 0.3122100830078125, 0.34741973876953125, 0.38262939453125, 0.41783905029296875, 0.4530487060546875, 0.48825836181640625, 0.523468017578125, 0.5586776733398438, 0.5938873291015625, 0.6290969848632812, 0.664306640625, 0.6995162963867188, 0.7347259521484375, 0.7699356079101562, 0.805145263671875, 0.8403549194335938, 0.8755645751953125, 0.9107742309570312, 0.94598388671875, 0.9811935424804688, 1.0164031982421875, 1.0516128540039062, 1.086822509765625, 1.1220321655273438, 1.1572418212890625, 1.1924514770507812, 1.2276611328125, 1.2628707885742188, 1.2980804443359375, 1.3332901000976562, 1.368499755859375, 1.4037094116210938, 1.4389190673828125, 1.4741287231445312, 1.50933837890625, 1.5445480346679688, 1.5797576904296875, 1.6149673461914062, 1.650177001953125, 1.6853866577148438, 1.7205963134765625, 1.7558059692382812, 1.791015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 8.0, 15.0, 21.0, 21.0, 23.0, 25.0, 36.0, 47.0, 60.0, 88.0, 93.0, 108.0, 166.0, 294.0, 552.0, 1538.0, 5202.0, 22542.0, 167112.0, 765631.0, 68165.0, 11799.0, 2951.0, 923.0, 402.0, 196.0, 130.0, 86.0, 70.0, 55.0, 34.0, 27.0, 24.0, 23.0, 14.0, 17.0, 8.0, 9.0, 0.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.02838134765625, -0.027474641799926758, -0.026567935943603516, -0.025661230087280273, -0.02475452423095703, -0.02384781837463379, -0.022941112518310547, -0.022034406661987305, -0.021127700805664062, -0.02022099494934082, -0.019314289093017578, -0.018407583236694336, -0.017500877380371094, -0.01659417152404785, -0.01568746566772461, -0.014780759811401367, -0.013874053955078125, -0.012967348098754883, -0.01206064224243164, -0.011153936386108398, -0.010247230529785156, -0.009340524673461914, -0.008433818817138672, -0.00752711296081543, -0.0066204071044921875, -0.005713701248168945, -0.004806995391845703, -0.003900289535522461, -0.0029935836791992188, -0.0020868778228759766, -0.0011801719665527344, -0.0002734661102294922, 0.00063323974609375, 0.0015399456024169922, 0.0024466514587402344, 0.0033533573150634766, 0.004260063171386719, 0.005166769027709961, 0.006073474884033203, 0.006980180740356445, 0.007886886596679688, 0.00879359245300293, 0.009700298309326172, 0.010607004165649414, 0.011513710021972656, 0.012420415878295898, 0.01332712173461914, 0.014233827590942383, 0.015140533447265625, 0.016047239303588867, 0.01695394515991211, 0.01786065101623535, 0.018767356872558594, 0.019674062728881836, 0.020580768585205078, 0.02148747444152832, 0.022394180297851562, 0.023300886154174805, 0.024207592010498047, 0.02511429786682129, 0.02602100372314453, 0.026927709579467773, 0.027834415435791016, 0.028741121292114258, 0.0296478271484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 14.0, 15.0, 16.0, 17.0, 19.0, 21.0, 24.0, 33.0, 32.0, 28.0, 27.0, 28.0, 39.0, 32.0, 36.0, 42.0, 43.0, 35.0, 50.0, 45.0, 57.0, 44.0, 27.0, 35.0, 34.0, 28.0, 25.0, 24.0, 15.0, 19.0, 13.0, 16.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7177734375, -0.69488525390625, -0.6719970703125, -0.64910888671875, -0.626220703125, -0.60333251953125, -0.5804443359375, -0.55755615234375, -0.53466796875, -0.51177978515625, -0.4888916015625, -0.46600341796875, -0.443115234375, -0.42022705078125, -0.3973388671875, -0.37445068359375, -0.3515625, -0.32867431640625, -0.3057861328125, -0.28289794921875, -0.260009765625, -0.23712158203125, -0.2142333984375, -0.19134521484375, -0.16845703125, -0.14556884765625, -0.1226806640625, -0.09979248046875, -0.076904296875, -0.05401611328125, -0.0311279296875, -0.00823974609375, 0.0146484375, 0.03753662109375, 0.0604248046875, 0.08331298828125, 0.106201171875, 0.12908935546875, 0.1519775390625, 0.17486572265625, 0.19775390625, 0.22064208984375, 0.2435302734375, 0.26641845703125, 0.289306640625, 0.31219482421875, 0.3350830078125, 0.35797119140625, 0.380859375, 0.40374755859375, 0.4266357421875, 0.44952392578125, 0.472412109375, 0.49530029296875, 0.5181884765625, 0.54107666015625, 0.56396484375, 0.58685302734375, 0.6097412109375, 0.63262939453125, 0.655517578125, 0.67840576171875, 0.7012939453125, 0.72418212890625, 0.7470703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 11.0, 8.0, 12.0, 13.0, 20.0, 26.0, 44.0, 51.0, 75.0, 104.0, 156.0, 211.0, 319.0, 437.0, 590.0, 886.0, 1274.0, 1813.0, 2771.0, 4144.0, 6800.0, 12100.0, 30226.0, 850289.0, 93325.0, 18279.0, 8916.0, 5259.0, 3313.0, 2193.0, 1467.0, 1021.0, 714.0, 526.0, 349.0, 239.0, 152.0, 124.0, 82.0, 56.0, 41.0, 34.0, 27.0, 15.0, 15.0, 10.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00293731689453125, -0.0028502941131591797, -0.0027632713317871094, -0.002676248550415039, -0.0025892257690429688, -0.0025022029876708984, -0.002415180206298828, -0.002328157424926758, -0.0022411346435546875, -0.002154111862182617, -0.002067089080810547, -0.0019800662994384766, -0.0018930435180664062, -0.001806020736694336, -0.0017189979553222656, -0.0016319751739501953, -0.001544952392578125, -0.0014579296112060547, -0.0013709068298339844, -0.001283884048461914, -0.0011968612670898438, -0.0011098384857177734, -0.0010228157043457031, -0.0009357929229736328, -0.0008487701416015625, -0.0007617473602294922, -0.0006747245788574219, -0.0005877017974853516, -0.0005006790161132812, -0.00041365623474121094, -0.0003266334533691406, -0.0002396106719970703, -0.000152587890625, -6.556510925292969e-05, 2.1457672119140625e-05, 0.00010848045349121094, 0.00019550323486328125, 0.00028252601623535156, 0.0003695487976074219, 0.0004565715789794922, 0.0005435943603515625, 0.0006306171417236328, 0.0007176399230957031, 0.0008046627044677734, 0.0008916854858398438, 0.000978708267211914, 0.0010657310485839844, 0.0011527538299560547, 0.001239776611328125, 0.0013267993927001953, 0.0014138221740722656, 0.001500844955444336, 0.0015878677368164062, 0.0016748905181884766, 0.0017619132995605469, 0.0018489360809326172, 0.0019359588623046875, 0.002022981643676758, 0.002110004425048828, 0.0021970272064208984, 0.0022840499877929688, 0.002371072769165039, 0.0024580955505371094, 0.0025451183319091797, 0.00263214111328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0, 10.0, 3.0, 6.0, 9.0, 10.0, 29.0, 37.0, 107.0, 435.0, 197.0, 65.0, 23.0, 23.0, 11.0, 8.0, 6.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017750263214111328, -0.000171540305018425, -0.0001655779778957367, -0.0001596156507730484, -0.0001536533236503601, -0.00014769099652767181, -0.00014172866940498352, -0.00013576634228229523, -0.00012980401515960693, -0.00012384168803691864, -0.00011787936091423035, -0.00011191703379154205, -0.00010595470666885376, -9.999237954616547e-05, -9.403005242347717e-05, -8.806772530078888e-05, -8.210539817810059e-05, -7.614307105541229e-05, -7.0180743932724e-05, -6.42184168100357e-05, -5.825608968734741e-05, -5.229376256465912e-05, -4.6331435441970825e-05, -4.036910831928253e-05, -3.440678119659424e-05, -2.8444454073905945e-05, -2.248212695121765e-05, -1.6519799828529358e-05, -1.0557472705841064e-05, -4.595145583152771e-06, 1.3671815395355225e-06, 7.329508662223816e-06, 1.329183578491211e-05, 1.9254162907600403e-05, 2.5216490030288696e-05, 3.117881715297699e-05, 3.714114427566528e-05, 4.310347139835358e-05, 4.906579852104187e-05, 5.5028125643730164e-05, 6.099045276641846e-05, 6.695277988910675e-05, 7.291510701179504e-05, 7.887743413448334e-05, 8.483976125717163e-05, 9.080208837985992e-05, 9.676441550254822e-05, 0.00010272674262523651, 0.0001086890697479248, 0.0001146513968706131, 0.00012061372399330139, 0.00012657605111598969, 0.00013253837823867798, 0.00013850070536136627, 0.00014446303248405457, 0.00015042535960674286, 0.00015638768672943115, 0.00016235001385211945, 0.00016831234097480774, 0.00017427466809749603, 0.00018023699522018433, 0.00018619932234287262, 0.0001921616494655609, 0.0001981239765882492, 0.0002040863037109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 7.0, 10.0, 10.0, 10.0, 20.0, 30.0, 29.0, 35.0, 54.0, 79.0, 114.0, 162.0, 208.0, 319.0, 483.0, 751.0, 1161.0, 1950.0, 3428.0, 6908.0, 16923.0, 115732.0, 851537.0, 28102.0, 9384.0, 4418.0, 2460.0, 1459.0, 906.0, 584.0, 414.0, 257.0, 185.0, 116.0, 85.0, 59.0, 48.0, 38.0, 25.0, 20.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0015153884887695312, -0.0014723390340805054, -0.0014292895793914795, -0.0013862401247024536, -0.0013431906700134277, -0.0013001412153244019, -0.001257091760635376, -0.00121404230594635, -0.0011709928512573242, -0.0011279433965682983, -0.0010848939418792725, -0.0010418444871902466, -0.0009987950325012207, -0.0009557455778121948, -0.0009126961231231689, -0.0008696466684341431, -0.0008265972137451172, -0.0007835477590560913, -0.0007404983043670654, -0.0006974488496780396, -0.0006543993949890137, -0.0006113499402999878, -0.0005683004856109619, -0.000525251030921936, -0.00048220157623291016, -0.0004391521215438843, -0.0003961026668548584, -0.0003530532121658325, -0.00031000375747680664, -0.00026695430278778076, -0.00022390484809875488, -0.000180855393409729, -0.00013780593872070312, -9.475648403167725e-05, -5.170702934265137e-05, -8.657574653625488e-06, 3.439188003540039e-05, 7.744133472442627e-05, 0.00012049078941345215, 0.00016354024410247803, 0.0002065896987915039, 0.0002496391534805298, 0.00029268860816955566, 0.00033573806285858154, 0.0003787875175476074, 0.0004218369722366333, 0.0004648864269256592, 0.0005079358816146851, 0.0005509853363037109, 0.0005940347909927368, 0.0006370842456817627, 0.0006801337003707886, 0.0007231831550598145, 0.0007662326097488403, 0.0008092820644378662, 0.0008523315191268921, 0.000895380973815918, 0.0009384304285049438, 0.0009814798831939697, 0.0010245293378829956, 0.0010675787925720215, 0.0011106282472610474, 0.0011536777019500732, 0.0011967271566390991, 0.001239776611328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 14.0, 19.0, 25.0, 56.0, 382.0, 300.0, 71.0, 21.0, 16.0, 11.0, 10.0, 8.0, 6.0, 5.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004260540008544922, -0.00041420385241508484, -0.0004023537039756775, -0.00039050355553627014, -0.0003786534070968628, -0.00036680325865745544, -0.0003549531102180481, -0.00034310296177864075, -0.0003312528133392334, -0.00031940266489982605, -0.0003075525164604187, -0.00029570236802101135, -0.000283852219581604, -0.00027200207114219666, -0.0002601519227027893, -0.00024830177426338196, -0.0002364516258239746, -0.00022460147738456726, -0.0002127513289451599, -0.00020090118050575256, -0.00018905103206634521, -0.00017720088362693787, -0.00016535073518753052, -0.00015350058674812317, -0.00014165043830871582, -0.00012980028986930847, -0.00011795014142990112, -0.00010609999299049377, -9.424984455108643e-05, -8.239969611167908e-05, -7.054954767227173e-05, -5.869939923286438e-05, -4.684925079345703e-05, -3.499910235404968e-05, -2.3148953914642334e-05, -1.1298805475234985e-05, 5.513429641723633e-07, 1.2401491403579712e-05, 2.425163984298706e-05, 3.610178828239441e-05, 4.795193672180176e-05, 5.9802085161209106e-05, 7.165223360061646e-05, 8.35023820400238e-05, 9.535253047943115e-05, 0.0001072026789188385, 0.00011905282735824585, 0.0001309029757976532, 0.00014275312423706055, 0.0001546032726764679, 0.00016645342111587524, 0.0001783035695552826, 0.00019015371799468994, 0.0002020038664340973, 0.00021385401487350464, 0.000225704163312912, 0.00023755431175231934, 0.0002494044601917267, 0.00026125460863113403, 0.0002731047570705414, 0.00028495490550994873, 0.0002968050539493561, 0.00030865520238876343, 0.0003205053508281708, 0.0003323554992675781]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 8.0, 11.0, 13.0, 10.0, 15.0, 25.0, 26.0, 40.0, 55.0, 61.0, 99.0, 131.0, 149.0, 106.0, 81.0, 36.0, 27.0, 24.0, 19.0, 5.0, 13.0, 6.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6888121962547302, -0.6692164540290833, -0.6496207118034363, -0.6300249695777893, -0.6104292273521423, -0.5908334851264954, -0.5712377429008484, -0.5516420006752014, -0.5320462584495544, -0.5124505162239075, -0.4928547739982605, -0.4732590317726135, -0.45366328954696655, -0.4340675473213196, -0.4144718050956726, -0.39487606287002563, -0.37528032064437866, -0.3556845784187317, -0.3360888361930847, -0.31649309396743774, -0.29689735174179077, -0.2773016095161438, -0.2577058672904968, -0.23811012506484985, -0.21851438283920288, -0.1989186406135559, -0.17932289838790894, -0.15972715616226196, -0.140131413936615, -0.12053567171096802, -0.10093992948532104, -0.08134418725967407, -0.061748385429382324, -0.04215264320373535, -0.02255690097808838, -0.0029611587524414062, 0.016634583473205566, 0.03623032569885254, 0.05582606792449951, 0.07542181015014648, 0.09501755237579346, 0.11461329460144043, 0.1342090368270874, 0.15380477905273438, 0.17340052127838135, 0.19299626350402832, 0.2125920057296753, 0.23218774795532227, 0.25178349018096924, 0.2713792324066162, 0.2909749746322632, 0.31057071685791016, 0.33016645908355713, 0.3497622013092041, 0.3693579435348511, 0.38895368576049805, 0.408549427986145, 0.428145170211792, 0.44774091243743896, 0.46733665466308594, 0.4869323968887329, 0.5065281391143799, 0.5261238813400269, 0.5457196235656738, 0.5653153657913208]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 11.0, 20.0, 46.0, 80.0, 126.0, 168.0, 161.0, 154.0, 104.0, 70.0, 42.0, 13.0, 10.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25674569606781006, -0.22958506643772125, -0.20242442190647125, -0.17526379227638245, -0.14810314774513245, -0.12094251811504364, -0.09378188848495483, -0.06662124395370483, -0.03946061432361603, -0.012299979105591774, 0.01486065611243248, 0.042021289467811584, 0.06918192654848099, 0.09634256362915039, 0.1235031932592392, 0.1506638377904892, 0.177824467420578, 0.2049850970506668, 0.2321457415819168, 0.2593063712120056, 0.2864670157432556, 0.3136276602745056, 0.3407882750034332, 0.3679489195346832, 0.39510953426361084, 0.42227017879486084, 0.44943079352378845, 0.47659143805503845, 0.5037520527839661, 0.5309126973152161, 0.5580733418464661, 0.5852339863777161, 0.6123946309089661, 0.6395552754402161, 0.6667159199714661, 0.6938765048980713, 0.7210371494293213, 0.7481977939605713, 0.7753584384918213, 0.8025190830230713, 0.8296797275543213, 0.8568403720855713, 0.8840010166168213, 0.9111616611480713, 0.9383222460746765, 0.9654828906059265, 0.9926435351371765, 1.0198042392730713, 1.0469647645950317, 1.0741254091262817, 1.1012860536575317, 1.1284466981887817, 1.1556073427200317, 1.1827679872512817, 1.2099285125732422, 1.2370891571044922, 1.2642499208450317, 1.2914105653762817, 1.3185712099075317, 1.3457318544387817, 1.3728924989700317, 1.4000531435012817, 1.4272136688232422, 1.4543743133544922, 1.4815349578857422]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 10.0, 12.0, 20.0, 30.0, 56.0, 334.0, 3600.0, 49387.0, 959514.0, 32629.0, 2559.0, 216.0, 60.0, 30.0, 20.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.337890625, -1.295318603515625, -1.25274658203125, -1.210174560546875, -1.1676025390625, -1.125030517578125, -1.08245849609375, -1.039886474609375, -0.997314453125, -0.954742431640625, -0.91217041015625, -0.869598388671875, -0.8270263671875, -0.784454345703125, -0.74188232421875, -0.699310302734375, -0.65673828125, -0.614166259765625, -0.57159423828125, -0.529022216796875, -0.4864501953125, -0.443878173828125, -0.40130615234375, -0.358734130859375, -0.316162109375, -0.273590087890625, -0.23101806640625, -0.188446044921875, -0.1458740234375, -0.103302001953125, -0.06072998046875, -0.018157958984375, 0.0244140625, 0.066986083984375, 0.10955810546875, 0.152130126953125, 0.1947021484375, 0.237274169921875, 0.27984619140625, 0.322418212890625, 0.364990234375, 0.407562255859375, 0.45013427734375, 0.492706298828125, 0.5352783203125, 0.577850341796875, 0.62042236328125, 0.662994384765625, 0.70556640625, 0.748138427734375, 0.79071044921875, 0.833282470703125, 0.8758544921875, 0.918426513671875, 0.96099853515625, 1.003570556640625, 1.046142578125, 1.088714599609375, 1.13128662109375, 1.173858642578125, 1.2164306640625, 1.259002685546875, 1.30157470703125, 1.344146728515625, 1.38671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 7.0, 9.0, 12.0, 10.0, 18.0, 21.0, 34.0, 24.0, 43.0, 46.0, 42.0, 51.0, 51.0, 53.0, 64.0, 64.0, 69.0, 57.0, 52.0, 50.0, 36.0, 32.0, 27.0, 27.0, 20.0, 7.0, 13.0, 11.0, 13.0, 4.0, 6.0, 8.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0194244384765625, -0.01880359649658203, -0.018182754516601562, -0.017561912536621094, -0.016941070556640625, -0.016320228576660156, -0.015699386596679688, -0.015078544616699219, -0.01445770263671875, -0.013836860656738281, -0.013216018676757812, -0.012595176696777344, -0.011974334716796875, -0.011353492736816406, -0.010732650756835938, -0.010111808776855469, -0.009490966796875, -0.008870124816894531, -0.008249282836914062, -0.007628440856933594, -0.007007598876953125, -0.006386756896972656, -0.0057659149169921875, -0.005145072937011719, -0.00452423095703125, -0.0039033889770507812, -0.0032825469970703125, -0.0026617050170898438, -0.002040863037109375, -0.0014200210571289062, -0.0007991790771484375, -0.00017833709716796875, 0.0004425048828125, 0.0010633468627929688, 0.0016841888427734375, 0.0023050308227539062, 0.002925872802734375, 0.0035467147827148438, 0.0041675567626953125, 0.004788398742675781, 0.00540924072265625, 0.006030082702636719, 0.0066509246826171875, 0.007271766662597656, 0.007892608642578125, 0.008513450622558594, 0.009134292602539062, 0.009755134582519531, 0.0103759765625, 0.010996818542480469, 0.011617660522460938, 0.012238502502441406, 0.012859344482421875, 0.013480186462402344, 0.014101028442382812, 0.014721870422363281, 0.01534271240234375, 0.01596355438232422, 0.016584396362304688, 0.017205238342285156, 0.017826080322265625, 0.018446922302246094, 0.019067764282226562, 0.01968860626220703, 0.0203094482421875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 11.0, 10.0, 15.0, 21.0, 35.0, 35.0, 58.0, 75.0, 116.0, 134.0, 201.0, 338.0, 491.0, 656.0, 938.0, 1296.0, 2018.0, 2876.0, 4502.0, 7294.0, 12572.0, 24308.0, 56214.0, 199894.0, 541040.0, 108935.0, 38554.0, 18211.0, 10066.0, 5891.0, 3852.0, 2446.0, 1651.0, 1156.0, 800.0, 571.0, 383.0, 249.0, 177.0, 145.0, 99.0, 57.0, 40.0, 41.0, 38.0, 22.0, 5.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1343994140625, -0.13023757934570312, -0.12607574462890625, -0.12191390991210938, -0.1177520751953125, -0.11359024047851562, -0.10942840576171875, -0.10526657104492188, -0.101104736328125, -0.09694290161132812, -0.09278106689453125, -0.08861923217773438, -0.0844573974609375, -0.08029556274414062, -0.07613372802734375, -0.07197189331054688, -0.06781005859375, -0.06364822387695312, -0.05948638916015625, -0.055324554443359375, -0.0511627197265625, -0.047000885009765625, -0.04283905029296875, -0.038677215576171875, -0.034515380859375, -0.030353546142578125, -0.02619171142578125, -0.022029876708984375, -0.0178680419921875, -0.013706207275390625, -0.00954437255859375, -0.005382537841796875, -0.001220703125, 0.002941131591796875, 0.00710296630859375, 0.011264801025390625, 0.0154266357421875, 0.019588470458984375, 0.02375030517578125, 0.027912139892578125, 0.032073974609375, 0.036235809326171875, 0.04039764404296875, 0.044559478759765625, 0.0487213134765625, 0.052883148193359375, 0.05704498291015625, 0.061206817626953125, 0.06536865234375, 0.06953048706054688, 0.07369232177734375, 0.07785415649414062, 0.0820159912109375, 0.08617782592773438, 0.09033966064453125, 0.09450149536132812, 0.098663330078125, 0.10282516479492188, 0.10698699951171875, 0.11114883422851562, 0.1153106689453125, 0.11947250366210938, 0.12363433837890625, 0.12779617309570312, 0.1319580078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 6.0, 4.0, 4.0, 2.0, 6.0, 8.0, 9.0, 11.0, 14.0, 7.0, 15.0, 23.0, 27.0, 36.0, 47.0, 66.0, 80.0, 72.0, 75.0, 78.0, 85.0, 70.0, 45.0, 44.0, 32.0, 15.0, 17.0, 21.0, 10.0, 6.0, 8.0, 11.0, 12.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07489013671875, -0.0725870132446289, -0.07028388977050781, -0.06798076629638672, -0.06567764282226562, -0.06337451934814453, -0.06107139587402344, -0.058768272399902344, -0.05646514892578125, -0.054162025451660156, -0.05185890197753906, -0.04955577850341797, -0.047252655029296875, -0.04494953155517578, -0.04264640808105469, -0.040343284606933594, -0.0380401611328125, -0.035737037658691406, -0.03343391418457031, -0.03113079071044922, -0.028827667236328125, -0.02652454376220703, -0.024221420288085938, -0.021918296813964844, -0.01961517333984375, -0.017312049865722656, -0.015008926391601562, -0.012705802917480469, -0.010402679443359375, -0.008099555969238281, -0.0057964324951171875, -0.0034933090209960938, -0.001190185546875, 0.0011129379272460938, 0.0034160614013671875, 0.005719184875488281, 0.008022308349609375, 0.010325431823730469, 0.012628555297851562, 0.014931678771972656, 0.01723480224609375, 0.019537925720214844, 0.021841049194335938, 0.02414417266845703, 0.026447296142578125, 0.02875041961669922, 0.031053543090820312, 0.033356666564941406, 0.0356597900390625, 0.037962913513183594, 0.04026603698730469, 0.04256916046142578, 0.044872283935546875, 0.04717540740966797, 0.04947853088378906, 0.051781654357910156, 0.05408477783203125, 0.056387901306152344, 0.05869102478027344, 0.06099414825439453, 0.06329727172851562, 0.06560039520263672, 0.06790351867675781, 0.0702066421508789, 0.072509765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 7.0, 7.0, 9.0, 11.0, 18.0, 22.0, 30.0, 54.0, 50.0, 83.0, 140.0, 164.0, 204.0, 310.0, 418.0, 597.0, 886.0, 1513.0, 3502.0, 19245.0, 1002110.0, 12185.0, 2847.0, 1296.0, 826.0, 511.0, 417.0, 278.0, 221.0, 154.0, 121.0, 102.0, 56.0, 45.0, 26.0, 21.0, 22.0, 19.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.518096923828125, -3.38970947265625, -3.261322021484375, -3.1329345703125, -3.004547119140625, -2.87615966796875, -2.747772216796875, -2.619384765625, -2.490997314453125, -2.36260986328125, -2.234222412109375, -2.1058349609375, -1.977447509765625, -1.84906005859375, -1.720672607421875, -1.59228515625, -1.463897705078125, -1.33551025390625, -1.207122802734375, -1.0787353515625, -0.950347900390625, -0.82196044921875, -0.693572998046875, -0.565185546875, -0.436798095703125, -0.30841064453125, -0.180023193359375, -0.0516357421875, 0.076751708984375, 0.20513916015625, 0.333526611328125, 0.4619140625, 0.590301513671875, 0.71868896484375, 0.847076416015625, 0.9754638671875, 1.103851318359375, 1.23223876953125, 1.360626220703125, 1.489013671875, 1.617401123046875, 1.74578857421875, 1.874176025390625, 2.0025634765625, 2.130950927734375, 2.25933837890625, 2.387725830078125, 2.51611328125, 2.644500732421875, 2.77288818359375, 2.901275634765625, 3.0296630859375, 3.158050537109375, 3.28643798828125, 3.414825439453125, 3.543212890625, 3.671600341796875, 3.79998779296875, 3.928375244140625, 4.0567626953125, 4.185150146484375, 4.31353759765625, 4.441925048828125, 4.5703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 15.0, 32.0, 821.0, 47.0, 14.0, 7.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011720657348632812, -0.0011391863226890564, -0.0011063069105148315, -0.0010734274983406067, -0.0010405480861663818, -0.001007668673992157, -0.0009747892618179321, -0.0009419098496437073, -0.0009090304374694824, -0.0008761510252952576, -0.0008432716131210327, -0.0008103922009468079, -0.000777512788772583, -0.0007446333765983582, -0.0007117539644241333, -0.0006788745522499084, -0.0006459951400756836, -0.0006131157279014587, -0.0005802363157272339, -0.000547356903553009, -0.0005144774913787842, -0.0004815980792045593, -0.00044871866703033447, -0.0004158392548561096, -0.00038295984268188477, -0.0003500804305076599, -0.00031720101833343506, -0.0002843216061592102, -0.00025144219398498535, -0.0002185627818107605, -0.00018568336963653564, -0.0001528039574623108, -0.00011992454528808594, -8.704513311386108e-05, -5.416572093963623e-05, -2.1286308765411377e-05, 1.1593103408813477e-05, 4.447251558303833e-05, 7.735192775726318e-05, 0.00011023133993148804, 0.0001431107521057129, 0.00017599016427993774, 0.0002088695764541626, 0.00024174898862838745, 0.0002746284008026123, 0.00030750781297683716, 0.000340387225151062, 0.00037326663732528687, 0.0004061460494995117, 0.00043902546167373657, 0.0004719048738479614, 0.0005047842860221863, 0.0005376636981964111, 0.000570543110370636, 0.0006034225225448608, 0.0006363019347190857, 0.0006691813468933105, 0.0007020607590675354, 0.0007349401712417603, 0.0007678195834159851, 0.00080069899559021, 0.0008335784077644348, 0.0008664578199386597, 0.0008993372321128845, 0.0009322166442871094]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 5.0, 10.0, 12.0, 13.0, 22.0, 31.0, 36.0, 49.0, 85.0, 130.0, 207.0, 322.0, 367.0, 632.0, 1016.0, 1787.0, 2958.0, 5531.0, 12267.0, 43673.0, 943286.0, 18821.0, 7627.0, 3820.0, 2204.0, 1303.0, 776.0, 479.0, 337.0, 262.0, 150.0, 108.0, 56.0, 42.0, 24.0, 17.0, 24.0, 21.0, 10.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.70166015625, -0.6798782348632812, -0.6580963134765625, -0.6363143920898438, -0.614532470703125, -0.5927505493164062, -0.5709686279296875, -0.5491867065429688, -0.52740478515625, -0.5056228637695312, -0.4838409423828125, -0.46205902099609375, -0.440277099609375, -0.41849517822265625, -0.3967132568359375, -0.37493133544921875, -0.3531494140625, -0.33136749267578125, -0.3095855712890625, -0.28780364990234375, -0.266021728515625, -0.24423980712890625, -0.2224578857421875, -0.20067596435546875, -0.17889404296875, -0.15711212158203125, -0.1353302001953125, -0.11354827880859375, -0.091766357421875, -0.06998443603515625, -0.0482025146484375, -0.02642059326171875, -0.004638671875, 0.01714324951171875, 0.0389251708984375, 0.06070709228515625, 0.082489013671875, 0.10427093505859375, 0.1260528564453125, 0.14783477783203125, 0.16961669921875, 0.19139862060546875, 0.2131805419921875, 0.23496246337890625, 0.256744384765625, 0.27852630615234375, 0.3003082275390625, 0.32209014892578125, 0.3438720703125, 0.36565399169921875, 0.3874359130859375, 0.40921783447265625, 0.430999755859375, 0.45278167724609375, 0.4745635986328125, 0.49634552001953125, 0.51812744140625, 0.5399093627929688, 0.5616912841796875, 0.5834732055664062, 0.605255126953125, 0.6270370483398438, 0.6488189697265625, 0.6706008911132812, 0.6923828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 8.0, 5.0, 8.0, 4.0, 11.0, 24.0, 800.0, 36.0, 12.0, 19.0, 17.0, 5.0, 4.0, 3.0, 2.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.244384765625, -0.23358917236328125, -0.2227935791015625, -0.21199798583984375, -0.201202392578125, -0.19040679931640625, -0.1796112060546875, -0.16881561279296875, -0.15802001953125, -0.14722442626953125, -0.1364288330078125, -0.12563323974609375, -0.114837646484375, -0.10404205322265625, -0.0932464599609375, -0.08245086669921875, -0.0716552734375, -0.06085968017578125, -0.0500640869140625, -0.03926849365234375, -0.028472900390625, -0.01767730712890625, -0.0068817138671875, 0.00391387939453125, 0.01470947265625, 0.02550506591796875, 0.0363006591796875, 0.04709625244140625, 0.057891845703125, 0.06868743896484375, 0.0794830322265625, 0.09027862548828125, 0.10107421875, 0.11186981201171875, 0.1226654052734375, 0.13346099853515625, 0.144256591796875, 0.15505218505859375, 0.1658477783203125, 0.17664337158203125, 0.18743896484375, 0.19823455810546875, 0.2090301513671875, 0.21982574462890625, 0.230621337890625, 0.24141693115234375, 0.2522125244140625, 0.26300811767578125, 0.2738037109375, 0.28459930419921875, 0.2953948974609375, 0.30619049072265625, 0.316986083984375, 0.32778167724609375, 0.3385772705078125, 0.34937286376953125, 0.36016845703125, 0.37096405029296875, 0.3817596435546875, 0.39255523681640625, 0.403350830078125, 0.41414642333984375, 0.4249420166015625, 0.43573760986328125, 0.446533203125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 11.0, 21.0, 35.0, 121.0, 356.0, 301.0, 61.0, 31.0, 13.0, 9.0, 7.0, 2.0, 3.0, 5.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.77084732055664, -10.471405982971191, -10.171965599060059, -9.87252426147461, -9.573083877563477, -9.273642539978027, -8.974201202392578, -8.674760818481445, -8.375319480895996, -8.075878143310547, -7.776437759399414, -7.476996421813965, -7.177555561065674, -6.878114700317383, -6.578673839569092, -6.279232978820801, -5.97979211807251, -5.680351257324219, -5.380910396575928, -5.081469535827637, -4.7820281982421875, -4.4825873374938965, -4.1831464767456055, -3.8837053775787354, -3.5842645168304443, -3.2848236560821533, -2.985382556915283, -2.685941696166992, -2.386500835418701, -2.087059736251831, -1.78761887550354, -1.48817777633667, -1.188736915588379, -0.8892959356307983, -0.5898550152778625, -0.29041409492492676, 0.009026885032653809, 0.3084678649902344, 0.6079087257385254, 0.9073498249053955, 1.2067906856536865, 1.506231665611267, 1.8056726455688477, 2.1051135063171387, 2.4045543670654297, 2.7039954662323, 3.003436326980591, 3.302877426147461, 3.602318286895752, 3.901759147644043, 4.201200008392334, 4.500640869140625, 4.800082206726074, 5.099523067474365, 5.398963928222656, 5.6984052658081055, 5.997845649719238, 6.297286510467529, 6.59672737121582, 6.8961687088012695, 7.1956095695495605, 7.495050430297852, 7.794491291046143, 8.093932151794434, 8.393373489379883]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 6.0, 6.0, 14.0, 7.0, 12.0, 17.0, 20.0, 10.0, 20.0, 32.0, 24.0, 23.0, 29.0, 38.0, 22.0, 38.0, 29.0, 31.0, 47.0, 44.0, 39.0, 34.0, 31.0, 40.0, 31.0, 39.0, 25.0, 32.0, 25.0, 20.0, 30.0, 19.0, 24.0, 20.0, 28.0, 17.0, 16.0, 13.0, 10.0, 6.0, 6.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3396891951560974, -0.328610360622406, -0.3175315260887146, -0.3064526915550232, -0.2953738570213318, -0.284294992685318, -0.2732161581516266, -0.2621373236179352, -0.2510584890842438, -0.23997965455055237, -0.22890082001686096, -0.21782197058200836, -0.20674313604831696, -0.19566430151462555, -0.18458545207977295, -0.17350661754608154, -0.16242778301239014, -0.15134894847869873, -0.14027011394500732, -0.12919126451015472, -0.11811242997646332, -0.10703359544277191, -0.09595475345849991, -0.0848759114742279, -0.0737970769405365, -0.06271824240684509, -0.05163940042257309, -0.040560562163591385, -0.02948172390460968, -0.018402885645627975, -0.007324047386646271, 0.0037547945976257324, 0.014833599328994751, 0.025912437587976456, 0.03699127584695816, 0.048070114105939865, 0.05914895236492157, 0.07022778689861298, 0.08130662888288498, 0.09238547086715698, 0.10346430540084839, 0.1145431399345398, 0.1256219744682312, 0.1367008239030838, 0.1477796584367752, 0.1588584929704666, 0.1699373424053192, 0.18101617693901062, 0.19209501147270203, 0.20317384600639343, 0.21425268054008484, 0.22533152997493744, 0.23641036450862885, 0.24748919904232025, 0.25856804847717285, 0.26964688301086426, 0.28072571754455566, 0.29180455207824707, 0.3028833866119385, 0.3139622211456299, 0.3250410556793213, 0.3361199200153351, 0.3471987545490265, 0.3582775890827179, 0.3693564236164093]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 12.0, 11.0, 19.0, 38.0, 40.0, 87.0, 131.0, 239.0, 390.0, 732.0, 1285.0, 2647.0, 5726.0, 14209.0, 70288.0, 4057483.0, 24247.0, 8918.0, 3819.0, 1841.0, 934.0, 530.0, 277.0, 156.0, 67.0, 62.0, 31.0, 22.0, 9.0, 11.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.8359375, -6.66162109375, -6.4873046875, -6.31298828125, -6.138671875, -5.96435546875, -5.7900390625, -5.61572265625, -5.44140625, -5.26708984375, -5.0927734375, -4.91845703125, -4.744140625, -4.56982421875, -4.3955078125, -4.22119140625, -4.046875, -3.87255859375, -3.6982421875, -3.52392578125, -3.349609375, -3.17529296875, -3.0009765625, -2.82666015625, -2.65234375, -2.47802734375, -2.3037109375, -2.12939453125, -1.955078125, -1.78076171875, -1.6064453125, -1.43212890625, -1.2578125, -1.08349609375, -0.9091796875, -0.73486328125, -0.560546875, -0.38623046875, -0.2119140625, -0.03759765625, 0.13671875, 0.31103515625, 0.4853515625, 0.65966796875, 0.833984375, 1.00830078125, 1.1826171875, 1.35693359375, 1.53125, 1.70556640625, 1.8798828125, 2.05419921875, 2.228515625, 2.40283203125, 2.5771484375, 2.75146484375, 2.92578125, 3.10009765625, 3.2744140625, 3.44873046875, 3.623046875, 3.79736328125, 3.9716796875, 4.14599609375, 4.3203125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 10.0, 7.0, 3.0, 5.0, 13.0, 6.0, 12.0, 6.0, 15.0, 25.0, 71.0, 238.0, 291.0, 150.0, 34.0, 16.0, 16.0, 9.0, 7.0, 8.0, 8.0, 7.0, 7.0, 10.0, 3.0, 4.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1748046875, -0.16938209533691406, -0.16395950317382812, -0.1585369110107422, -0.15311431884765625, -0.1476917266845703, -0.14226913452148438, -0.13684654235839844, -0.1314239501953125, -0.12600135803222656, -0.12057876586914062, -0.11515617370605469, -0.10973358154296875, -0.10431098937988281, -0.09888839721679688, -0.09346580505371094, -0.088043212890625, -0.08262062072753906, -0.07719802856445312, -0.07177543640136719, -0.06635284423828125, -0.06093025207519531, -0.055507659912109375, -0.05008506774902344, -0.0446624755859375, -0.03923988342285156, -0.033817291259765625, -0.028394699096679688, -0.02297210693359375, -0.017549514770507812, -0.012126922607421875, -0.0067043304443359375, -0.00128173828125, 0.0041408538818359375, 0.009563446044921875, 0.014986038208007812, 0.02040863037109375, 0.025831222534179688, 0.031253814697265625, 0.03667640686035156, 0.0420989990234375, 0.04752159118652344, 0.052944183349609375, 0.05836677551269531, 0.06378936767578125, 0.06921195983886719, 0.07463455200195312, 0.08005714416503906, 0.085479736328125, 0.09090232849121094, 0.09632492065429688, 0.10174751281738281, 0.10717010498046875, 0.11259269714355469, 0.11801528930664062, 0.12343788146972656, 0.1288604736328125, 0.13428306579589844, 0.13970565795898438, 0.1451282501220703, 0.15055084228515625, 0.1559734344482422, 0.16139602661132812, 0.16681861877441406, 0.1722412109375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 15.0, 17.0, 23.0, 45.0, 68.0, 121.0, 188.0, 357.0, 608.0, 1236.0, 2920.0, 8415.0, 31430.0, 4058515.0, 69792.0, 12712.0, 4236.0, 1734.0, 826.0, 412.0, 232.0, 148.0, 82.0, 60.0, 30.0, 17.0, 10.0, 9.0, 12.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6328125, -3.514434814453125, -3.39605712890625, -3.277679443359375, -3.1593017578125, -3.040924072265625, -2.92254638671875, -2.804168701171875, -2.685791015625, -2.567413330078125, -2.44903564453125, -2.330657958984375, -2.2122802734375, -2.093902587890625, -1.97552490234375, -1.857147216796875, -1.73876953125, -1.620391845703125, -1.50201416015625, -1.383636474609375, -1.2652587890625, -1.146881103515625, -1.02850341796875, -0.910125732421875, -0.791748046875, -0.673370361328125, -0.55499267578125, -0.436614990234375, -0.3182373046875, -0.199859619140625, -0.08148193359375, 0.036895751953125, 0.1552734375, 0.273651123046875, 0.39202880859375, 0.510406494140625, 0.6287841796875, 0.747161865234375, 0.86553955078125, 0.983917236328125, 1.102294921875, 1.220672607421875, 1.33905029296875, 1.457427978515625, 1.5758056640625, 1.694183349609375, 1.81256103515625, 1.930938720703125, 2.04931640625, 2.167694091796875, 2.28607177734375, 2.404449462890625, 2.5228271484375, 2.641204833984375, 2.75958251953125, 2.877960205078125, 2.996337890625, 3.114715576171875, 3.23309326171875, 3.351470947265625, 3.4698486328125, 3.588226318359375, 3.70660400390625, 3.824981689453125, 3.943359375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 5.0, 9.0, 9.0, 22.0, 80.0, 3565.0, 258.0, 61.0, 19.0, 7.0, 8.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.1580047607421875, -1.122650146484375, -1.0872955322265625, -1.05194091796875, -1.0165863037109375, -0.981231689453125, -0.9458770751953125, -0.9105224609375, -0.8751678466796875, -0.839813232421875, -0.8044586181640625, -0.76910400390625, -0.7337493896484375, -0.698394775390625, -0.6630401611328125, -0.627685546875, -0.5923309326171875, -0.556976318359375, -0.5216217041015625, -0.48626708984375, -0.4509124755859375, -0.415557861328125, -0.3802032470703125, -0.3448486328125, -0.3094940185546875, -0.274139404296875, -0.2387847900390625, -0.20343017578125, -0.1680755615234375, -0.132720947265625, -0.0973663330078125, -0.06201171875, -0.0266571044921875, 0.008697509765625, 0.0440521240234375, 0.07940673828125, 0.1147613525390625, 0.150115966796875, 0.1854705810546875, 0.2208251953125, 0.2561798095703125, 0.291534423828125, 0.3268890380859375, 0.36224365234375, 0.3975982666015625, 0.432952880859375, 0.4683074951171875, 0.503662109375, 0.5390167236328125, 0.574371337890625, 0.6097259521484375, 0.64508056640625, 0.6804351806640625, 0.715789794921875, 0.7511444091796875, 0.7864990234375, 0.8218536376953125, 0.857208251953125, 0.8925628662109375, 0.92791748046875, 0.9632720947265625, 0.998626708984375, 1.0339813232421875, 1.0693359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 7.0, 6.0, 14.0, 23.0, 51.0, 93.0, 229.0, 325.0, 118.0, 54.0, 29.0, 18.0, 10.0, 12.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.74766731262207, -5.625807762145996, -5.503947734832764, -5.3820881843566895, -5.260228157043457, -5.138368606567383, -5.01650857925415, -4.894649028778076, -4.772789001464844, -4.6509294509887695, -4.529069423675537, -4.407209873199463, -4.2853498458862305, -4.163490295410156, -4.041630268096924, -3.9197707176208496, -3.7979109287261963, -3.676051139831543, -3.5541913509368896, -3.4323315620422363, -3.310471773147583, -3.1886119842529297, -3.0667524337768555, -2.944892406463623, -2.823032855987549, -2.7011730670928955, -2.579313278198242, -2.457453489303589, -2.3355937004089355, -2.2137339115142822, -2.091874122619629, -1.9700144529342651, -1.8481547832489014, -1.726294994354248, -1.6044352054595947, -1.4825754165649414, -1.360715627670288, -1.2388558387756348, -1.116996169090271, -0.9951363801956177, -0.8732765913009644, -0.751416802406311, -0.6295570135116577, -0.5076972842216492, -0.38583749532699585, -0.26397770643234253, -0.14211797714233398, -0.020258188247680664, 0.10160160064697266, 0.22346137464046478, 0.3453211486339569, 0.46718090772628784, 0.5890406966209412, 0.7109004855155945, 0.832760214805603, 0.9546200037002563, 1.0764797925949097, 1.198339581489563, 1.3201993703842163, 1.44205904006958, 1.5639188289642334, 1.6857786178588867, 1.80763840675354, 1.9294981956481934, 2.0513579845428467]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 8.0, 13.0, 15.0, 9.0, 8.0, 13.0, 18.0, 20.0, 20.0, 31.0, 24.0, 28.0, 33.0, 53.0, 38.0, 43.0, 55.0, 45.0, 34.0, 53.0, 34.0, 54.0, 44.0, 33.0, 35.0, 40.0, 25.0, 28.0, 19.0, 25.0, 22.0, 18.0, 8.0, 6.0, 7.0, 9.0, 11.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6442031860351562, -0.6242426633834839, -0.6042822003364563, -0.5843216776847839, -0.5643611550331116, -0.544400691986084, -0.5244401693344116, -0.5044796466827393, -0.4845191538333893, -0.4645586609840393, -0.44459813833236694, -0.42463764548301697, -0.404677152633667, -0.38471662998199463, -0.36475613713264465, -0.3447956442832947, -0.3248351216316223, -0.30487462878227234, -0.2849141061306, -0.26495361328125, -0.24499310553073883, -0.22503259778022766, -0.20507210493087769, -0.18511159718036652, -0.16515108942985535, -0.14519058167934418, -0.125230073928833, -0.10526958107948303, -0.08530907332897186, -0.0653485655784607, -0.04538806527853012, -0.02542756497859955, -0.005467116832733154, 0.014493387192487717, 0.03445389121770859, 0.05441439524292946, 0.07437489926815033, 0.0943354070186615, 0.11429590731859207, 0.13425640761852264, 0.1542169153690338, 0.17417742311954498, 0.19413793087005615, 0.21409842371940613, 0.2340589314699173, 0.25401943922042847, 0.27397993206977844, 0.2939404249191284, 0.3139009475708008, 0.33386144042015076, 0.3538219630718231, 0.3737824559211731, 0.39374297857284546, 0.41370347142219543, 0.4336639642715454, 0.4536244869232178, 0.47358497977256775, 0.4935454726219177, 0.5135059952735901, 0.5334665179252625, 0.55342698097229, 0.5733875036239624, 0.5933480262756348, 0.6133084893226624, 0.6332690119743347]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 9.0, 16.0, 12.0, 20.0, 32.0, 48.0, 59.0, 146.0, 220.0, 356.0, 690.0, 1432.0, 3531.0, 11516.0, 64907.0, 794739.0, 144090.0, 18319.0, 4890.0, 1803.0, 770.0, 383.0, 215.0, 123.0, 64.0, 44.0, 33.0, 25.0, 21.0, 8.0, 6.0, 5.0, 0.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.40185546875, -0.3911857604980469, -0.38051605224609375, -0.3698463439941406, -0.3591766357421875, -0.3485069274902344, -0.33783721923828125, -0.3271675109863281, -0.316497802734375, -0.3058280944824219, -0.29515838623046875, -0.2844886779785156, -0.2738189697265625, -0.2631492614746094, -0.25247955322265625, -0.24180984497070312, -0.23114013671875, -0.22047042846679688, -0.20980072021484375, -0.19913101196289062, -0.1884613037109375, -0.17779159545898438, -0.16712188720703125, -0.15645217895507812, -0.145782470703125, -0.13511276245117188, -0.12444305419921875, -0.11377334594726562, -0.1031036376953125, -0.09243392944335938, -0.08176422119140625, -0.07109451293945312, -0.0604248046875, -0.049755096435546875, -0.03908538818359375, -0.028415679931640625, -0.0177459716796875, -0.007076263427734375, 0.00359344482421875, 0.014263153076171875, 0.024932861328125, 0.035602569580078125, 0.04627227783203125, 0.056941986083984375, 0.0676116943359375, 0.07828140258789062, 0.08895111083984375, 0.09962081909179688, 0.11029052734375, 0.12096023559570312, 0.13162994384765625, 0.14229965209960938, 0.1529693603515625, 0.16363906860351562, 0.17430877685546875, 0.18497848510742188, 0.195648193359375, 0.20631790161132812, 0.21698760986328125, 0.22765731811523438, 0.2383270263671875, 0.24899673461914062, 0.25966644287109375, 0.2703361511230469, 0.281005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 6.0, 6.0, 12.0, 14.0, 20.0, 34.0, 38.0, 52.0, 67.0, 116.0, 126.0, 117.0, 109.0, 103.0, 59.0, 46.0, 23.0, 21.0, 8.0, 5.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.1431732177734375, -1.111541748046875, -1.0799102783203125, -1.04827880859375, -1.0166473388671875, -0.985015869140625, -0.9533843994140625, -0.9217529296875, -0.8901214599609375, -0.858489990234375, -0.8268585205078125, -0.79522705078125, -0.7635955810546875, -0.731964111328125, -0.7003326416015625, -0.668701171875, -0.6370697021484375, -0.605438232421875, -0.5738067626953125, -0.54217529296875, -0.5105438232421875, -0.478912353515625, -0.4472808837890625, -0.4156494140625, -0.3840179443359375, -0.352386474609375, -0.3207550048828125, -0.28912353515625, -0.2574920654296875, -0.225860595703125, -0.1942291259765625, -0.16259765625, -0.1309661865234375, -0.099334716796875, -0.0677032470703125, -0.03607177734375, -0.0044403076171875, 0.027191162109375, 0.0588226318359375, 0.0904541015625, 0.1220855712890625, 0.153717041015625, 0.1853485107421875, 0.21697998046875, 0.2486114501953125, 0.280242919921875, 0.3118743896484375, 0.343505859375, 0.3751373291015625, 0.406768798828125, 0.4384002685546875, 0.47003173828125, 0.5016632080078125, 0.533294677734375, 0.5649261474609375, 0.5965576171875, 0.6281890869140625, 0.659820556640625, 0.6914520263671875, 0.72308349609375, 0.7547149658203125, 0.786346435546875, 0.8179779052734375, 0.849609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 7.0, 4.0, 10.0, 14.0, 15.0, 24.0, 30.0, 44.0, 39.0, 64.0, 85.0, 128.0, 183.0, 386.0, 905.0, 3103.0, 14960.0, 130963.0, 817191.0, 66828.0, 9605.0, 2227.0, 755.0, 337.0, 174.0, 112.0, 97.0, 50.0, 46.0, 38.0, 32.0, 18.0, 18.0, 14.0, 12.0, 11.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050018310546875, -0.04831504821777344, -0.046611785888671875, -0.04490852355957031, -0.04320526123046875, -0.04150199890136719, -0.039798736572265625, -0.03809547424316406, -0.0363922119140625, -0.03468894958496094, -0.032985687255859375, -0.03128242492675781, -0.02957916259765625, -0.027875900268554688, -0.026172637939453125, -0.024469375610351562, -0.02276611328125, -0.021062850952148438, -0.019359588623046875, -0.017656326293945312, -0.01595306396484375, -0.014249801635742188, -0.012546539306640625, -0.010843276977539062, -0.0091400146484375, -0.0074367523193359375, -0.005733489990234375, -0.0040302276611328125, -0.00232696533203125, -0.0006237030029296875, 0.001079559326171875, 0.0027828216552734375, 0.004486083984375, 0.0061893463134765625, 0.007892608642578125, 0.009595870971679688, 0.01129913330078125, 0.013002395629882812, 0.014705657958984375, 0.016408920288085938, 0.0181121826171875, 0.019815444946289062, 0.021518707275390625, 0.023221969604492188, 0.02492523193359375, 0.026628494262695312, 0.028331756591796875, 0.030035018920898438, 0.03173828125, 0.03344154357910156, 0.035144805908203125, 0.03684806823730469, 0.03855133056640625, 0.04025459289550781, 0.041957855224609375, 0.04366111755371094, 0.0453643798828125, 0.04706764221191406, 0.048770904541015625, 0.05047416687011719, 0.05217742919921875, 0.05388069152832031, 0.055583953857421875, 0.05728721618652344, 0.058990478515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 7.0, 6.0, 3.0, 7.0, 9.0, 5.0, 10.0, 18.0, 16.0, 25.0, 32.0, 36.0, 34.0, 33.0, 44.0, 30.0, 42.0, 50.0, 51.0, 53.0, 55.0, 47.0, 38.0, 45.0, 42.0, 48.0, 39.0, 51.0, 20.0, 15.0, 20.0, 15.0, 7.0, 11.0, 9.0, 9.0, 8.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.2337799072265625, -1.190216064453125, -1.1466522216796875, -1.10308837890625, -1.0595245361328125, -1.015960693359375, -0.9723968505859375, -0.9288330078125, -0.8852691650390625, -0.841705322265625, -0.7981414794921875, -0.75457763671875, -0.7110137939453125, -0.667449951171875, -0.6238861083984375, -0.580322265625, -0.5367584228515625, -0.493194580078125, -0.4496307373046875, -0.40606689453125, -0.3625030517578125, -0.318939208984375, -0.2753753662109375, -0.2318115234375, -0.1882476806640625, -0.144683837890625, -0.1011199951171875, -0.05755615234375, -0.0139923095703125, 0.029571533203125, 0.0731353759765625, 0.11669921875, 0.1602630615234375, 0.203826904296875, 0.2473907470703125, 0.29095458984375, 0.3345184326171875, 0.378082275390625, 0.4216461181640625, 0.4652099609375, 0.5087738037109375, 0.552337646484375, 0.5959014892578125, 0.63946533203125, 0.6830291748046875, 0.726593017578125, 0.7701568603515625, 0.813720703125, 0.8572845458984375, 0.900848388671875, 0.9444122314453125, 0.98797607421875, 1.0315399169921875, 1.075103759765625, 1.1186676025390625, 1.1622314453125, 1.2057952880859375, 1.249359130859375, 1.2929229736328125, 1.33648681640625, 1.3800506591796875, 1.423614501953125, 1.4671783447265625, 1.5107421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 12.0, 12.0, 18.0, 35.0, 37.0, 52.0, 69.0, 86.0, 136.0, 169.0, 213.0, 321.0, 434.0, 581.0, 837.0, 1161.0, 1613.0, 2378.0, 3475.0, 5344.0, 8596.0, 14349.0, 27380.0, 64455.0, 307856.0, 468946.0, 70529.0, 28886.0, 14894.0, 8602.0, 5414.0, 3542.0, 2383.0, 1591.0, 1149.0, 800.0, 585.0, 402.0, 311.0, 236.0, 167.0, 118.0, 109.0, 69.0, 45.0, 37.0, 37.0, 30.0, 11.0, 11.0, 10.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.0011262893676757812, -0.0010911375284194946, -0.001055985689163208, -0.0010208338499069214, -0.0009856820106506348, -0.0009505301713943481, -0.0009153783321380615, -0.0008802264928817749, -0.0008450746536254883, -0.0008099228143692017, -0.000774770975112915, -0.0007396191358566284, -0.0007044672966003418, -0.0006693154573440552, -0.0006341636180877686, -0.0005990117788314819, -0.0005638599395751953, -0.0005287081003189087, -0.0004935562610626221, -0.00045840442180633545, -0.00042325258255004883, -0.0003881007432937622, -0.0003529489040374756, -0.00031779706478118896, -0.00028264522552490234, -0.0002474933862686157, -0.0002123415470123291, -0.00017718970775604248, -0.00014203786849975586, -0.00010688602924346924, -7.173418998718262e-05, -3.6582350730895996e-05, -1.430511474609375e-06, 3.3721327781677246e-05, 6.887316703796387e-05, 0.00010402500629425049, 0.0001391768455505371, 0.00017432868480682373, 0.00020948052406311035, 0.00024463236331939697, 0.0002797842025756836, 0.0003149360418319702, 0.00035008788108825684, 0.00038523972034454346, 0.0004203915596008301, 0.0004555433988571167, 0.0004906952381134033, 0.0005258470773696899, 0.0005609989166259766, 0.0005961507558822632, 0.0006313025951385498, 0.0006664544343948364, 0.000701606273651123, 0.0007367581129074097, 0.0007719099521636963, 0.0008070617914199829, 0.0008422136306762695, 0.0008773654699325562, 0.0009125173091888428, 0.0009476691484451294, 0.000982820987701416, 0.0010179728269577026, 0.0010531246662139893, 0.0010882765054702759, 0.0011234283447265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 12.0, 4.0, 1.0, 3.0, 12.0, 6.0, 5.0, 19.0, 9.0, 15.0, 12.0, 51.0, 49.0, 89.0, 336.0, 148.0, 77.0, 29.0, 33.0, 16.0, 13.0, 25.0, 5.0, 5.0, 2.0, 12.0, 4.0, 0.0, 12.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001220703125, -0.00011766329407691956, -0.00011325627565383911, -0.00010884925723075867, -0.00010444223880767822, -0.00010003522038459778, -9.562820196151733e-05, -9.122118353843689e-05, -8.681416511535645e-05, -8.2407146692276e-05, -7.800012826919556e-05, -7.359310984611511e-05, -6.918609142303467e-05, -6.477907299995422e-05, -6.037205457687378e-05, -5.5965036153793335e-05, -5.155801773071289e-05, -4.7150999307632446e-05, -4.2743980884552e-05, -3.833696246147156e-05, -3.392994403839111e-05, -2.952292561531067e-05, -2.5115907192230225e-05, -2.070888876914978e-05, -1.6301870346069336e-05, -1.1894851922988892e-05, -7.487833499908447e-06, -3.080815076828003e-06, 1.3262033462524414e-06, 5.733221769332886e-06, 1.014024019241333e-05, 1.4547258615493774e-05, 1.895427703857422e-05, 2.3361295461654663e-05, 2.7768313884735107e-05, 3.217533230781555e-05, 3.6582350730895996e-05, 4.098936915397644e-05, 4.5396387577056885e-05, 4.980340600013733e-05, 5.4210424423217773e-05, 5.861744284629822e-05, 6.302446126937866e-05, 6.74314796924591e-05, 7.183849811553955e-05, 7.624551653862e-05, 8.065253496170044e-05, 8.505955338478088e-05, 8.946657180786133e-05, 9.387359023094177e-05, 9.828060865402222e-05, 0.00010268762707710266, 0.0001070946455001831, 0.00011150166392326355, 0.000115908682346344, 0.00012031570076942444, 0.00012472271919250488, 0.00012912973761558533, 0.00013353675603866577, 0.00013794377446174622, 0.00014235079288482666, 0.0001467578113079071, 0.00015116482973098755, 0.000155571848154068, 0.00015997886657714844]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 18.0, 16.0, 22.0, 35.0, 48.0, 64.0, 101.0, 124.0, 184.0, 250.0, 390.0, 537.0, 735.0, 1051.0, 1477.0, 2264.0, 3638.0, 6258.0, 12162.0, 30105.0, 113415.0, 734200.0, 88717.0, 25999.0, 10738.0, 5710.0, 3381.0, 2176.0, 1418.0, 971.0, 662.0, 488.0, 330.0, 230.0, 173.0, 121.0, 95.0, 69.0, 46.0, 33.0, 28.0, 25.0, 14.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011463165283203125, -0.0011098384857177734, -0.0010733604431152344, -0.0010368824005126953, -0.0010004043579101562, -0.0009639263153076172, -0.0009274482727050781, -0.0008909702301025391, -0.0008544921875, -0.0008180141448974609, -0.0007815361022949219, -0.0007450580596923828, -0.0007085800170898438, -0.0006721019744873047, -0.0006356239318847656, -0.0005991458892822266, -0.0005626678466796875, -0.0005261898040771484, -0.0004897117614746094, -0.0004532337188720703, -0.00041675567626953125, -0.0003802776336669922, -0.0003437995910644531, -0.00030732154846191406, -0.000270843505859375, -0.00023436546325683594, -0.00019788742065429688, -0.0001614093780517578, -0.00012493133544921875, -8.845329284667969e-05, -5.1975250244140625e-05, -1.5497207641601562e-05, 2.09808349609375e-05, 5.745887756347656e-05, 9.393692016601562e-05, 0.0001304149627685547, 0.00016689300537109375, 0.0002033710479736328, 0.00023984909057617188, 0.00027632713317871094, 0.00031280517578125, 0.00034928321838378906, 0.0003857612609863281, 0.0004222393035888672, 0.00045871734619140625, 0.0004951953887939453, 0.0005316734313964844, 0.0005681514739990234, 0.0006046295166015625, 0.0006411075592041016, 0.0006775856018066406, 0.0007140636444091797, 0.0007505416870117188, 0.0007870197296142578, 0.0008234977722167969, 0.0008599758148193359, 0.000896453857421875, 0.0009329319000244141, 0.0009694099426269531, 0.0010058879852294922, 0.0010423660278320312, 0.0010788440704345703, 0.0011153221130371094, 0.0011518001556396484, 0.0011882781982421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 10.0, 14.0, 14.0, 15.0, 37.0, 45.0, 69.0, 104.0, 279.0, 137.0, 81.0, 55.0, 42.0, 19.0, 11.0, 6.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004153251647949219, -0.0004025772213935852, -0.00038982927799224854, -0.00037708133459091187, -0.0003643333911895752, -0.0003515854477882385, -0.00033883750438690186, -0.0003260895609855652, -0.0003133416175842285, -0.00030059367418289185, -0.0002878457307815552, -0.0002750977873802185, -0.00026234984397888184, -0.00024960190057754517, -0.0002368539571762085, -0.00022410601377487183, -0.00021135807037353516, -0.00019861012697219849, -0.00018586218357086182, -0.00017311424016952515, -0.00016036629676818848, -0.0001476183533668518, -0.00013487040996551514, -0.00012212246656417847, -0.0001093745231628418, -9.662657976150513e-05, -8.387863636016846e-05, -7.113069295883179e-05, -5.838274955749512e-05, -4.563480615615845e-05, -3.288686275482178e-05, -2.0138919353485107e-05, -7.3909759521484375e-06, 5.356967449188232e-06, 1.8104910850524902e-05, 3.085285425186157e-05, 4.360079765319824e-05, 5.634874105453491e-05, 6.909668445587158e-05, 8.184462785720825e-05, 9.459257125854492e-05, 0.00010734051465988159, 0.00012008845806121826, 0.00013283640146255493, 0.0001455843448638916, 0.00015833228826522827, 0.00017108023166656494, 0.0001838281750679016, 0.00019657611846923828, 0.00020932406187057495, 0.00022207200527191162, 0.0002348199486732483, 0.00024756789207458496, 0.00026031583547592163, 0.0002730637788772583, 0.00028581172227859497, 0.00029855966567993164, 0.0003113076090812683, 0.000324055552482605, 0.00033680349588394165, 0.0003495514392852783, 0.000362299382686615, 0.00037504732608795166, 0.00038779526948928833, 0.000400543212890625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 11.0, 12.0, 24.0, 51.0, 114.0, 437.0, 210.0, 63.0, 38.0, 14.0, 11.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.689807176589966, -2.625455617904663, -2.5611042976379395, -2.4967527389526367, -2.432401418685913, -2.3680498600006104, -2.3036985397338867, -2.239346981048584, -2.1749954223632812, -2.1106438636779785, -2.046292543411255, -1.9819411039352417, -1.9175896644592285, -1.8532381057739258, -1.7888866662979126, -1.7245352268218994, -1.6601839065551758, -1.5958324670791626, -1.5314810276031494, -1.4671295881271362, -1.402778148651123, -1.3384265899658203, -1.2740751504898071, -1.209723711013794, -1.1453722715377808, -1.0810208320617676, -1.0166693925857544, -0.9523178935050964, -0.8879664540290833, -0.8236150145530701, -0.7592635154724121, -0.6949120759963989, -0.6305607557296753, -0.5662093162536621, -0.5018578767776489, -0.43750637769699097, -0.3731549382209778, -0.3088034987449646, -0.24445202946662903, -0.18010056018829346, -0.11574912071228027, -0.051397666335105896, 0.012953788042068481, 0.07730524241924286, 0.14165669679641724, 0.20600813627243042, 0.270359605550766, 0.33471107482910156, 0.39906251430511475, 0.46341395378112793, 0.5277653932571411, 0.5921168923377991, 0.6564683318138123, 0.7208197712898254, 0.7851712703704834, 0.8495227098464966, 0.9138741493225098, 0.978225588798523, 1.0425770282745361, 1.1069284677505493, 1.1712799072265625, 1.2356314659118652, 1.2999829053878784, 1.3643343448638916, 1.4286857843399048]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 6.0, 12.0, 7.0, 6.0, 15.0, 9.0, 13.0, 24.0, 21.0, 21.0, 22.0, 33.0, 35.0, 38.0, 52.0, 35.0, 53.0, 41.0, 40.0, 37.0, 47.0, 42.0, 44.0, 42.0, 31.0, 34.0, 36.0, 33.0, 24.0, 19.0, 23.0, 22.0, 12.0, 12.0, 5.0, 6.0, 9.0, 4.0, 10.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2573203444480896, -0.24927844107151031, -0.24123655259609222, -0.23319464921951294, -0.22515276074409485, -0.21711085736751556, -0.20906895399093628, -0.2010270655155182, -0.1929851621389389, -0.18494325876235962, -0.17690137028694153, -0.16885946691036224, -0.16081756353378296, -0.15277567505836487, -0.14473377168178558, -0.1366918683052063, -0.1286499798297882, -0.12060808390378952, -0.11256618797779083, -0.10452428460121155, -0.09648238867521286, -0.08844049274921417, -0.08039858937263489, -0.0723566934466362, -0.06431479752063751, -0.056272901594638824, -0.04823100194334984, -0.04018910229206085, -0.032147206366062164, -0.024105310440063477, -0.01606341078877449, -0.008021511137485504, 2.0384788513183594e-05, 0.00806228257715702, 0.016104180365800858, 0.024146078154444695, 0.03218797594308853, 0.04022987186908722, 0.048271771520376205, 0.05631367117166519, 0.06435556709766388, 0.07239746302366257, 0.08043935894966125, 0.08848126232624054, 0.09652315825223923, 0.10456505417823792, 0.1126069575548172, 0.12064885348081589, 0.12869074940681458, 0.13673265278339386, 0.14477454125881195, 0.15281644463539124, 0.16085833311080933, 0.1689002364873886, 0.1769421398639679, 0.184984028339386, 0.19302593171596527, 0.20106783509254456, 0.20910972356796265, 0.21715162694454193, 0.22519353032112122, 0.2332354187965393, 0.2412773221731186, 0.24931922554969788, 0.25736111402511597]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 7.0, 6.0, 7.0, 9.0, 19.0, 9.0, 28.0, 36.0, 40.0, 53.0, 80.0, 124.0, 162.0, 230.0, 339.0, 522.0, 774.0, 1215.0, 1961.0, 3337.0, 6192.0, 11845.0, 25776.0, 66108.0, 275413.0, 495571.0, 92755.0, 33326.0, 14792.0, 7285.0, 4076.0, 2254.0, 1456.0, 885.0, 568.0, 410.0, 267.0, 160.0, 130.0, 79.0, 65.0, 52.0, 25.0, 25.0, 23.0, 12.0, 11.0, 10.0, 5.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.398193359375, -0.3858070373535156, -0.37342071533203125, -0.3610343933105469, -0.3486480712890625, -0.3362617492675781, -0.32387542724609375, -0.3114891052246094, -0.299102783203125, -0.2867164611816406, -0.27433013916015625, -0.2619438171386719, -0.2495574951171875, -0.23717117309570312, -0.22478485107421875, -0.21239852905273438, -0.20001220703125, -0.18762588500976562, -0.17523956298828125, -0.16285324096679688, -0.1504669189453125, -0.13808059692382812, -0.12569427490234375, -0.11330795288085938, -0.100921630859375, -0.08853530883789062, -0.07614898681640625, -0.06376266479492188, -0.0513763427734375, -0.038990020751953125, -0.02660369873046875, -0.014217376708984375, -0.0018310546875, 0.010555267333984375, 0.02294158935546875, 0.035327911376953125, 0.0477142333984375, 0.060100555419921875, 0.07248687744140625, 0.08487319946289062, 0.097259521484375, 0.10964584350585938, 0.12203216552734375, 0.13441848754882812, 0.1468048095703125, 0.15919113159179688, 0.17157745361328125, 0.18396377563476562, 0.19635009765625, 0.20873641967773438, 0.22112274169921875, 0.23350906372070312, 0.2458953857421875, 0.2582817077636719, 0.27066802978515625, 0.2830543518066406, 0.295440673828125, 0.3078269958496094, 0.32021331787109375, 0.3325996398925781, 0.3449859619140625, 0.3573722839355469, 0.36975860595703125, 0.3821449279785156, 0.39453125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 7.0, 9.0, 3.0, 15.0, 31.0, 32.0, 61.0, 88.0, 135.0, 129.0, 148.0, 111.0, 82.0, 45.0, 29.0, 21.0, 12.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054718017578125, -0.052994728088378906, -0.05127143859863281, -0.04954814910888672, -0.047824859619140625, -0.04610157012939453, -0.04437828063964844, -0.042654991149902344, -0.04093170166015625, -0.039208412170410156, -0.03748512268066406, -0.03576183319091797, -0.034038543701171875, -0.03231525421142578, -0.030591964721679688, -0.028868675231933594, -0.0271453857421875, -0.025422096252441406, -0.023698806762695312, -0.02197551727294922, -0.020252227783203125, -0.01852893829345703, -0.016805648803710938, -0.015082359313964844, -0.01335906982421875, -0.011635780334472656, -0.009912490844726562, -0.008189201354980469, -0.006465911865234375, -0.004742622375488281, -0.0030193328857421875, -0.0012960433959960938, 0.00042724609375, 0.0021505355834960938, 0.0038738250732421875, 0.005597114562988281, 0.007320404052734375, 0.009043693542480469, 0.010766983032226562, 0.012490272521972656, 0.01421356201171875, 0.015936851501464844, 0.017660140991210938, 0.01938343048095703, 0.021106719970703125, 0.02283000946044922, 0.024553298950195312, 0.026276588439941406, 0.0279998779296875, 0.029723167419433594, 0.03144645690917969, 0.03316974639892578, 0.034893035888671875, 0.03661632537841797, 0.03833961486816406, 0.040062904357910156, 0.04178619384765625, 0.043509483337402344, 0.04523277282714844, 0.04695606231689453, 0.048679351806640625, 0.05040264129638672, 0.05212593078613281, 0.053849220275878906, 0.055572509765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 7.0, 10.0, 12.0, 16.0, 16.0, 42.0, 45.0, 74.0, 113.0, 149.0, 238.0, 337.0, 478.0, 784.0, 1171.0, 1774.0, 2912.0, 4757.0, 8166.0, 14103.0, 26000.0, 50967.0, 115146.0, 389444.0, 252661.0, 87101.0, 40766.0, 21603.0, 11665.0, 6724.0, 4074.0, 2489.0, 1617.0, 969.0, 671.0, 453.0, 309.0, 218.0, 126.0, 101.0, 70.0, 50.0, 27.0, 34.0, 27.0, 12.0, 9.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.09283447265625, -0.08950042724609375, -0.0861663818359375, -0.08283233642578125, -0.079498291015625, -0.07616424560546875, -0.0728302001953125, -0.06949615478515625, -0.066162109375, -0.06282806396484375, -0.0594940185546875, -0.05615997314453125, -0.052825927734375, -0.04949188232421875, -0.0461578369140625, -0.04282379150390625, -0.03948974609375, -0.03615570068359375, -0.0328216552734375, -0.02948760986328125, -0.026153564453125, -0.02281951904296875, -0.0194854736328125, -0.01615142822265625, -0.0128173828125, -0.00948333740234375, -0.0061492919921875, -0.00281524658203125, 0.000518798828125, 0.00385284423828125, 0.0071868896484375, 0.01052093505859375, 0.01385498046875, 0.01718902587890625, 0.0205230712890625, 0.02385711669921875, 0.027191162109375, 0.03052520751953125, 0.0338592529296875, 0.03719329833984375, 0.04052734375, 0.04386138916015625, 0.0471954345703125, 0.05052947998046875, 0.053863525390625, 0.05719757080078125, 0.0605316162109375, 0.06386566162109375, 0.06719970703125, 0.07053375244140625, 0.0738677978515625, 0.07720184326171875, 0.080535888671875, 0.08386993408203125, 0.0872039794921875, 0.09053802490234375, 0.0938720703125, 0.09720611572265625, 0.1005401611328125, 0.10387420654296875, 0.107208251953125, 0.11054229736328125, 0.1138763427734375, 0.11721038818359375, 0.12054443359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 6.0, 13.0, 10.0, 4.0, 17.0, 15.0, 27.0, 18.0, 30.0, 24.0, 31.0, 48.0, 69.0, 40.0, 61.0, 64.0, 72.0, 53.0, 46.0, 42.0, 50.0, 43.0, 34.0, 33.0, 28.0, 28.0, 13.0, 18.0, 11.0, 15.0, 5.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06494140625, -0.06298589706420898, -0.06103038787841797, -0.05907487869262695, -0.05711936950683594, -0.05516386032104492, -0.053208351135253906, -0.05125284194946289, -0.049297332763671875, -0.04734182357788086, -0.045386314392089844, -0.04343080520629883, -0.04147529602050781, -0.0395197868347168, -0.03756427764892578, -0.035608768463134766, -0.03365325927734375, -0.031697750091552734, -0.02974224090576172, -0.027786731719970703, -0.025831222534179688, -0.023875713348388672, -0.021920204162597656, -0.01996469497680664, -0.018009185791015625, -0.01605367660522461, -0.014098167419433594, -0.012142658233642578, -0.010187149047851562, -0.008231639862060547, -0.006276130676269531, -0.004320621490478516, -0.0023651123046875, -0.0004096031188964844, 0.0015459060668945312, 0.003501415252685547, 0.0054569244384765625, 0.007412433624267578, 0.009367942810058594, 0.01132345199584961, 0.013278961181640625, 0.01523447036743164, 0.017189979553222656, 0.019145488739013672, 0.021100997924804688, 0.023056507110595703, 0.02501201629638672, 0.026967525482177734, 0.02892303466796875, 0.030878543853759766, 0.03283405303955078, 0.0347895622253418, 0.03674507141113281, 0.03870058059692383, 0.040656089782714844, 0.04261159896850586, 0.044567108154296875, 0.04652261734008789, 0.048478126525878906, 0.05043363571166992, 0.05238914489746094, 0.05434465408325195, 0.05630016326904297, 0.058255672454833984, 0.060211181640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 10.0, 6.0, 11.0, 16.0, 19.0, 20.0, 41.0, 50.0, 88.0, 118.0, 193.0, 282.0, 403.0, 749.0, 1638.0, 6344.0, 970341.0, 61020.0, 4127.0, 1267.0, 677.0, 363.0, 245.0, 160.0, 106.0, 79.0, 46.0, 44.0, 19.0, 20.0, 22.0, 9.0, 8.0, 2.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.4197883605957031, -0.40525054931640625, -0.3907127380371094, -0.3761749267578125, -0.3616371154785156, -0.34709930419921875, -0.3325614929199219, -0.318023681640625, -0.3034858703613281, -0.28894805908203125, -0.2744102478027344, -0.2598724365234375, -0.24533462524414062, -0.23079681396484375, -0.21625900268554688, -0.20172119140625, -0.18718338012695312, -0.17264556884765625, -0.15810775756835938, -0.1435699462890625, -0.12903213500976562, -0.11449432373046875, -0.09995651245117188, -0.085418701171875, -0.07088088989257812, -0.05634307861328125, -0.041805267333984375, -0.0272674560546875, -0.012729644775390625, 0.00180816650390625, 0.016345977783203125, 0.0308837890625, 0.045421600341796875, 0.05995941162109375, 0.07449722290039062, 0.0890350341796875, 0.10357284545898438, 0.11811065673828125, 0.13264846801757812, 0.147186279296875, 0.16172409057617188, 0.17626190185546875, 0.19079971313476562, 0.2053375244140625, 0.21987533569335938, 0.23441314697265625, 0.24895095825195312, 0.26348876953125, 0.2780265808105469, 0.29256439208984375, 0.3071022033691406, 0.3216400146484375, 0.3361778259277344, 0.35071563720703125, 0.3652534484863281, 0.379791259765625, 0.3943290710449219, 0.40886688232421875, 0.4234046936035156, 0.4379425048828125, 0.4524803161621094, 0.46701812744140625, 0.4815559387207031, 0.49609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 12.0, 9.0, 19.0, 40.0, 294.0, 480.0, 59.0, 26.0, 10.0, 15.0, 6.0, 5.0, 2.0, 3.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.90678134560585e-05, -6.63120299577713e-05, -6.35562464594841e-05, -6.08004629611969e-05, -5.80446794629097e-05, -5.52888959646225e-05, -5.25331124663353e-05, -4.9777328968048096e-05, -4.7021545469760895e-05, -4.4265761971473694e-05, -4.150997847318649e-05, -3.875419497489929e-05, -3.599841147661209e-05, -3.324262797832489e-05, -3.048684448003769e-05, -2.7731060981750488e-05, -2.4975277483463287e-05, -2.2219493985176086e-05, -1.9463710486888885e-05, -1.6707926988601685e-05, -1.3952143490314484e-05, -1.1196359992027283e-05, -8.440576493740082e-06, -5.684792995452881e-06, -2.92900949716568e-06, -1.73225998878479e-07, 2.582557499408722e-06, 5.338340997695923e-06, 8.094124495983124e-06, 1.0849907994270325e-05, 1.3605691492557526e-05, 1.6361474990844727e-05, 1.9117258489131927e-05, 2.187304198741913e-05, 2.462882548570633e-05, 2.738460898399353e-05, 3.014039248228073e-05, 3.289617598056793e-05, 3.565195947885513e-05, 3.8407742977142334e-05, 4.1163526475429535e-05, 4.3919309973716736e-05, 4.667509347200394e-05, 4.943087697029114e-05, 5.218666046857834e-05, 5.494244396686554e-05, 5.769822746515274e-05, 6.045401096343994e-05, 6.320979446172714e-05, 6.596557796001434e-05, 6.872136145830154e-05, 7.147714495658875e-05, 7.423292845487595e-05, 7.698871195316315e-05, 7.974449545145035e-05, 8.250027894973755e-05, 8.525606244802475e-05, 8.801184594631195e-05, 9.076762944459915e-05, 9.352341294288635e-05, 9.627919644117355e-05, 9.903497993946075e-05, 0.00010179076343774796, 0.00010454654693603516]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 9.0, 6.0, 6.0, 10.0, 16.0, 11.0, 21.0, 31.0, 40.0, 70.0, 79.0, 110.0, 158.0, 202.0, 263.0, 401.0, 539.0, 801.0, 1094.0, 1707.0, 2534.0, 4415.0, 9279.0, 38778.0, 948974.0, 20659.0, 7380.0, 3708.0, 2268.0, 1469.0, 1010.0, 696.0, 502.0, 370.0, 237.0, 191.0, 114.0, 101.0, 75.0, 52.0, 45.0, 29.0, 33.0, 20.0, 7.0, 15.0, 6.0, 3.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12176513671875, -0.11800193786621094, -0.11423873901367188, -0.11047554016113281, -0.10671234130859375, -0.10294914245605469, -0.09918594360351562, -0.09542274475097656, -0.0916595458984375, -0.08789634704589844, -0.08413314819335938, -0.08036994934082031, -0.07660675048828125, -0.07284355163574219, -0.06908035278320312, -0.06531715393066406, -0.061553955078125, -0.05779075622558594, -0.054027557373046875, -0.05026435852050781, -0.04650115966796875, -0.04273796081542969, -0.038974761962890625, -0.03521156311035156, -0.0314483642578125, -0.027685165405273438, -0.023921966552734375, -0.020158767700195312, -0.01639556884765625, -0.012632369995117188, -0.008869171142578125, -0.0051059722900390625, -0.0013427734375, 0.0024204254150390625, 0.006183624267578125, 0.009946823120117188, 0.01371002197265625, 0.017473220825195312, 0.021236419677734375, 0.024999618530273438, 0.0287628173828125, 0.03252601623535156, 0.036289215087890625, 0.04005241394042969, 0.04381561279296875, 0.04757881164550781, 0.051342010498046875, 0.05510520935058594, 0.058868408203125, 0.06263160705566406, 0.06639480590820312, 0.07015800476074219, 0.07392120361328125, 0.07768440246582031, 0.08144760131835938, 0.08521080017089844, 0.0889739990234375, 0.09273719787597656, 0.09650039672851562, 0.10026359558105469, 0.10402679443359375, 0.10778999328613281, 0.11155319213867188, 0.11531639099121094, 0.11907958984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 6.0, 6.0, 35.0, 208.0, 615.0, 50.0, 9.0, 15.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07421875, -0.07176399230957031, -0.06930923461914062, -0.06685447692871094, -0.06439971923828125, -0.06194496154785156, -0.059490203857421875, -0.05703544616699219, -0.0545806884765625, -0.05212593078613281, -0.049671173095703125, -0.04721641540527344, -0.04476165771484375, -0.04230690002441406, -0.039852142333984375, -0.03739738464355469, -0.034942626953125, -0.03248786926269531, -0.030033111572265625, -0.027578353881835938, -0.02512359619140625, -0.022668838500976562, -0.020214080810546875, -0.017759323120117188, -0.0153045654296875, -0.012849807739257812, -0.010395050048828125, -0.007940292358398438, -0.00548553466796875, -0.0030307769775390625, -0.000576019287109375, 0.0018787384033203125, 0.00433349609375, 0.0067882537841796875, 0.009243011474609375, 0.011697769165039062, 0.01415252685546875, 0.016607284545898438, 0.019062042236328125, 0.021516799926757812, 0.0239715576171875, 0.026426315307617188, 0.028881072998046875, 0.03133583068847656, 0.03379058837890625, 0.03624534606933594, 0.038700103759765625, 0.04115486145019531, 0.043609619140625, 0.04606437683105469, 0.048519134521484375, 0.05097389221191406, 0.05342864990234375, 0.05588340759277344, 0.058338165283203125, 0.06079292297363281, 0.0632476806640625, 0.06570243835449219, 0.06815719604492188, 0.07061195373535156, 0.07306671142578125, 0.07552146911621094, 0.07797622680664062, 0.08043098449707031, 0.0828857421875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 10.0, 15.0, 29.0, 51.0, 46.0, 135.0, 296.0, 208.0, 97.0, 47.0, 26.0, 15.0, 6.0, 10.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49589839577674866, -0.466234415769577, -0.4365704655647278, -0.40690648555755615, -0.3772425055503845, -0.3475785255432129, -0.31791457533836365, -0.288250595331192, -0.2585866451263428, -0.22892268002033234, -0.1992587000131607, -0.16959473490715027, -0.13993075489997864, -0.1102667897939682, -0.08060282468795776, -0.05093884468078613, -0.021274864673614502, 0.008389106020331383, 0.03805307671427727, 0.067717045545578, 0.09738101810216904, 0.12704499065876007, 0.1567089557647705, 0.18637293577194214, 0.21603690087795258, 0.245700865983963, 0.27536484599113464, 0.3050287961959839, 0.3346927762031555, 0.36435675621032715, 0.3940207362174988, 0.4236847162246704, 0.45334869623184204, 0.48301267623901367, 0.5126766562461853, 0.5423406362533569, 0.5720045566558838, 0.6016685366630554, 0.631332516670227, 0.6609964966773987, 0.6906604766845703, 0.7203244566917419, 0.7499884366989136, 0.7796523571014404, 0.8093163371086121, 0.8389803171157837, 0.8686442971229553, 0.898308277130127, 0.9279721975326538, 0.9576361775398254, 0.9873001575469971, 1.016964077949524, 1.0466281175613403, 1.0762920379638672, 1.1059560775756836, 1.1356199979782104, 1.1652840375900269, 1.1949479579925537, 1.2246119976043701, 1.254275918006897, 1.2839399576187134, 1.3136038780212402, 1.3432679176330566, 1.3729318380355835, 1.4025957584381104]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 8.0, 7.0, 11.0, 10.0, 13.0, 17.0, 18.0, 20.0, 24.0, 32.0, 28.0, 33.0, 30.0, 31.0, 33.0, 32.0, 31.0, 35.0, 45.0, 33.0, 38.0, 29.0, 38.0, 34.0, 32.0, 37.0, 33.0, 39.0, 31.0, 19.0, 21.0, 15.0, 26.0, 18.0, 17.0, 20.0, 6.0, 6.0, 13.0, 8.0, 6.0, 1.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.19357718527317047, -0.1878954917192459, -0.18221378326416016, -0.1765320897102356, -0.17085039615631104, -0.16516868770122528, -0.15948699414730072, -0.15380528569221497, -0.1481235921382904, -0.14244189858436584, -0.1367601901292801, -0.13107849657535553, -0.12539680302143097, -0.11971509456634521, -0.11403340101242065, -0.1083517000079155, -0.10267000645399094, -0.09698830544948578, -0.09130661189556122, -0.08562491089105606, -0.0799432098865509, -0.07426151633262634, -0.06857981532812119, -0.06289811432361603, -0.05721641704440117, -0.05153471976518631, -0.04585301876068115, -0.04017132148146629, -0.034489624202251434, -0.028807923197746277, -0.023126225918531418, -0.01744452491402626, -0.011762827634811401, -0.0060811289586126804, -0.0003994302824139595, 0.005282267928123474, 0.010963967069983482, 0.01664566621184349, 0.02232736349105835, 0.028009064495563507, 0.033690761774778366, 0.039372459053993225, 0.04505416005849838, 0.05073585733771324, 0.0564175546169281, 0.06209925562143326, 0.06778095662593842, 0.07346265017986298, 0.07914435118436813, 0.08482605218887329, 0.09050774574279785, 0.09618944674730301, 0.10187114775180817, 0.10755284130573273, 0.11323454231023788, 0.11891624331474304, 0.1245979368686676, 0.13027963042259216, 0.13596133887767792, 0.14164303243160248, 0.14732472598552704, 0.1530064344406128, 0.15868812799453735, 0.16436982154846191, 0.17005153000354767]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 8.0, 9.0, 20.0, 15.0, 30.0, 34.0, 51.0, 76.0, 123.0, 150.0, 246.0, 337.0, 480.0, 754.0, 1213.0, 1971.0, 3402.0, 6191.0, 12757.0, 31245.0, 4052242.0, 46928.0, 17086.0, 8082.0, 4262.0, 2421.0, 1458.0, 908.0, 567.0, 393.0, 281.0, 184.0, 118.0, 69.0, 52.0, 33.0, 33.0, 18.0, 14.0, 8.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.42724609375, -0.4155845642089844, -0.40392303466796875, -0.3922615051269531, -0.3805999755859375, -0.3689384460449219, -0.35727691650390625, -0.3456153869628906, -0.333953857421875, -0.3222923278808594, -0.31063079833984375, -0.2989692687988281, -0.2873077392578125, -0.2756462097167969, -0.26398468017578125, -0.2523231506347656, -0.24066162109375, -0.22900009155273438, -0.21733856201171875, -0.20567703247070312, -0.1940155029296875, -0.18235397338867188, -0.17069244384765625, -0.15903091430664062, -0.147369384765625, -0.13570785522460938, -0.12404632568359375, -0.11238479614257812, -0.1007232666015625, -0.08906173706054688, -0.07740020751953125, -0.06573867797851562, -0.0540771484375, -0.042415618896484375, -0.03075408935546875, -0.019092559814453125, -0.0074310302734375, 0.004230499267578125, 0.01589202880859375, 0.027553558349609375, 0.039215087890625, 0.050876617431640625, 0.06253814697265625, 0.07419967651367188, 0.0858612060546875, 0.09752273559570312, 0.10918426513671875, 0.12084579467773438, 0.13250732421875, 0.14416885375976562, 0.15583038330078125, 0.16749191284179688, 0.1791534423828125, 0.19081497192382812, 0.20247650146484375, 0.21413803100585938, 0.225799560546875, 0.23746109008789062, 0.24912261962890625, 0.2607841491699219, 0.2724456787109375, 0.2841072082519531, 0.29576873779296875, 0.3074302673339844, 0.319091796875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 9.0, 10.0, 8.0, 17.0, 18.0, 17.0, 38.0, 50.0, 47.0, 36.0, 53.0, 51.0, 50.0, 61.0, 66.0, 63.0, 58.0, 48.0, 61.0, 43.0, 50.0, 33.0, 19.0, 16.0, 19.0, 12.0, 9.0, 10.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02142333984375, -0.020842552185058594, -0.020261764526367188, -0.01968097686767578, -0.019100189208984375, -0.01851940155029297, -0.017938613891601562, -0.017357826232910156, -0.01677703857421875, -0.016196250915527344, -0.015615463256835938, -0.015034675598144531, -0.014453887939453125, -0.013873100280761719, -0.013292312622070312, -0.012711524963378906, -0.0121307373046875, -0.011549949645996094, -0.010969161987304688, -0.010388374328613281, -0.009807586669921875, -0.009226799011230469, -0.008646011352539062, -0.008065223693847656, -0.00748443603515625, -0.006903648376464844, -0.0063228607177734375, -0.005742073059082031, -0.005161285400390625, -0.004580497741699219, -0.0039997100830078125, -0.0034189224243164062, -0.002838134765625, -0.0022573471069335938, -0.0016765594482421875, -0.0010957717895507812, -0.000514984130859375, 6.580352783203125e-05, 0.0006465911865234375, 0.0012273788452148438, 0.00180816650390625, 0.0023889541625976562, 0.0029697418212890625, 0.0035505294799804688, 0.004131317138671875, 0.004712104797363281, 0.0052928924560546875, 0.005873680114746094, 0.0064544677734375, 0.007035255432128906, 0.0076160430908203125, 0.008196830749511719, 0.008777618408203125, 0.009358406066894531, 0.009939193725585938, 0.010519981384277344, 0.01110076904296875, 0.011681556701660156, 0.012262344360351562, 0.012843132019042969, 0.013423919677734375, 0.014004707336425781, 0.014585494995117188, 0.015166282653808594, 0.0157470703125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 9.0, 14.0, 17.0, 74.0, 504.0, 6458.0, 4079072.0, 104321.0, 3318.0, 278.0, 48.0, 25.0, 15.0, 15.0, 15.0, 6.0, 10.0, 9.0, 8.0, 1.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5390625, -0.5221633911132812, -0.5052642822265625, -0.48836517333984375, -0.471466064453125, -0.45456695556640625, -0.4376678466796875, -0.42076873779296875, -0.40386962890625, -0.38697052001953125, -0.3700714111328125, -0.35317230224609375, -0.336273193359375, -0.31937408447265625, -0.3024749755859375, -0.28557586669921875, -0.2686767578125, -0.25177764892578125, -0.2348785400390625, -0.21797943115234375, -0.201080322265625, -0.18418121337890625, -0.1672821044921875, -0.15038299560546875, -0.13348388671875, -0.11658477783203125, -0.0996856689453125, -0.08278656005859375, -0.065887451171875, -0.04898834228515625, -0.0320892333984375, -0.01519012451171875, 0.001708984375, 0.01860809326171875, 0.0355072021484375, 0.05240631103515625, 0.069305419921875, 0.08620452880859375, 0.1031036376953125, 0.12000274658203125, 0.13690185546875, 0.15380096435546875, 0.1707000732421875, 0.18759918212890625, 0.204498291015625, 0.22139739990234375, 0.2382965087890625, 0.25519561767578125, 0.2720947265625, 0.28899383544921875, 0.3058929443359375, 0.32279205322265625, 0.339691162109375, 0.35659027099609375, 0.3734893798828125, 0.39038848876953125, 0.40728759765625, 0.42418670654296875, 0.4410858154296875, 0.45798492431640625, 0.474884033203125, 0.49178314208984375, 0.5086822509765625, 0.5255813598632812, 0.54248046875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 7.0, 7.0, 11.0, 5.0, 5.0, 3.0, 13.0, 12.0, 26.0, 68.0, 391.0, 3105.0, 224.0, 42.0, 19.0, 18.0, 13.0, 10.0, 7.0, 10.0, 10.0, 10.0, 8.0, 5.0, 6.0, 1.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.04345703125, -0.04226970672607422, -0.04108238220214844, -0.039895057678222656, -0.038707733154296875, -0.037520408630371094, -0.03633308410644531, -0.03514575958251953, -0.03395843505859375, -0.03277111053466797, -0.03158378601074219, -0.030396461486816406, -0.029209136962890625, -0.028021812438964844, -0.026834487915039062, -0.02564716339111328, -0.0244598388671875, -0.02327251434326172, -0.022085189819335938, -0.020897865295410156, -0.019710540771484375, -0.018523216247558594, -0.017335891723632812, -0.01614856719970703, -0.01496124267578125, -0.013773918151855469, -0.012586593627929688, -0.011399269104003906, -0.010211944580078125, -0.009024620056152344, -0.007837295532226562, -0.006649971008300781, -0.005462646484375, -0.004275321960449219, -0.0030879974365234375, -0.0019006729125976562, -0.000713348388671875, 0.00047397613525390625, 0.0016613006591796875, 0.0028486251831054688, 0.00403594970703125, 0.005223274230957031, 0.0064105987548828125, 0.007597923278808594, 0.008785247802734375, 0.009972572326660156, 0.011159896850585938, 0.012347221374511719, 0.0135345458984375, 0.014721870422363281, 0.015909194946289062, 0.017096519470214844, 0.018283843994140625, 0.019471168518066406, 0.020658493041992188, 0.02184581756591797, 0.02303314208984375, 0.02422046661376953, 0.025407791137695312, 0.026595115661621094, 0.027782440185546875, 0.028969764709472656, 0.030157089233398438, 0.03134441375732422, 0.03253173828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 14.0, 15.0, 14.0, 25.0, 31.0, 38.0, 74.0, 98.0, 151.0, 125.0, 85.0, 68.0, 64.0, 35.0, 30.0, 29.0, 18.0, 11.0, 12.0, 6.0, 6.0, 5.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05711132287979126, -0.054692450910806656, -0.05227358266711235, -0.04985471069812775, -0.04743584245443344, -0.04501697048544884, -0.04259809851646423, -0.04017923027276993, -0.03776036202907562, -0.03534149006009102, -0.03292262181639671, -0.03050374984741211, -0.028084881603717804, -0.0256660096347332, -0.023247139528393745, -0.02082826942205429, -0.018409397453069687, -0.015990527346730232, -0.013571657240390778, -0.011152786202728748, -0.008733916096389294, -0.006315045990049839, -0.0038961749523878098, -0.001477304846048355, 0.0009415652602910995, 0.003360435599461198, 0.005779305938631296, 0.008198176510632038, 0.010617046616971493, 0.013035916723310947, 0.015454787760972977, 0.01787365786731243, 0.020292527973651886, 0.02271139807999134, 0.025130268186330795, 0.0275491401553154, 0.029968008399009705, 0.03238688036799431, 0.03480575233697891, 0.03722462058067322, 0.03964348882436752, 0.04206236079335213, 0.04448122903704643, 0.046900101006031036, 0.04931896924972534, 0.051737841218709946, 0.05415671318769455, 0.056575581431388855, 0.05899445340037346, 0.06141332536935806, 0.06383219361305237, 0.06625106185674667, 0.06866993755102158, 0.07108880579471588, 0.07350767403841019, 0.07592654228210449, 0.0783454179763794, 0.0807642862200737, 0.0831831619143486, 0.08560203015804291, 0.08802089840173721, 0.09043976664543152, 0.09285864233970642, 0.09527751058340073, 0.09769637882709503]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 3.0, 11.0, 8.0, 16.0, 13.0, 13.0, 21.0, 28.0, 26.0, 23.0, 29.0, 35.0, 34.0, 30.0, 43.0, 34.0, 40.0, 39.0, 45.0, 47.0, 43.0, 48.0, 33.0, 39.0, 36.0, 37.0, 27.0, 34.0, 28.0, 26.0, 21.0, 16.0, 12.0, 8.0, 12.0, 8.0, 4.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.043136149644851685, -0.041827425360679626, -0.04051870107650757, -0.03920997679233551, -0.03790125250816345, -0.036592528223991394, -0.035283803939819336, -0.03397507965564728, -0.03266635537147522, -0.03135763108730316, -0.030048906803131104, -0.028740182518959045, -0.027431458234786987, -0.02612273395061493, -0.02481400966644287, -0.023505285382270813, -0.022196561098098755, -0.020887836813926697, -0.01957911252975464, -0.01827038824558258, -0.016961663961410522, -0.015652939677238464, -0.014344215393066406, -0.013035491108894348, -0.01172676682472229, -0.010418042540550232, -0.009109318256378174, -0.007800593972206116, -0.006491869688034058, -0.0051831454038619995, -0.0038744211196899414, -0.0025656968355178833, -0.0012569762766361237, 5.174800753593445e-05, 0.0013604722917079926, 0.0026691965758800507, 0.003977920860052109, 0.005286645144224167, 0.006595369428396225, 0.007904093712568283, 0.009212817996740341, 0.0105215422809124, 0.011830266565084457, 0.013138990849256516, 0.014447715133428574, 0.01575643941760063, 0.01706516370177269, 0.018373887985944748, 0.019682612270116806, 0.020991336554288864, 0.022300060838460922, 0.02360878512263298, 0.02491750940680504, 0.026226233690977097, 0.027534957975149155, 0.028843682259321213, 0.03015240654349327, 0.03146113082766533, 0.03276985511183739, 0.034078579396009445, 0.0353873036801815, 0.03669602796435356, 0.03800475224852562, 0.03931347653269768, 0.040622200816869736]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 11.0, 17.0, 25.0, 39.0, 72.0, 104.0, 221.0, 395.0, 820.0, 2036.0, 6472.0, 31449.0, 291263.0, 652420.0, 49386.0, 9158.0, 2635.0, 1005.0, 487.0, 234.0, 126.0, 70.0, 50.0, 25.0, 11.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01161956787109375, -0.011314749717712402, -0.011009931564331055, -0.010705113410949707, -0.01040029525756836, -0.010095477104187012, -0.009790658950805664, -0.009485840797424316, -0.009181022644042969, -0.008876204490661621, -0.008571386337280273, -0.008266568183898926, -0.007961750030517578, -0.0076569318771362305, -0.007352113723754883, -0.007047295570373535, -0.0067424774169921875, -0.00643765926361084, -0.006132841110229492, -0.0058280229568481445, -0.005523204803466797, -0.005218386650085449, -0.0049135684967041016, -0.004608750343322754, -0.004303932189941406, -0.003999114036560059, -0.003694295883178711, -0.0033894777297973633, -0.0030846595764160156, -0.002779841423034668, -0.0024750232696533203, -0.0021702051162719727, -0.001865386962890625, -0.0015605688095092773, -0.0012557506561279297, -0.000950932502746582, -0.0006461143493652344, -0.0003412961959838867, -3.647804260253906e-05, 0.0002683401107788086, 0.0005731582641601562, 0.0008779764175415039, 0.0011827945709228516, 0.0014876127243041992, 0.0017924308776855469, 0.0020972490310668945, 0.002402067184448242, 0.00270688533782959, 0.0030117034912109375, 0.003316521644592285, 0.003621339797973633, 0.0039261579513549805, 0.004230976104736328, 0.004535794258117676, 0.0048406124114990234, 0.005145430564880371, 0.005450248718261719, 0.005755066871643066, 0.006059885025024414, 0.006364703178405762, 0.006669521331787109, 0.006974339485168457, 0.007279157638549805, 0.007583975791931152, 0.0078887939453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 14.0, 15.0, 18.0, 17.0, 26.0, 33.0, 43.0, 46.0, 39.0, 62.0, 56.0, 68.0, 71.0, 76.0, 66.0, 58.0, 42.0, 57.0, 41.0, 41.0, 34.0, 19.0, 19.0, 9.0, 13.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042694091796875, -0.04150104522705078, -0.04030799865722656, -0.039114952087402344, -0.037921905517578125, -0.036728858947753906, -0.03553581237792969, -0.03434276580810547, -0.03314971923828125, -0.03195667266845703, -0.030763626098632812, -0.029570579528808594, -0.028377532958984375, -0.027184486389160156, -0.025991439819335938, -0.02479839324951172, -0.0236053466796875, -0.02241230010986328, -0.021219253540039062, -0.020026206970214844, -0.018833160400390625, -0.017640113830566406, -0.016447067260742188, -0.015254020690917969, -0.01406097412109375, -0.012867927551269531, -0.011674880981445312, -0.010481834411621094, -0.009288787841796875, -0.008095741271972656, -0.0069026947021484375, -0.005709648132324219, -0.0045166015625, -0.0033235549926757812, -0.0021305084228515625, -0.0009374618530273438, 0.000255584716796875, 0.0014486312866210938, 0.0026416778564453125, 0.0038347244262695312, 0.00502777099609375, 0.006220817565917969, 0.0074138641357421875, 0.008606910705566406, 0.009799957275390625, 0.010993003845214844, 0.012186050415039062, 0.013379096984863281, 0.0145721435546875, 0.01576519012451172, 0.016958236694335938, 0.018151283264160156, 0.019344329833984375, 0.020537376403808594, 0.021730422973632812, 0.02292346954345703, 0.02411651611328125, 0.02530956268310547, 0.026502609252929688, 0.027695655822753906, 0.028888702392578125, 0.030081748962402344, 0.03127479553222656, 0.03246784210205078, 0.033660888671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 15.0, 11.0, 21.0, 19.0, 33.0, 42.0, 54.0, 72.0, 101.0, 115.0, 202.0, 344.0, 915.0, 3095.0, 15484.0, 149999.0, 812889.0, 54538.0, 7572.0, 1715.0, 533.0, 257.0, 145.0, 93.0, 83.0, 52.0, 40.0, 17.0, 24.0, 17.0, 15.0, 9.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023040771484375, -0.0022280514240264893, -0.0021520256996154785, -0.0020759999752044678, -0.001999974250793457, -0.0019239485263824463, -0.0018479228019714355, -0.0017718970775604248, -0.001695871353149414, -0.0016198456287384033, -0.0015438199043273926, -0.0014677941799163818, -0.001391768455505371, -0.0013157427310943604, -0.0012397170066833496, -0.0011636912822723389, -0.0010876655578613281, -0.0010116398334503174, -0.0009356141090393066, -0.0008595883846282959, -0.0007835626602172852, -0.0007075369358062744, -0.0006315112113952637, -0.0005554854869842529, -0.0004794597625732422, -0.00040343403816223145, -0.0003274083137512207, -0.00025138258934020996, -0.00017535686492919922, -9.933114051818848e-05, -2.3305416107177734e-05, 5.272030830383301e-05, 0.00012874603271484375, 0.0002047717571258545, 0.00028079748153686523, 0.000356823205947876, 0.0004328489303588867, 0.0005088746547698975, 0.0005849003791809082, 0.0006609261035919189, 0.0007369518280029297, 0.0008129775524139404, 0.0008890032768249512, 0.0009650290012359619, 0.0010410547256469727, 0.0011170804500579834, 0.0011931061744689941, 0.0012691318988800049, 0.0013451576232910156, 0.0014211833477020264, 0.0014972090721130371, 0.0015732347965240479, 0.0016492605209350586, 0.0017252862453460693, 0.00180131196975708, 0.0018773376941680908, 0.0019533634185791016, 0.0020293891429901123, 0.002105414867401123, 0.002181440591812134, 0.0022574663162231445, 0.0023334920406341553, 0.002409517765045166, 0.0024855434894561768, 0.0025615692138671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 7.0, 13.0, 16.0, 17.0, 22.0, 22.0, 30.0, 32.0, 32.0, 55.0, 39.0, 62.0, 54.0, 41.0, 39.0, 64.0, 54.0, 46.0, 52.0, 41.0, 31.0, 37.0, 35.0, 39.0, 18.0, 22.0, 10.0, 12.0, 12.0, 12.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059051513671875, -0.05709981918334961, -0.05514812469482422, -0.05319643020629883, -0.05124473571777344, -0.04929304122924805, -0.047341346740722656, -0.045389652252197266, -0.043437957763671875, -0.041486263275146484, -0.039534568786621094, -0.0375828742980957, -0.03563117980957031, -0.03367948532104492, -0.03172779083251953, -0.02977609634399414, -0.02782440185546875, -0.02587270736694336, -0.02392101287841797, -0.021969318389892578, -0.020017623901367188, -0.018065929412841797, -0.016114234924316406, -0.014162540435791016, -0.012210845947265625, -0.010259151458740234, -0.008307456970214844, -0.006355762481689453, -0.0044040679931640625, -0.002452373504638672, -0.0005006790161132812, 0.0014510154724121094, 0.0034027099609375, 0.005354404449462891, 0.007306098937988281, 0.009257793426513672, 0.011209487915039062, 0.013161182403564453, 0.015112876892089844, 0.017064571380615234, 0.019016265869140625, 0.020967960357666016, 0.022919654846191406, 0.024871349334716797, 0.026823043823242188, 0.028774738311767578, 0.03072643280029297, 0.03267812728881836, 0.03462982177734375, 0.03658151626586914, 0.03853321075439453, 0.04048490524291992, 0.04243659973144531, 0.0443882942199707, 0.046339988708496094, 0.048291683197021484, 0.050243377685546875, 0.052195072174072266, 0.054146766662597656, 0.05609846115112305, 0.05805015563964844, 0.06000185012817383, 0.06195354461669922, 0.06390523910522461, 0.06585693359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 9.0, 11.0, 11.0, 15.0, 27.0, 44.0, 39.0, 52.0, 97.0, 112.0, 166.0, 251.0, 313.0, 475.0, 703.0, 1106.0, 1678.0, 2913.0, 5177.0, 10096.0, 23000.0, 72413.0, 688233.0, 174999.0, 36027.0, 14095.0, 6755.0, 3570.0, 2104.0, 1295.0, 878.0, 526.0, 392.0, 248.0, 193.0, 151.0, 94.0, 82.0, 54.0, 41.0, 34.0, 20.0, 14.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.415346145629883e-05, -3.314018249511719e-05, -3.212690353393555e-05, -3.1113624572753906e-05, -3.0100345611572266e-05, -2.9087066650390625e-05, -2.8073787689208984e-05, -2.7060508728027344e-05, -2.6047229766845703e-05, -2.5033950805664062e-05, -2.4020671844482422e-05, -2.300739288330078e-05, -2.199411392211914e-05, -2.09808349609375e-05, -1.996755599975586e-05, -1.895427703857422e-05, -1.7940998077392578e-05, -1.6927719116210938e-05, -1.5914440155029297e-05, -1.4901161193847656e-05, -1.3887882232666016e-05, -1.2874603271484375e-05, -1.1861324310302734e-05, -1.0848045349121094e-05, -9.834766387939453e-06, -8.821487426757812e-06, -7.808208465576172e-06, -6.794929504394531e-06, -5.781650543212891e-06, -4.76837158203125e-06, -3.7550926208496094e-06, -2.7418136596679688e-06, -1.7285346984863281e-06, -7.152557373046875e-07, 2.980232238769531e-07, 1.3113021850585938e-06, 2.3245811462402344e-06, 3.337860107421875e-06, 4.351139068603516e-06, 5.364418029785156e-06, 6.377696990966797e-06, 7.3909759521484375e-06, 8.404254913330078e-06, 9.417533874511719e-06, 1.043081283569336e-05, 1.1444091796875e-05, 1.245737075805664e-05, 1.3470649719238281e-05, 1.4483928680419922e-05, 1.5497207641601562e-05, 1.6510486602783203e-05, 1.7523765563964844e-05, 1.8537044525146484e-05, 1.9550323486328125e-05, 2.0563602447509766e-05, 2.1576881408691406e-05, 2.2590160369873047e-05, 2.3603439331054688e-05, 2.4616718292236328e-05, 2.562999725341797e-05, 2.664327621459961e-05, 2.765655517578125e-05, 2.866983413696289e-05, 2.968311309814453e-05, 3.069639205932617e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 1.0, 4.0, 12.0, 15.0, 29.0, 24.0, 105.0, 63.0, 182.0, 97.0, 92.0, 177.0, 53.0, 59.0, 25.0, 26.0, 7.0, 6.0, 9.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.9408762454986572e-06, -1.8551945686340332e-06, -1.7695128917694092e-06, -1.6838312149047852e-06, -1.5981495380401611e-06, -1.5124678611755371e-06, -1.426786184310913e-06, -1.341104507446289e-06, -1.255422830581665e-06, -1.169741153717041e-06, -1.084059476852417e-06, -9.98377799987793e-07, -9.126961231231689e-07, -8.270144462585449e-07, -7.413327693939209e-07, -6.556510925292969e-07, -5.699694156646729e-07, -4.842877388000488e-07, -3.986060619354248e-07, -3.129243850708008e-07, -2.2724270820617676e-07, -1.4156103134155273e-07, -5.587935447692871e-08, 2.9802322387695312e-08, 1.1548399925231934e-07, 2.0116567611694336e-07, 2.868473529815674e-07, 3.725290298461914e-07, 4.5821070671081543e-07, 5.438923835754395e-07, 6.295740604400635e-07, 7.152557373046875e-07, 8.009374141693115e-07, 8.866190910339355e-07, 9.723007678985596e-07, 1.0579824447631836e-06, 1.1436641216278076e-06, 1.2293457984924316e-06, 1.3150274753570557e-06, 1.4007091522216797e-06, 1.4863908290863037e-06, 1.5720725059509277e-06, 1.6577541828155518e-06, 1.7434358596801758e-06, 1.8291175365447998e-06, 1.914799213409424e-06, 2.000480890274048e-06, 2.086162567138672e-06, 2.171844244003296e-06, 2.25752592086792e-06, 2.343207597732544e-06, 2.428889274597168e-06, 2.514570951461792e-06, 2.600252628326416e-06, 2.68593430519104e-06, 2.771615982055664e-06, 2.857297658920288e-06, 2.942979335784912e-06, 3.028661012649536e-06, 3.11434268951416e-06, 3.200024366378784e-06, 3.285706043243408e-06, 3.3713877201080322e-06, 3.4570693969726562e-06]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 13.0, 19.0, 21.0, 38.0, 44.0, 65.0, 88.0, 135.0, 227.0, 291.0, 464.0, 702.0, 1188.0, 1717.0, 2861.0, 4748.0, 9671.0, 19427.0, 51340.0, 538071.0, 336828.0, 42949.0, 17150.0, 8314.0, 4864.0, 2549.0, 1634.0, 1057.0, 725.0, 404.0, 303.0, 191.0, 147.0, 87.0, 50.0, 52.0, 27.0, 22.0, 21.0, 9.0, 9.0, 1.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5212764739990234e-05, -2.442300319671631e-05, -2.3633241653442383e-05, -2.2843480110168457e-05, -2.205371856689453e-05, -2.1263957023620605e-05, -2.047419548034668e-05, -1.9684433937072754e-05, -1.8894672393798828e-05, -1.8104910850524902e-05, -1.7315149307250977e-05, -1.652538776397705e-05, -1.5735626220703125e-05, -1.49458646774292e-05, -1.4156103134155273e-05, -1.3366341590881348e-05, -1.2576580047607422e-05, -1.1786818504333496e-05, -1.099705696105957e-05, -1.0207295417785645e-05, -9.417533874511719e-06, -8.627772331237793e-06, -7.838010787963867e-06, -7.048249244689941e-06, -6.258487701416016e-06, -5.46872615814209e-06, -4.678964614868164e-06, -3.889203071594238e-06, -3.0994415283203125e-06, -2.3096799850463867e-06, -1.519918441772461e-06, -7.301568984985352e-07, 5.960464477539063e-08, 8.493661880493164e-07, 1.6391277313232422e-06, 2.428889274597168e-06, 3.2186508178710938e-06, 4.0084123611450195e-06, 4.798173904418945e-06, 5.587935447692871e-06, 6.377696990966797e-06, 7.167458534240723e-06, 7.957220077514648e-06, 8.746981620788574e-06, 9.5367431640625e-06, 1.0326504707336426e-05, 1.1116266250610352e-05, 1.1906027793884277e-05, 1.2695789337158203e-05, 1.3485550880432129e-05, 1.4275312423706055e-05, 1.506507396697998e-05, 1.5854835510253906e-05, 1.6644597053527832e-05, 1.7434358596801758e-05, 1.8224120140075684e-05, 1.901388168334961e-05, 1.9803643226623535e-05, 2.059340476989746e-05, 2.1383166313171387e-05, 2.2172927856445312e-05, 2.2962689399719238e-05, 2.3752450942993164e-05, 2.454221248626709e-05, 2.5331974029541016e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 7.0, 5.0, 13.0, 13.0, 11.0, 12.0, 30.0, 32.0, 52.0, 83.0, 176.0, 270.0, 92.0, 45.0, 37.0, 27.0, 14.0, 15.0, 13.0, 6.0, 6.0, 5.0, 2.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.940696716308594e-06, -8.711591362953186e-06, -8.482486009597778e-06, -8.25338065624237e-06, -8.024275302886963e-06, -7.795169949531555e-06, -7.5660645961761475e-06, -7.33695924282074e-06, -7.107853889465332e-06, -6.878748536109924e-06, -6.649643182754517e-06, -6.420537829399109e-06, -6.191432476043701e-06, -5.9623271226882935e-06, -5.733221769332886e-06, -5.504116415977478e-06, -5.27501106262207e-06, -5.045905709266663e-06, -4.816800355911255e-06, -4.587695002555847e-06, -4.3585896492004395e-06, -4.129484295845032e-06, -3.900378942489624e-06, -3.6712735891342163e-06, -3.4421682357788086e-06, -3.213062882423401e-06, -2.983957529067993e-06, -2.7548521757125854e-06, -2.5257468223571777e-06, -2.29664146900177e-06, -2.0675361156463623e-06, -1.8384307622909546e-06, -1.6093254089355469e-06, -1.3802200555801392e-06, -1.1511147022247314e-06, -9.220093488693237e-07, -6.92903995513916e-07, -4.637986421585083e-07, -2.3469328880310059e-07, -5.587935447692871e-09, 2.2351741790771484e-07, 4.5262277126312256e-07, 6.817281246185303e-07, 9.10833477973938e-07, 1.1399388313293457e-06, 1.3690441846847534e-06, 1.5981495380401611e-06, 1.8272548913955688e-06, 2.0563602447509766e-06, 2.2854655981063843e-06, 2.514570951461792e-06, 2.7436763048171997e-06, 2.9727816581726074e-06, 3.201887011528015e-06, 3.430992364883423e-06, 3.6600977182388306e-06, 3.889203071594238e-06, 4.118308424949646e-06, 4.347413778305054e-06, 4.5765191316604614e-06, 4.805624485015869e-06, 5.034729838371277e-06, 5.2638351917266846e-06, 5.492940545082092e-06, 5.7220458984375e-06]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 10.0, 7.0, 12.0, 35.0, 41.0, 96.0, 250.0, 307.0, 129.0, 63.0, 23.0, 12.0, 11.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04296470433473587, -0.03970448672771454, -0.036444272845983505, -0.03318405523896217, -0.02992383949458599, -0.02666362375020981, -0.023403406143188477, -0.020143190398812294, -0.01688297465443611, -0.013622758910059929, -0.010362542234361172, -0.0071023255586624146, -0.003842109814286232, -0.0005818940699100494, 0.0026783235371112823, 0.005938539281487465, 0.009198755025863647, 0.01245897077023983, 0.015719186514616013, 0.018979404121637344, 0.022239619866013527, 0.02549983561038971, 0.02876005321741104, 0.03202027082443237, 0.035280484706163406, 0.03854070231318474, 0.04180091619491577, 0.0450611338019371, 0.048321351408958435, 0.05158156529068947, 0.0548417828977108, 0.058101996779441833, 0.06136222183704376, 0.0646224394440651, 0.06788265705108643, 0.07114286720752716, 0.07440308481454849, 0.07766330242156982, 0.08092352002859116, 0.08418373763561249, 0.08744394779205322, 0.09070416539907455, 0.09396438300609589, 0.09722459316253662, 0.10048481076955795, 0.10374502837657928, 0.10700524598360062, 0.11026546359062195, 0.11352568119764328, 0.11678589880466461, 0.12004611641168594, 0.12330633401870728, 0.126566544175148, 0.12982675433158875, 0.13308697938919067, 0.1363471895456314, 0.13960741460323334, 0.14286762475967407, 0.146127849817276, 0.14938805997371674, 0.15264828503131866, 0.1559084951877594, 0.15916872024536133, 0.16242893040180206, 0.1656891405582428]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 17.0, 14.0, 16.0, 15.0, 20.0, 33.0, 34.0, 39.0, 34.0, 48.0, 46.0, 54.0, 57.0, 57.0, 59.0, 61.0, 58.0, 45.0, 46.0, 48.0, 38.0, 36.0, 31.0, 24.0, 18.0, 14.0, 11.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029998144134879112, -0.029059167951345444, -0.028120189905166626, -0.027181213721632957, -0.02624223567545414, -0.02530325949192047, -0.024364281445741653, -0.023425305262207985, -0.022486329078674316, -0.021547352895140648, -0.02060837484896183, -0.01966939866542816, -0.018730420619249344, -0.017791444435715675, -0.016852468252182007, -0.01591349020600319, -0.014974512159824371, -0.014035535044968128, -0.013096557930111885, -0.012157581746578217, -0.011218603700399399, -0.01027962751686573, -0.009340650402009487, -0.008401673287153244, -0.007462696172297001, -0.006523719057440758, -0.005584741942584515, -0.004645765293389559, -0.0037067881785333157, -0.0027678110636770725, -0.0018288344144821167, -0.0008898572996258736, 4.911981523036957e-05, 0.0009880968136712909, 0.0019270738121122122, 0.0028660506941378117, 0.003805027808994055, 0.004744004923850298, 0.005682981573045254, 0.006621958687901497, 0.00756093580275774, 0.008499912917613983, 0.009438890032470226, 0.01037786714732647, 0.011316843330860138, 0.012255821377038956, 0.013194797560572624, 0.014133774675428867, 0.01507275179028511, 0.01601172797381878, 0.016950706019997597, 0.017889682203531265, 0.018828660249710083, 0.01976763643324375, 0.02070661261677742, 0.021645590662956238, 0.022584568709135056, 0.023523544892668724, 0.024462522938847542, 0.02540149912238121, 0.026340477168560028, 0.027279453352093697, 0.028218429535627365, 0.029157407581806183, 0.03009638376533985]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 5.0, 3.0, 8.0, 6.0, 15.0, 10.0, 13.0, 16.0, 20.0, 10.0, 19.0, 19.0, 28.0, 28.0, 31.0, 32.0, 43.0, 82.0, 1168.0, 46023.0, 968844.0, 30922.0, 798.0, 72.0, 45.0, 38.0, 37.0, 30.0, 29.0, 15.0, 14.0, 16.0, 5.0, 9.0, 16.0, 10.0, 7.0, 6.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.13232421875, -0.12824630737304688, -0.12416839599609375, -0.12009048461914062, -0.1160125732421875, -0.11193466186523438, -0.10785675048828125, -0.10377883911132812, -0.099700927734375, -0.09562301635742188, -0.09154510498046875, -0.08746719360351562, -0.0833892822265625, -0.07931137084960938, -0.07523345947265625, -0.07115554809570312, -0.06707763671875, -0.06299972534179688, -0.05892181396484375, -0.054843902587890625, -0.0507659912109375, -0.046688079833984375, -0.04261016845703125, -0.038532257080078125, -0.034454345703125, -0.030376434326171875, -0.02629852294921875, -0.022220611572265625, -0.0181427001953125, -0.014064788818359375, -0.00998687744140625, -0.005908966064453125, -0.0018310546875, 0.002246856689453125, 0.00632476806640625, 0.010402679443359375, 0.0144805908203125, 0.018558502197265625, 0.02263641357421875, 0.026714324951171875, 0.030792236328125, 0.034870147705078125, 0.03894805908203125, 0.043025970458984375, 0.0471038818359375, 0.051181793212890625, 0.05525970458984375, 0.059337615966796875, 0.06341552734375, 0.06749343872070312, 0.07157135009765625, 0.07564926147460938, 0.0797271728515625, 0.08380508422851562, 0.08788299560546875, 0.09196090698242188, 0.096038818359375, 0.10011672973632812, 0.10419464111328125, 0.10827255249023438, 0.1123504638671875, 0.11642837524414062, 0.12050628662109375, 0.12458419799804688, 0.128662109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 33.0, 92.0, 201.0, 296.0, 231.0, 126.0, 34.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020751953125, -0.0017027854919433594, -0.0013303756713867188, -0.0009579658508300781, -0.0005855560302734375, -0.00021314620971679688, 0.00015926361083984375, 0.0005316734313964844, 0.000904083251953125, 0.0012764930725097656, 0.0016489028930664062, 0.002021312713623047, 0.0023937225341796875, 0.002766132354736328, 0.0031385421752929688, 0.0035109519958496094, 0.00388336181640625, 0.004255771636962891, 0.004628181457519531, 0.005000591278076172, 0.0053730010986328125, 0.005745410919189453, 0.006117820739746094, 0.006490230560302734, 0.006862640380859375, 0.007235050201416016, 0.007607460021972656, 0.007979869842529297, 0.008352279663085938, 0.008724689483642578, 0.009097099304199219, 0.00946950912475586, 0.0098419189453125, 0.01021432876586914, 0.010586738586425781, 0.010959148406982422, 0.011331558227539062, 0.011703968048095703, 0.012076377868652344, 0.012448787689208984, 0.012821197509765625, 0.013193607330322266, 0.013566017150878906, 0.013938426971435547, 0.014310836791992188, 0.014683246612548828, 0.015055656433105469, 0.01542806625366211, 0.01580047607421875, 0.01617288589477539, 0.01654529571533203, 0.016917705535888672, 0.017290115356445312, 0.017662525177001953, 0.018034934997558594, 0.018407344818115234, 0.018779754638671875, 0.019152164459228516, 0.019524574279785156, 0.019896984100341797, 0.020269393920898438, 0.020641803741455078, 0.02101421356201172, 0.02138662338256836, 0.021759033203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 8.0, 7.0, 17.0, 26.0, 37.0, 65.0, 114.0, 139.0, 246.0, 428.0, 712.0, 1341.0, 2625.0, 5328.0, 10795.0, 25065.0, 69688.0, 366756.0, 441803.0, 74520.0, 26185.0, 11310.0, 5389.0, 2643.0, 1425.0, 762.0, 425.0, 263.0, 152.0, 91.0, 58.0, 50.0, 28.0, 18.0, 10.0, 9.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0127716064453125, -0.012384891510009766, -0.011998176574707031, -0.011611461639404297, -0.011224746704101562, -0.010838031768798828, -0.010451316833496094, -0.01006460189819336, -0.009677886962890625, -0.00929117202758789, -0.008904457092285156, -0.008517742156982422, -0.008131027221679688, -0.007744312286376953, -0.007357597351074219, -0.006970882415771484, -0.00658416748046875, -0.006197452545166016, -0.005810737609863281, -0.005424022674560547, -0.0050373077392578125, -0.004650592803955078, -0.004263877868652344, -0.0038771629333496094, -0.003490447998046875, -0.0031037330627441406, -0.0027170181274414062, -0.002330303192138672, -0.0019435882568359375, -0.0015568733215332031, -0.0011701583862304688, -0.0007834434509277344, -0.000396728515625, -1.0013580322265625e-05, 0.00037670135498046875, 0.0007634162902832031, 0.0011501312255859375, 0.0015368461608886719, 0.0019235610961914062, 0.0023102760314941406, 0.002696990966796875, 0.0030837059020996094, 0.0034704208374023438, 0.003857135772705078, 0.0042438507080078125, 0.004630565643310547, 0.005017280578613281, 0.005403995513916016, 0.00579071044921875, 0.006177425384521484, 0.006564140319824219, 0.006950855255126953, 0.0073375701904296875, 0.007724285125732422, 0.008111000061035156, 0.00849771499633789, 0.008884429931640625, 0.00927114486694336, 0.009657859802246094, 0.010044574737548828, 0.010431289672851562, 0.010818004608154297, 0.011204719543457031, 0.011591434478759766, 0.0119781494140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 15.0, 14.0, 16.0, 17.0, 18.0, 29.0, 29.0, 24.0, 31.0, 38.0, 43.0, 72.0, 64.0, 79.0, 72.0, 68.0, 64.0, 51.0, 52.0, 32.0, 33.0, 26.0, 23.0, 18.0, 9.0, 13.0, 11.0, 8.0, 6.0, 6.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.005428314208984375, -0.005263984203338623, -0.005099654197692871, -0.004935324192047119, -0.004770994186401367, -0.004606664180755615, -0.004442334175109863, -0.004278004169464111, -0.004113674163818359, -0.003949344158172607, -0.0037850141525268555, -0.0036206841468811035, -0.0034563541412353516, -0.0032920241355895996, -0.0031276941299438477, -0.0029633641242980957, -0.0027990341186523438, -0.002634704113006592, -0.00247037410736084, -0.002306044101715088, -0.002141714096069336, -0.001977384090423584, -0.001813054084777832, -0.00164872407913208, -0.0014843940734863281, -0.0013200640678405762, -0.0011557340621948242, -0.0009914040565490723, -0.0008270740509033203, -0.0006627440452575684, -0.0004984140396118164, -0.00033408403396606445, -0.0001697540283203125, -5.424022674560547e-06, 0.0001589059829711914, 0.00032323598861694336, 0.0004875659942626953, 0.0006518959999084473, 0.0008162260055541992, 0.0009805560111999512, 0.0011448860168457031, 0.001309216022491455, 0.001473546028137207, 0.001637876033782959, 0.001802206039428711, 0.001966536045074463, 0.002130866050720215, 0.002295196056365967, 0.0024595260620117188, 0.0026238560676574707, 0.0027881860733032227, 0.0029525160789489746, 0.0031168460845947266, 0.0032811760902404785, 0.0034455060958862305, 0.0036098361015319824, 0.0037741661071777344, 0.003938496112823486, 0.004102826118469238, 0.00426715612411499, 0.004431486129760742, 0.004595816135406494, 0.004760146141052246, 0.004924476146697998, 0.00508880615234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 10.0, 6.0, 11.0, 15.0, 21.0, 33.0, 37.0, 56.0, 77.0, 105.0, 139.0, 177.0, 282.0, 407.0, 615.0, 1030.0, 2046.0, 8106.0, 988274.0, 38580.0, 4358.0, 1499.0, 871.0, 533.0, 376.0, 286.0, 183.0, 102.0, 84.0, 60.0, 50.0, 37.0, 20.0, 16.0, 14.0, 9.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0305328369140625, -0.029541730880737305, -0.02855062484741211, -0.027559518814086914, -0.02656841278076172, -0.025577306747436523, -0.024586200714111328, -0.023595094680786133, -0.022603988647460938, -0.021612882614135742, -0.020621776580810547, -0.01963067054748535, -0.018639564514160156, -0.01764845848083496, -0.016657352447509766, -0.01566624641418457, -0.014675140380859375, -0.01368403434753418, -0.012692928314208984, -0.011701822280883789, -0.010710716247558594, -0.009719610214233398, -0.008728504180908203, -0.007737398147583008, -0.0067462921142578125, -0.005755186080932617, -0.004764080047607422, -0.0037729740142822266, -0.0027818679809570312, -0.001790761947631836, -0.0007996559143066406, 0.0001914501190185547, 0.00118255615234375, 0.0021736621856689453, 0.0031647682189941406, 0.004155874252319336, 0.005146980285644531, 0.0061380863189697266, 0.007129192352294922, 0.008120298385620117, 0.009111404418945312, 0.010102510452270508, 0.011093616485595703, 0.012084722518920898, 0.013075828552246094, 0.014066934585571289, 0.015058040618896484, 0.01604914665222168, 0.017040252685546875, 0.01803135871887207, 0.019022464752197266, 0.02001357078552246, 0.021004676818847656, 0.02199578285217285, 0.022986888885498047, 0.023977994918823242, 0.024969100952148438, 0.025960206985473633, 0.026951313018798828, 0.027942419052124023, 0.02893352508544922, 0.029924631118774414, 0.03091573715209961, 0.031906843185424805, 0.03289794921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 1.0, 1.0, 5.0, 4.0, 9.0, 16.0, 12.0, 72.0, 747.0, 74.0, 16.0, 9.0, 7.0, 5.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0609626770019531e-05, -1.0310672223567963e-05, -1.0011717677116394e-05, -9.712763130664825e-06, -9.413808584213257e-06, -9.114854037761688e-06, -8.81589949131012e-06, -8.516944944858551e-06, -8.217990398406982e-06, -7.919035851955414e-06, -7.620081305503845e-06, -7.321126759052277e-06, -7.022172212600708e-06, -6.723217666149139e-06, -6.424263119697571e-06, -6.125308573246002e-06, -5.826354026794434e-06, -5.527399480342865e-06, -5.228444933891296e-06, -4.929490387439728e-06, -4.630535840988159e-06, -4.3315812945365906e-06, -4.032626748085022e-06, -3.7336722016334534e-06, -3.4347176551818848e-06, -3.135763108730316e-06, -2.8368085622787476e-06, -2.537854015827179e-06, -2.2388994693756104e-06, -1.9399449229240417e-06, -1.6409903764724731e-06, -1.3420358300209045e-06, -1.043081283569336e-06, -7.441267371177673e-07, -4.4517219066619873e-07, -1.4621764421463013e-07, 1.5273690223693848e-07, 4.516914486885071e-07, 7.506459951400757e-07, 1.0496005415916443e-06, 1.3485550880432129e-06, 1.6475096344947815e-06, 1.94646418094635e-06, 2.2454187273979187e-06, 2.5443732738494873e-06, 2.843327820301056e-06, 3.1422823667526245e-06, 3.441236913204193e-06, 3.7401914596557617e-06, 4.03914600610733e-06, 4.338100552558899e-06, 4.6370550990104675e-06, 4.936009645462036e-06, 5.234964191913605e-06, 5.533918738365173e-06, 5.832873284816742e-06, 6.1318278312683105e-06, 6.430782377719879e-06, 6.729736924171448e-06, 7.028691470623016e-06, 7.327646017074585e-06, 7.6266005635261536e-06, 7.925555109977722e-06, 8.22450965642929e-06, 8.52346420288086e-06]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 11.0, 16.0, 31.0, 37.0, 65.0, 77.0, 132.0, 184.0, 276.0, 406.0, 701.0, 1111.0, 1987.0, 3747.0, 8557.0, 29759.0, 941951.0, 39587.0, 10379.0, 4229.0, 2105.0, 1190.0, 675.0, 459.0, 293.0, 198.0, 121.0, 78.0, 61.0, 35.0, 23.0, 16.0, 13.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.00885772705078125, -0.008628129959106445, -0.00839853286743164, -0.008168935775756836, -0.007939338684082031, -0.0077097415924072266, -0.007480144500732422, -0.007250547409057617, -0.0070209503173828125, -0.006791353225708008, -0.006561756134033203, -0.0063321590423583984, -0.006102561950683594, -0.005872964859008789, -0.005643367767333984, -0.00541377067565918, -0.005184173583984375, -0.00495457649230957, -0.004724979400634766, -0.004495382308959961, -0.004265785217285156, -0.0040361881256103516, -0.003806591033935547, -0.003576993942260742, -0.0033473968505859375, -0.003117799758911133, -0.002888202667236328, -0.0026586055755615234, -0.0024290084838867188, -0.002199411392211914, -0.0019698143005371094, -0.0017402172088623047, -0.0015106201171875, -0.0012810230255126953, -0.0010514259338378906, -0.0008218288421630859, -0.0005922317504882812, -0.00036263465881347656, -0.00013303756713867188, 9.655952453613281e-05, 0.0003261566162109375, 0.0005557537078857422, 0.0007853507995605469, 0.0010149478912353516, 0.0012445449829101562, 0.001474142074584961, 0.0017037391662597656, 0.0019333362579345703, 0.002162933349609375, 0.0023925304412841797, 0.0026221275329589844, 0.002851724624633789, 0.0030813217163085938, 0.0033109188079833984, 0.003540515899658203, 0.003770112991333008, 0.0039997100830078125, 0.004229307174682617, 0.004458904266357422, 0.0046885013580322266, 0.004918098449707031, 0.005147695541381836, 0.005377292633056641, 0.005606889724731445, 0.00583648681640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 5.0, 9.0, 7.0, 16.0, 16.0, 21.0, 102.0, 600.0, 104.0, 28.0, 10.0, 12.0, 16.0, 6.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0037975311279296875, -0.00369909405708313, -0.0036006569862365723, -0.0035022199153900146, -0.003403782844543457, -0.0033053457736968994, -0.003206908702850342, -0.003108471632003784, -0.0030100345611572266, -0.002911597490310669, -0.0028131604194641113, -0.0027147233486175537, -0.002616286277770996, -0.0025178492069244385, -0.002419412136077881, -0.0023209750652313232, -0.0022225379943847656, -0.002124100923538208, -0.0020256638526916504, -0.0019272267818450928, -0.0018287897109985352, -0.0017303526401519775, -0.00163191556930542, -0.0015334784984588623, -0.0014350414276123047, -0.001336604356765747, -0.0012381672859191895, -0.0011397302150726318, -0.0010412931442260742, -0.0009428560733795166, -0.000844419002532959, -0.0007459819316864014, -0.0006475448608398438, -0.0005491077899932861, -0.0004506707191467285, -0.0003522336483001709, -0.0002537965774536133, -0.00015535950660705566, -5.692243576049805e-05, 4.151463508605957e-05, 0.0001399517059326172, 0.0002383887767791748, 0.0003368258476257324, 0.00043526291847229004, 0.0005336999893188477, 0.0006321370601654053, 0.0007305741310119629, 0.0008290112018585205, 0.0009274482727050781, 0.0010258853435516357, 0.0011243224143981934, 0.001222759485244751, 0.0013211965560913086, 0.0014196336269378662, 0.0015180706977844238, 0.0016165077686309814, 0.001714944839477539, 0.0018133819103240967, 0.0019118189811706543, 0.002010256052017212, 0.0021086931228637695, 0.002207130193710327, 0.0023055672645568848, 0.0024040043354034424, 0.00250244140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 11.0, 19.0, 30.0, 68.0, 149.0, 349.0, 187.0, 67.0, 47.0, 21.0, 11.0, 8.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04293232411146164, -0.040832292288541794, -0.03873226046562195, -0.0366322286427021, -0.03453219681978226, -0.03243216499686241, -0.030332135036587715, -0.02823210321366787, -0.026132071390748024, -0.02403203956782818, -0.021932007744908333, -0.019831977784633636, -0.01773194596171379, -0.015631914138793945, -0.0135318823158741, -0.011431850492954254, -0.009331818670034409, -0.007231786847114563, -0.005131755489856005, -0.0030317241325974464, -0.0009316923096776009, 0.0011683395132422447, 0.0032683704048395157, 0.005368402227759361, 0.007468434050679207, 0.009568465873599052, 0.011668497696518898, 0.013768528588116169, 0.01586855947971344, 0.017968591302633286, 0.02006862312555313, 0.022168654948472977, 0.024268686771392822, 0.026368718594312668, 0.028468750417232513, 0.03056878224015236, 0.032668814063072205, 0.03476884588599205, 0.036868877708911896, 0.03896890580654144, 0.04106894135475159, 0.04316897317767143, 0.04526900500059128, 0.047369036823511124, 0.04946906864643097, 0.051569100469350815, 0.05366913229227066, 0.05576916038990021, 0.05786919221282005, 0.0599692240357399, 0.062069255858659744, 0.06416928768157959, 0.06626931577920914, 0.06836935132741928, 0.07046937942504883, 0.07256941497325897, 0.07466944307088852, 0.07676947116851807, 0.07886950671672821, 0.08096953481435776, 0.0830695703625679, 0.08516959846019745, 0.08726963400840759, 0.08936966210603714, 0.09146969765424728]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 3.0, 11.0, 10.0, 16.0, 17.0, 20.0, 31.0, 34.0, 25.0, 23.0, 42.0, 39.0, 38.0, 42.0, 45.0, 48.0, 45.0, 66.0, 36.0, 47.0, 41.0, 49.0, 37.0, 31.0, 24.0, 26.0, 22.0, 21.0, 18.0, 21.0, 12.0, 11.0, 13.0, 8.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010672792792320251, -0.010297577828168869, -0.009922361932694912, -0.00954714696854353, -0.009171931073069572, -0.00879671610891819, -0.008421500213444233, -0.00804628524929285, -0.007671069353818893, -0.007295853924006224, -0.006920638494193554, -0.006545423064380884, -0.006170207634568214, -0.005794992204755545, -0.005419776774942875, -0.0050445618107914925, -0.004669346380978823, -0.004294130951166153, -0.003918915521353483, -0.0035437000915408134, -0.0031684846617281437, -0.002793269231915474, -0.002418054034933448, -0.002042838605120778, -0.0016676231753081083, -0.0012924077454954386, -0.0009171923738904297, -0.0005419770022854209, -0.00016676157247275114, 0.0002084538573399186, 0.0005836691707372665, 0.0009588846005499363, 0.001334100030362606, 0.0017093154601752758, 0.0020845308899879456, 0.0024597463198006153, 0.002834961749613285, 0.003210177179425955, 0.003585392376407981, 0.003960607573390007, 0.004335823468863964, 0.004711038898676634, 0.005086254328489304, 0.005461469758301973, 0.005836685188114643, 0.006211900617927313, 0.006587116047739983, 0.006962331011891365, 0.007337546441704035, 0.0077127618715167046, 0.008087976835668087, 0.008463192731142044, 0.008838407695293427, 0.009213623590767384, 0.009588838554918766, 0.009964054450392723, 0.010339269414544106, 0.010714484378695488, 0.011089700274169445, 0.011464915238320827, 0.011840131133794785, 0.012215346097946167, 0.012590561993420124, 0.012965776957571507, 0.013340992853045464]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 6.0, 7.0, 9.0, 12.0, 10.0, 14.0, 16.0, 27.0, 28.0, 33.0, 69.0, 61.0, 79.0, 128.0, 143.0, 183.0, 291.0, 400.0, 582.0, 842.0, 1309.0, 1914.0, 3343.0, 6269.0, 13708.0, 39901.0, 3959510.0, 116817.0, 25458.0, 9872.0, 4908.0, 2764.0, 1649.0, 1145.0, 765.0, 536.0, 356.0, 252.0, 211.0, 169.0, 112.0, 91.0, 62.0, 53.0, 36.0, 29.0, 33.0, 33.0, 16.0, 13.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193939208984375, -0.018764734268188477, -0.018135547637939453, -0.01750636100769043, -0.016877174377441406, -0.016247987747192383, -0.01561880111694336, -0.014989614486694336, -0.014360427856445312, -0.013731241226196289, -0.013102054595947266, -0.012472867965698242, -0.011843681335449219, -0.011214494705200195, -0.010585308074951172, -0.009956121444702148, -0.009326934814453125, -0.008697748184204102, -0.008068561553955078, -0.007439374923706055, -0.006810188293457031, -0.006181001663208008, -0.005551815032958984, -0.004922628402709961, -0.0042934417724609375, -0.003664255142211914, -0.0030350685119628906, -0.002405881881713867, -0.0017766952514648438, -0.0011475086212158203, -0.0005183219909667969, 0.00011086463928222656, 0.00074005126953125, 0.0013692378997802734, 0.001998424530029297, 0.0026276111602783203, 0.0032567977905273438, 0.003885984420776367, 0.004515171051025391, 0.005144357681274414, 0.0057735443115234375, 0.006402730941772461, 0.007031917572021484, 0.007661104202270508, 0.008290290832519531, 0.008919477462768555, 0.009548664093017578, 0.010177850723266602, 0.010807037353515625, 0.011436223983764648, 0.012065410614013672, 0.012694597244262695, 0.013323783874511719, 0.013952970504760742, 0.014582157135009766, 0.015211343765258789, 0.015840530395507812, 0.016469717025756836, 0.01709890365600586, 0.017728090286254883, 0.018357276916503906, 0.01898646354675293, 0.019615650177001953, 0.020244836807250977, 0.0208740234375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 8.0, 5.0, 13.0, 10.0, 37.0, 60.0, 98.0, 95.0, 111.0, 127.0, 146.0, 82.0, 70.0, 38.0, 37.0, 15.0, 4.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0011205673217773438, -0.001087881624698639, -0.001055195927619934, -0.0010225102305412292, -0.0009898245334625244, -0.0009571388363838196, -0.0009244531393051147, -0.0008917674422264099, -0.0008590817451477051, -0.0008263960480690002, -0.0007937103509902954, -0.0007610246539115906, -0.0007283389568328857, -0.0006956532597541809, -0.0006629675626754761, -0.0006302818655967712, -0.0005975961685180664, -0.0005649104714393616, -0.0005322247743606567, -0.0004995390772819519, -0.00046685338020324707, -0.00043416768312454224, -0.0004014819860458374, -0.00036879628896713257, -0.00033611059188842773, -0.0003034248948097229, -0.00027073919773101807, -0.00023805350065231323, -0.0002053678035736084, -0.00017268210649490356, -0.00013999640941619873, -0.0001073107123374939, -7.462501525878906e-05, -4.193931818008423e-05, -9.253621101379395e-06, 2.343207597732544e-05, 5.6117773056030273e-05, 8.880347013473511e-05, 0.00012148916721343994, 0.00015417486429214478, 0.0001868605613708496, 0.00021954625844955444, 0.0002522319555282593, 0.0002849176526069641, 0.00031760334968566895, 0.0003502890467643738, 0.0003829747438430786, 0.00041566044092178345, 0.0004483461380004883, 0.0004810318350791931, 0.000513717532157898, 0.0005464032292366028, 0.0005790889263153076, 0.0006117746233940125, 0.0006444603204727173, 0.0006771460175514221, 0.000709831714630127, 0.0007425174117088318, 0.0007752031087875366, 0.0008078888058662415, 0.0008405745029449463, 0.0008732602000236511, 0.000905945897102356, 0.0009386315941810608, 0.0009713172912597656]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 9.0, 9.0, 14.0, 37.0, 146.0, 637.0, 6485.0, 4159962.0, 25343.0, 1277.0, 215.0, 54.0, 30.0, 17.0, 13.0, 7.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032989501953125, -0.03165292739868164, -0.03031635284423828, -0.028979778289794922, -0.027643203735351562, -0.026306629180908203, -0.024970054626464844, -0.023633480072021484, -0.022296905517578125, -0.020960330963134766, -0.019623756408691406, -0.018287181854248047, -0.016950607299804688, -0.015614032745361328, -0.014277458190917969, -0.01294088363647461, -0.01160430908203125, -0.01026773452758789, -0.008931159973144531, -0.007594585418701172, -0.0062580108642578125, -0.004921436309814453, -0.0035848617553710938, -0.0022482872009277344, -0.000911712646484375, 0.0004248619079589844, 0.0017614364624023438, 0.003098011016845703, 0.0044345855712890625, 0.005771160125732422, 0.007107734680175781, 0.00844430923461914, 0.0097808837890625, 0.01111745834350586, 0.012454032897949219, 0.013790607452392578, 0.015127182006835938, 0.016463756561279297, 0.017800331115722656, 0.019136905670166016, 0.020473480224609375, 0.021810054779052734, 0.023146629333496094, 0.024483203887939453, 0.025819778442382812, 0.027156352996826172, 0.02849292755126953, 0.02982950210571289, 0.03116607666015625, 0.03250265121459961, 0.03383922576904297, 0.03517580032348633, 0.03651237487792969, 0.03784894943237305, 0.039185523986816406, 0.040522098541259766, 0.041858673095703125, 0.043195247650146484, 0.044531822204589844, 0.0458683967590332, 0.04720497131347656, 0.04854154586791992, 0.04987812042236328, 0.05121469497680664, 0.05255126953125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 14.0, 23.0, 23.0, 38.0, 72.0, 418.0, 3188.0, 117.0, 48.0, 40.0, 25.0, 11.0, 5.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.003536224365234375, -0.003446042537689209, -0.003355860710144043, -0.003265678882598877, -0.003175497055053711, -0.003085315227508545, -0.002995133399963379, -0.002904951572418213, -0.002814769744873047, -0.002724587917327881, -0.002634406089782715, -0.002544224262237549, -0.002454042434692383, -0.002363860607147217, -0.0022736787796020508, -0.0021834969520568848, -0.0020933151245117188, -0.0020031332969665527, -0.0019129514694213867, -0.0018227696418762207, -0.0017325878143310547, -0.0016424059867858887, -0.0015522241592407227, -0.0014620423316955566, -0.0013718605041503906, -0.0012816786766052246, -0.0011914968490600586, -0.0011013150215148926, -0.0010111331939697266, -0.0009209513664245605, -0.0008307695388793945, -0.0007405877113342285, -0.0006504058837890625, -0.0005602240562438965, -0.00047004222869873047, -0.00037986040115356445, -0.00028967857360839844, -0.00019949674606323242, -0.0001093149185180664, -1.913309097290039e-05, 7.104873657226562e-05, 0.00016123056411743164, 0.00025141239166259766, 0.00034159421920776367, 0.0004317760467529297, 0.0005219578742980957, 0.0006121397018432617, 0.0007023215293884277, 0.0007925033569335938, 0.0008826851844787598, 0.0009728670120239258, 0.0010630488395690918, 0.0011532306671142578, 0.0012434124946594238, 0.0013335943222045898, 0.0014237761497497559, 0.0015139579772949219, 0.0016041398048400879, 0.001694321632385254, 0.00178450345993042, 0.001874685287475586, 0.001964867115020752, 0.002055048942565918, 0.002145230770111084, 0.00223541259765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 6.0, 4.0, 8.0, 14.0, 19.0, 42.0, 75.0, 114.0, 279.0, 206.0, 116.0, 45.0, 30.0, 15.0, 13.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008478313684463501, -0.008161988109350204, -0.007845663465559483, -0.007529338356107473, -0.007213013246655464, -0.006896688137203455, -0.006580363027751446, -0.006264037918299437, -0.005947712808847427, -0.005631387699395418, -0.005315062589943409, -0.0049987374804914, -0.0046824123710393906, -0.004366087261587381, -0.004049762152135372, -0.003733437042683363, -0.0034171119332313538, -0.0031007868237793446, -0.0027844617143273354, -0.002468136604875326, -0.002151811495423317, -0.0018354863859713078, -0.0015191612765192986, -0.0012028361670672894, -0.0008865110576152802, -0.000570185948163271, -0.00025386083871126175, 6.246427074074745e-05, 0.00037878938019275665, 0.0006951144896447659, 0.001011439599096775, 0.0013277647085487843, 0.001644090749323368, 0.0019604158587753773, 0.0022767409682273865, 0.0025930660776793957, 0.002909391187131405, 0.003225716296583414, 0.0035420414060354233, 0.0038583665154874325, 0.004174691624939442, 0.004491016734391451, 0.00480734184384346, 0.005123666953295469, 0.0054399920627474785, 0.005756317172199488, 0.006072642281651497, 0.006388967391103506, 0.006705292500555515, 0.0070216176100075245, 0.007337942719459534, 0.007654267828911543, 0.007970592938363552, 0.008286917582154274, 0.00860324315726757, 0.008919568732380867, 0.009235893376171589, 0.00955221801996231, 0.009868543595075607, 0.010184869170188904, 0.010501193813979626, 0.010817518457770348, 0.011133844032883644, 0.01145016960799694, 0.011766494251787663]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 13.0, 8.0, 9.0, 20.0, 17.0, 24.0, 22.0, 34.0, 21.0, 28.0, 32.0, 39.0, 38.0, 36.0, 48.0, 40.0, 44.0, 49.0, 44.0, 45.0, 31.0, 34.0, 26.0, 31.0, 26.0, 17.0, 23.0, 23.0, 26.0, 20.0, 16.0, 18.0, 19.0, 10.0, 12.0, 11.0, 11.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0019440010655671358, -0.0018798209493979812, -0.0018156409496441483, -0.0017514608334749937, -0.0016872808337211609, -0.0016231007175520062, -0.0015589206013828516, -0.0014947406016290188, -0.0014305604854598641, -0.0013663803692907095, -0.0013022003695368767, -0.001238020253367722, -0.0011738401371985674, -0.0011096601374447346, -0.00104548002127558, -0.0009812999051064253, -0.0009171199053525925, -0.0008529398473910987, -0.000788759789429605, -0.0007245796732604504, -0.0006603996152989566, -0.0005962195573374629, -0.0005320394411683083, -0.00046785938320681453, -0.0004036793252453208, -0.00033949926728382707, -0.0002753191802185029, -0.00021113910770509392, -0.00014695903519168496, -8.277897723019123e-05, -1.8598890164867043e-05, 4.5581196900457144e-05, 0.00010976102203130722, 0.00017394109454471618, 0.00023812116705812514, 0.0003023012541234493, 0.00036648131208494306, 0.0004306613700464368, 0.0004948414862155914, 0.0005590215441770852, 0.0006232016021385789, 0.0006873816601000726, 0.0007515617180615664, 0.000815741834230721, 0.0008799218921922147, 0.0009441019501537085, 0.001008282066322863, 0.0010724621824920177, 0.0011366421822458506, 0.0012008222984150052, 0.001265002298168838, 0.0013291824143379927, 0.0013933624140918255, 0.0014575425302609801, 0.0015217226464301348, 0.0015859026461839676, 0.0016500827623531222, 0.0017142628785222769, 0.0017784428782761097, 0.0018426229944452643, 0.001906803110614419, 0.001970983110368252, 0.0020351631101220846, 0.002099343342706561, 0.002163523342460394]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 10.0, 18.0, 26.0, 30.0, 57.0, 65.0, 112.0, 134.0, 199.0, 318.0, 507.0, 862.0, 1479.0, 2727.0, 5422.0, 12431.0, 35849.0, 152659.0, 661309.0, 121420.0, 31060.0, 11104.0, 4859.0, 2440.0, 1303.0, 725.0, 440.0, 302.0, 199.0, 130.0, 83.0, 70.0, 37.0, 34.0, 34.0, 17.0, 17.0, 15.0, 13.0, 8.0, 0.0, 5.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004711151123046875, -0.0004545450210571289, -0.0004379749298095703, -0.0004214048385620117, -0.0004048347473144531, -0.00038826465606689453, -0.00037169456481933594, -0.00035512447357177734, -0.00033855438232421875, -0.00032198429107666016, -0.00030541419982910156, -0.00028884410858154297, -0.0002722740173339844, -0.0002557039260864258, -0.0002391338348388672, -0.0002225637435913086, -0.00020599365234375, -0.0001894235610961914, -0.0001728534698486328, -0.00015628337860107422, -0.00013971328735351562, -0.00012314319610595703, -0.00010657310485839844, -9.000301361083984e-05, -7.343292236328125e-05, -5.6862831115722656e-05, -4.029273986816406e-05, -2.372264862060547e-05, -7.152557373046875e-06, 9.417533874511719e-06, 2.5987625122070312e-05, 4.2557716369628906e-05, 5.91278076171875e-05, 7.56978988647461e-05, 9.226799011230469e-05, 0.00010883808135986328, 0.00012540817260742188, 0.00014197826385498047, 0.00015854835510253906, 0.00017511844635009766, 0.00019168853759765625, 0.00020825862884521484, 0.00022482872009277344, 0.00024139881134033203, 0.0002579689025878906, 0.0002745389938354492, 0.0002911090850830078, 0.0003076791763305664, 0.000324249267578125, 0.0003408193588256836, 0.0003573894500732422, 0.0003739595413208008, 0.0003905296325683594, 0.00040709972381591797, 0.00042366981506347656, 0.00044023990631103516, 0.00045680999755859375, 0.00047338008880615234, 0.0004899501800537109, 0.0005065202713012695, 0.0005230903625488281, 0.0005396604537963867, 0.0005562305450439453, 0.0005728006362915039, 0.0005893707275390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 10.0, 6.0, 11.0, 14.0, 20.0, 20.0, 41.0, 66.0, 59.0, 83.0, 91.0, 106.0, 95.0, 82.0, 55.0, 53.0, 49.0, 33.0, 29.0, 14.0, 9.0, 10.0, 13.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0035648345947265625, -0.0034618079662323, -0.003358781337738037, -0.0032557547092437744, -0.0031527280807495117, -0.003049701452255249, -0.0029466748237609863, -0.0028436481952667236, -0.002740621566772461, -0.0026375949382781982, -0.0025345683097839355, -0.002431541681289673, -0.00232851505279541, -0.0022254884243011475, -0.0021224617958068848, -0.002019435167312622, -0.0019164085388183594, -0.0018133819103240967, -0.001710355281829834, -0.0016073286533355713, -0.0015043020248413086, -0.001401275396347046, -0.0012982487678527832, -0.0011952221393585205, -0.0010921955108642578, -0.0009891688823699951, -0.0008861422538757324, -0.0007831156253814697, -0.000680088996887207, -0.0005770623683929443, -0.00047403573989868164, -0.00037100911140441895, -0.00026798248291015625, -0.00016495585441589355, -6.192922592163086e-05, 4.1097402572631836e-05, 0.00014412403106689453, 0.0002471506595611572, 0.0003501772880554199, 0.0004532039165496826, 0.0005562305450439453, 0.000659257173538208, 0.0007622838020324707, 0.0008653104305267334, 0.0009683370590209961, 0.0010713636875152588, 0.0011743903160095215, 0.0012774169445037842, 0.0013804435729980469, 0.0014834702014923096, 0.0015864968299865723, 0.001689523458480835, 0.0017925500869750977, 0.0018955767154693604, 0.001998603343963623, 0.0021016299724578857, 0.0022046566009521484, 0.002307683229446411, 0.002410709857940674, 0.0025137364864349365, 0.0026167631149291992, 0.002719789743423462, 0.0028228163719177246, 0.0029258430004119873, 0.00302886962890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 5.0, 10.0, 16.0, 17.0, 25.0, 30.0, 39.0, 35.0, 58.0, 64.0, 96.0, 127.0, 170.0, 360.0, 779.0, 2422.0, 8921.0, 46454.0, 680385.0, 270717.0, 28449.0, 6137.0, 1703.0, 614.0, 272.0, 149.0, 108.0, 77.0, 59.0, 43.0, 38.0, 37.0, 31.0, 20.0, 16.0, 10.0, 8.0, 9.0, 10.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00017690658569335938, -0.00017098337411880493, -0.0001650601625442505, -0.00015913695096969604, -0.0001532137393951416, -0.00014729052782058716, -0.00014136731624603271, -0.00013544410467147827, -0.00012952089309692383, -0.00012359768152236938, -0.00011767446994781494, -0.0001117512583732605, -0.00010582804679870605, -9.990483522415161e-05, -9.398162364959717e-05, -8.805841207504272e-05, -8.213520050048828e-05, -7.621198892593384e-05, -7.02887773513794e-05, -6.436556577682495e-05, -5.844235420227051e-05, -5.2519142627716064e-05, -4.659593105316162e-05, -4.067271947860718e-05, -3.4749507904052734e-05, -2.882629632949829e-05, -2.2903084754943848e-05, -1.6979873180389404e-05, -1.1056661605834961e-05, -5.133450031280518e-06, 7.897615432739258e-07, 6.712973117828369e-06, 1.2636184692382812e-05, 1.8559396266937256e-05, 2.44826078414917e-05, 3.0405819416046143e-05, 3.6329030990600586e-05, 4.225224256515503e-05, 4.817545413970947e-05, 5.4098665714263916e-05, 6.002187728881836e-05, 6.59450888633728e-05, 7.186830043792725e-05, 7.779151201248169e-05, 8.371472358703613e-05, 8.963793516159058e-05, 9.556114673614502e-05, 0.00010148435831069946, 0.0001074075698852539, 0.00011333078145980835, 0.00011925399303436279, 0.00012517720460891724, 0.00013110041618347168, 0.00013702362775802612, 0.00014294683933258057, 0.000148870050907135, 0.00015479326248168945, 0.0001607164740562439, 0.00016663968563079834, 0.00017256289720535278, 0.00017848610877990723, 0.00018440932035446167, 0.0001903325319290161, 0.00019625574350357056, 0.000202178955078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 8.0, 4.0, 6.0, 11.0, 11.0, 12.0, 16.0, 20.0, 14.0, 20.0, 27.0, 37.0, 41.0, 33.0, 30.0, 40.0, 45.0, 44.0, 44.0, 37.0, 37.0, 54.0, 42.0, 52.0, 34.0, 47.0, 26.0, 30.0, 20.0, 22.0, 22.0, 14.0, 24.0, 14.0, 10.0, 10.0, 5.0, 5.0, 6.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004520416259765625, -0.004369199275970459, -0.004217982292175293, -0.004066765308380127, -0.003915548324584961, -0.003764331340789795, -0.003613114356994629, -0.003461897373199463, -0.003310680389404297, -0.003159463405609131, -0.003008246421813965, -0.002857029438018799, -0.002705812454223633, -0.002554595470428467, -0.0024033784866333008, -0.0022521615028381348, -0.0021009445190429688, -0.0019497275352478027, -0.0017985105514526367, -0.0016472935676574707, -0.0014960765838623047, -0.0013448596000671387, -0.0011936426162719727, -0.0010424256324768066, -0.0008912086486816406, -0.0007399916648864746, -0.0005887746810913086, -0.0004375576972961426, -0.00028634071350097656, -0.00013512372970581055, 1.609325408935547e-05, 0.00016731023788452148, 0.0003185272216796875, 0.0004697442054748535, 0.0006209611892700195, 0.0007721781730651855, 0.0009233951568603516, 0.0010746121406555176, 0.0012258291244506836, 0.0013770461082458496, 0.0015282630920410156, 0.0016794800758361816, 0.0018306970596313477, 0.0019819140434265137, 0.0021331310272216797, 0.0022843480110168457, 0.0024355649948120117, 0.0025867819786071777, 0.0027379989624023438, 0.0028892159461975098, 0.0030404329299926758, 0.003191649913787842, 0.003342866897583008, 0.003494083881378174, 0.00364530086517334, 0.003796517848968506, 0.003947734832763672, 0.004098951816558838, 0.004250168800354004, 0.00440138578414917, 0.004552602767944336, 0.004703819751739502, 0.004855036735534668, 0.005006253719329834, 0.005157470703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 4.0, 9.0, 9.0, 0.0, 12.0, 17.0, 28.0, 47.0, 0.0, 42.0, 87.0, 109.0, 0.0, 183.0, 316.0, 512.0, 0.0, 899.0, 1573.0, 2900.0, 0.0, 6283.0, 18119.0, 96322.0, 793646.0, 0.0, 96894.0, 17828.0, 6216.0, 0.0, 2893.0, 1551.0, 865.0, 0.0, 481.0, 281.0, 150.0, 0.0, 110.0, 55.0, 44.0, 22.0, 0.0, 19.0, 13.0, 8.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.5497207641601562e-06, -1.5040859580039978e-06, -1.4584511518478394e-06, -1.412816345691681e-06, -1.3671815395355225e-06, -1.321546733379364e-06, -1.2759119272232056e-06, -1.2302771210670471e-06, -1.1846423149108887e-06, -1.1390075087547302e-06, -1.0933727025985718e-06, -1.0477378964424133e-06, -1.0021030902862549e-06, -9.564682841300964e-07, -9.10833477973938e-07, -8.651986718177795e-07, -8.195638656616211e-07, -7.739290595054626e-07, -7.282942533493042e-07, -6.826594471931458e-07, -6.370246410369873e-07, -5.913898348808289e-07, -5.457550287246704e-07, -5.00120222568512e-07, -4.544854164123535e-07, -4.0885061025619507e-07, -3.632158041000366e-07, -3.175809979438782e-07, -2.7194619178771973e-07, -2.2631138563156128e-07, -1.8067657947540283e-07, -1.3504177331924438e-07, -8.940696716308594e-08, -4.377216100692749e-08, 1.862645149230957e-09, 4.7497451305389404e-08, 9.313225746154785e-08, 1.387670636177063e-07, 1.8440186977386475e-07, 2.300366759300232e-07, 2.7567148208618164e-07, 3.213062882423401e-07, 3.6694109439849854e-07, 4.12575900554657e-07, 4.5821070671081543e-07, 5.038455128669739e-07, 5.494803190231323e-07, 5.951151251792908e-07, 6.407499313354492e-07, 6.863847374916077e-07, 7.320195436477661e-07, 7.776543498039246e-07, 8.23289155960083e-07, 8.689239621162415e-07, 9.145587682723999e-07, 9.601935744285583e-07, 1.0058283805847168e-06, 1.0514631867408752e-06, 1.0970979928970337e-06, 1.1427327990531921e-06, 1.1883676052093506e-06, 1.234002411365509e-06, 1.2796372175216675e-06, 1.325272023677826e-06, 1.3709068298339844e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 17.0, 0.0, 19.0, 0.0, 0.0, 33.0, 0.0, 56.0, 0.0, 0.0, 76.0, 0.0, 106.0, 0.0, 105.0, 0.0, 0.0, 146.0, 0.0, 133.0, 0.0, 102.0, 0.0, 0.0, 66.0, 0.0, 54.0, 0.0, 0.0, 34.0, 0.0, 31.0, 0.0, 14.0, 0.0, 0.0, 8.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 8.0, 8.0, 8.0, 21.0, 42.0, 22.0, 35.0, 77.0, 116.0, 145.0, 688.0, 816.0, 1588.0, 3225.0, 6769.0, 17870.0, 69393.0, 846396.0, 70133.0, 24361.0, 3110.0, 1653.0, 784.0, 479.0, 319.0, 160.0, 101.0, 86.0, 60.0, 33.0, 15.0, 7.0, 1.0, 11.0, 9.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1988525986671448e-06, -2.132728695869446e-06, -2.066604793071747e-06, -2.000480890274048e-06, -1.934356987476349e-06, -1.86823308467865e-06, -1.802109181880951e-06, -1.735985279083252e-06, -1.669861376285553e-06, -1.603737473487854e-06, -1.537613570690155e-06, -1.471489667892456e-06, -1.405365765094757e-06, -1.339241862297058e-06, -1.2731179594993591e-06, -1.2069940567016602e-06, -1.1408701539039612e-06, -1.0747462511062622e-06, -1.0086223483085632e-06, -9.424984455108643e-07, -8.763745427131653e-07, -8.102506399154663e-07, -7.441267371177673e-07, -6.780028343200684e-07, -6.118789315223694e-07, -5.457550287246704e-07, -4.796311259269714e-07, -4.1350722312927246e-07, -3.473833203315735e-07, -2.812594175338745e-07, -2.1513551473617554e-07, -1.4901161193847656e-07, -8.288770914077759e-08, -1.6763806343078613e-08, 4.936009645462036e-08, 1.1548399925231934e-07, 1.816079020500183e-07, 2.477318048477173e-07, 3.1385570764541626e-07, 3.7997961044311523e-07, 4.461035132408142e-07, 5.122274160385132e-07, 5.783513188362122e-07, 6.444752216339111e-07, 7.105991244316101e-07, 7.767230272293091e-07, 8.428469300270081e-07, 9.08970832824707e-07, 9.75094735622406e-07, 1.041218638420105e-06, 1.107342541217804e-06, 1.173466444015503e-06, 1.239590346813202e-06, 1.3057142496109009e-06, 1.3718381524085999e-06, 1.4379620552062988e-06, 1.5040859580039978e-06, 1.5702098608016968e-06, 1.6363337635993958e-06, 1.7024576663970947e-06, 1.7685815691947937e-06, 1.8347054719924927e-06, 1.9008293747901917e-06, 1.9669532775878906e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 104.0, 0.0, 0.0, 0.0, 688.0, 0.0, 0.0, 0.0, 0.0, 133.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.032626748085022e-07, -3.8929283618927e-07, -3.7532299757003784e-07, -3.6135315895080566e-07, -3.473833203315735e-07, -3.334134817123413e-07, -3.1944364309310913e-07, -3.0547380447387695e-07, -2.915039658546448e-07, -2.775341272354126e-07, -2.635642886161804e-07, -2.4959444999694824e-07, -2.3562461137771606e-07, -2.2165477275848389e-07, -2.076849341392517e-07, -1.9371509552001953e-07, -1.7974525690078735e-07, -1.6577541828155518e-07, -1.51805579662323e-07, -1.3783574104309082e-07, -1.2386590242385864e-07, -1.0989606380462646e-07, -9.592622518539429e-08, -8.195638656616211e-08, -6.798654794692993e-08, -5.4016709327697754e-08, -4.0046870708465576e-08, -2.60770320892334e-08, -1.210719347000122e-08, 1.862645149230957e-09, 1.5832483768463135e-08, 2.9802322387695312e-08, 4.377216100692749e-08, 5.774199962615967e-08, 7.171183824539185e-08, 8.568167686462402e-08, 9.96515154838562e-08, 1.1362135410308838e-07, 1.2759119272232056e-07, 1.4156103134155273e-07, 1.555308699607849e-07, 1.695007085800171e-07, 1.8347054719924927e-07, 1.9744038581848145e-07, 2.1141022443771362e-07, 2.253800630569458e-07, 2.39349901676178e-07, 2.5331974029541016e-07, 2.6728957891464233e-07, 2.812594175338745e-07, 2.952292561531067e-07, 3.0919909477233887e-07, 3.2316893339157104e-07, 3.371387720108032e-07, 3.511086106300354e-07, 3.650784492492676e-07, 3.7904828786849976e-07, 3.9301812648773193e-07, 4.069879651069641e-07, 4.209578037261963e-07, 4.3492764234542847e-07, 4.4889748096466064e-07, 4.628673195838928e-07, 4.76837158203125e-07]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 15.0, 34.0, 57.0, 92.0, 212.0, 282.0, 142.0, 72.0, 36.0, 19.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005370433442294598, -0.005179924424737692, -0.004989415407180786, -0.00479890638962388, -0.004608397372066975, -0.004417888354510069, -0.004227379336953163, -0.004036870319396257, -0.0038463613018393517, -0.003655852284282446, -0.00346534326672554, -0.0032748342491686344, -0.0030843252316117287, -0.002893816214054823, -0.002703307196497917, -0.0025127981789410114, -0.0023222891613841057, -0.0021317801438272, -0.0019412711262702942, -0.0017507621087133884, -0.0015602530911564827, -0.001369744073599577, -0.0011792350560426712, -0.0009887260384857655, -0.0007982170209288597, -0.000607708003371954, -0.0004171989858150482, -0.00022668996825814247, -3.6180950701236725e-05, 0.00015432806685566902, 0.00034483708441257477, 0.0005353461019694805, 0.000725854653865099, 0.0009163636714220047, 0.0011068726889789104, 0.0012973817065358162, 0.001487890724092722, 0.0016783997416496277, 0.0018689087592065334, 0.002059417776763439, 0.002249926794320345, 0.0024404358118772507, 0.0026309448294341564, 0.002821453846991062, 0.003011962864547968, 0.0032024718821048737, 0.0033929808996617794, 0.003583489917218685, 0.003773998934775591, 0.003964507952332497, 0.004155016969889402, 0.004345525987446308, 0.004536035005003214, 0.00472654402256012, 0.004917053040117025, 0.005107562057673931, 0.005298071075230837, 0.005488580092787743, 0.005679089110344648, 0.005869598127901554, 0.00606010714545846, 0.006250616163015366, 0.006441125180572271, 0.006631634198129177, 0.006822143215686083]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 1.0, 3.0, 7.0, 7.0, 8.0, 7.0, 14.0, 14.0, 17.0, 24.0, 28.0, 26.0, 27.0, 23.0, 41.0, 36.0, 33.0, 42.0, 54.0, 40.0, 47.0, 43.0, 48.0, 32.0, 38.0, 28.0, 28.0, 38.0, 21.0, 20.0, 29.0, 22.0, 17.0, 27.0, 17.0, 17.0, 14.0, 13.0, 8.0, 14.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.001147820265032351, -0.0011132254730910063, -0.0010786307975649834, -0.0010440360056236386, -0.001009441213682294, -0.0009748464799486101, -0.0009402517462149262, -0.0009056569542735815, -0.0008710622205398977, -0.0008364674868062139, -0.0008018726948648691, -0.0007672779611311853, -0.0007326832273975015, -0.0006980884354561567, -0.0006634937017224729, -0.0006288989679887891, -0.0005943041760474443, -0.0005597094423137605, -0.0005251146503724158, -0.000490519916638732, -0.0004559251538012177, -0.0004213303909637034, -0.00038673565723001957, -0.0003521408943925053, -0.000317546131554991, -0.0002829513687174767, -0.00024835660587996244, -0.00021376187214627862, -0.00017916710930876434, -0.00014457234647125006, -0.000109977598185651, -7.538284990005195e-05, -4.078797064721584e-05, -6.193215085659176e-06, 2.840154047589749e-05, 6.299629603745416e-05, 9.759105159901083e-05, 0.0001321858144365251, 0.00016678056272212416, 0.0002013753110077232, 0.0002359700738452375, 0.0002705648366827518, 0.00030515959952026606, 0.0003397543332539499, 0.00037434909609146416, 0.00040894385892897844, 0.00044353859266266227, 0.00047813335550017655, 0.0005127281183376908, 0.0005473228520713747, 0.0005819176440127194, 0.0006165123777464032, 0.000651107169687748, 0.0006857019034214318, 0.0007202966371551156, 0.0007548914290964603, 0.0007894861628301442, 0.000824080896563828, 0.0008586756885051727, 0.0008932704222388566, 0.0009278651559725404, 0.0009624599479138851, 0.0009970547398552299, 0.0010316494153812528, 0.0010662442073225975]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 6.0, 4.0, 6.0, 9.0, 19.0, 23.0, 94.0, 413.0, 1994.0, 13582.0, 740226.0, 280151.0, 9985.0, 1534.0, 337.0, 74.0, 30.0, 13.0, 10.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.009735107421875, -0.009439468383789062, -0.009143829345703125, -0.008848190307617188, -0.00855255126953125, -0.008256912231445312, -0.007961273193359375, -0.0076656341552734375, -0.0073699951171875, -0.0070743560791015625, -0.006778717041015625, -0.0064830780029296875, -0.00618743896484375, -0.0058917999267578125, -0.005596160888671875, -0.0053005218505859375, -0.0050048828125, -0.0047092437744140625, -0.004413604736328125, -0.0041179656982421875, -0.00382232666015625, -0.0035266876220703125, -0.003231048583984375, -0.0029354095458984375, -0.0026397705078125, -0.0023441314697265625, -0.002048492431640625, -0.0017528533935546875, -0.00145721435546875, -0.0011615753173828125, -0.000865936279296875, -0.0005702972412109375, -0.000274658203125, 2.09808349609375e-05, 0.000316619873046875, 0.0006122589111328125, 0.00090789794921875, 0.0012035369873046875, 0.001499176025390625, 0.0017948150634765625, 0.0020904541015625, 0.0023860931396484375, 0.002681732177734375, 0.0029773712158203125, 0.00327301025390625, 0.0035686492919921875, 0.003864288330078125, 0.0041599273681640625, 0.00445556640625, 0.0047512054443359375, 0.005046844482421875, 0.0053424835205078125, 0.00563812255859375, 0.0059337615966796875, 0.006229400634765625, 0.0065250396728515625, 0.0068206787109375, 0.0071163177490234375, 0.007411956787109375, 0.0077075958251953125, 0.00800323486328125, 0.008298873901367188, 0.008594512939453125, 0.008890151977539062, 0.009185791015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 7.0, 15.0, 32.0, 41.0, 63.0, 102.0, 131.0, 135.0, 118.0, 100.0, 95.0, 57.0, 21.0, 22.0, 13.0, 8.0, 7.0, 7.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003981590270996094, -0.00038904324173927307, -0.00037992745637893677, -0.00037081167101860046, -0.00036169588565826416, -0.00035258010029792786, -0.00034346431493759155, -0.00033434852957725525, -0.00032523274421691895, -0.00031611695885658264, -0.00030700117349624634, -0.00029788538813591003, -0.00028876960277557373, -0.0002796538174152374, -0.0002705380320549011, -0.0002614222466945648, -0.0002523064613342285, -0.0002431906759738922, -0.0002340748906135559, -0.0002249591052532196, -0.0002158433198928833, -0.000206727534532547, -0.0001976117491722107, -0.0001884959638118744, -0.00017938017845153809, -0.00017026439309120178, -0.00016114860773086548, -0.00015203282237052917, -0.00014291703701019287, -0.00013380125164985657, -0.00012468546628952026, -0.00011556968092918396, -0.00010645389556884766, -9.733811020851135e-05, -8.822232484817505e-05, -7.910653948783875e-05, -6.999075412750244e-05, -6.087496876716614e-05, -5.1759183406829834e-05, -4.264339804649353e-05, -3.3527612686157227e-05, -2.4411827325820923e-05, -1.529604196548462e-05, -6.1802566051483154e-06, 2.9355287551879883e-06, 1.2051314115524292e-05, 2.1167099475860596e-05, 3.02828848361969e-05, 3.93986701965332e-05, 4.851445555686951e-05, 5.763024091720581e-05, 6.674602627754211e-05, 7.586181163787842e-05, 8.497759699821472e-05, 9.409338235855103e-05, 0.00010320916771888733, 0.00011232495307922363, 0.00012144073843955994, 0.00013055652379989624, 0.00013967230916023254, 0.00014878809452056885, 0.00015790387988090515, 0.00016701966524124146, 0.00017613545060157776, 0.00018525123596191406]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 7.0, 9.0, 5.0, 13.0, 23.0, 31.0, 52.0, 65.0, 78.0, 153.0, 205.0, 291.0, 436.0, 735.0, 1126.0, 1803.0, 2927.0, 5270.0, 9473.0, 19771.0, 51292.0, 195541.0, 568727.0, 119542.0, 36934.0, 15168.0, 7727.0, 4256.0, 2519.0, 1563.0, 952.0, 649.0, 379.0, 254.0, 197.0, 122.0, 78.0, 42.0, 34.0, 23.0, 23.0, 16.0, 11.0, 10.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009660720825195312, -0.0009379386901855469, -0.0009098052978515625, -0.0008816719055175781, -0.0008535385131835938, -0.0008254051208496094, -0.000797271728515625, -0.0007691383361816406, -0.0007410049438476562, -0.0007128715515136719, -0.0006847381591796875, -0.0006566047668457031, -0.0006284713745117188, -0.0006003379821777344, -0.00057220458984375, -0.0005440711975097656, -0.0005159378051757812, -0.0004878044128417969, -0.0004596710205078125, -0.0004315376281738281, -0.00040340423583984375, -0.0003752708435058594, -0.000347137451171875, -0.0003190040588378906, -0.00029087066650390625, -0.0002627372741699219, -0.0002346038818359375, -0.00020647048950195312, -0.00017833709716796875, -0.00015020370483398438, -0.0001220703125, -9.393692016601562e-05, -6.580352783203125e-05, -3.7670135498046875e-05, -9.5367431640625e-06, 1.8596649169921875e-05, 4.673004150390625e-05, 7.486343383789062e-05, 0.000102996826171875, 0.00013113021850585938, 0.00015926361083984375, 0.00018739700317382812, 0.0002155303955078125, 0.00024366378784179688, 0.00027179718017578125, 0.0002999305725097656, 0.00032806396484375, 0.0003561973571777344, 0.00038433074951171875, 0.0004124641418457031, 0.0004405975341796875, 0.0004687309265136719, 0.0004968643188476562, 0.0005249977111816406, 0.000553131103515625, 0.0005812644958496094, 0.0006093978881835938, 0.0006375312805175781, 0.0006656646728515625, 0.0006937980651855469, 0.0007219314575195312, 0.0007500648498535156, 0.0007781982421875, 0.0008063316345214844, 0.0008344650268554688]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 11.0, 11.0, 12.0, 20.0, 20.0, 32.0, 62.0, 67.0, 80.0, 89.0, 102.0, 101.0, 81.0, 59.0, 67.0, 45.0, 22.0, 22.0, 10.0, 16.0, 5.0, 8.0, 5.0, 3.0, 9.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.0006017684936523438, -0.0005862228572368622, -0.0005706772208213806, -0.000555131584405899, -0.0005395859479904175, -0.0005240403115749359, -0.0005084946751594543, -0.0004929490387439728, -0.0004774034023284912, -0.00046185776591300964, -0.0004463121294975281, -0.0004307664930820465, -0.00041522085666656494, -0.0003996752202510834, -0.0003841295838356018, -0.00036858394742012024, -0.00035303831100463867, -0.0003374926745891571, -0.00032194703817367554, -0.00030640140175819397, -0.0002908557653427124, -0.00027531012892723083, -0.00025976449251174927, -0.0002442188560962677, -0.00022867321968078613, -0.00021312758326530457, -0.000197581946849823, -0.00018203631043434143, -0.00016649067401885986, -0.0001509450376033783, -0.00013539940118789673, -0.00011985376477241516, -0.0001043081283569336, -8.876249194145203e-05, -7.321685552597046e-05, -5.767121911048889e-05, -4.2125582695007324e-05, -2.6579946279525757e-05, -1.103430986404419e-05, 4.511326551437378e-06, 2.0056962966918945e-05, 3.560259938240051e-05, 5.114823579788208e-05, 6.669387221336365e-05, 8.223950862884521e-05, 9.778514504432678e-05, 0.00011333078145980835, 0.00012887641787528992, 0.00014442205429077148, 0.00015996769070625305, 0.00017551332712173462, 0.0001910589635372162, 0.00020660459995269775, 0.00022215023636817932, 0.0002376958727836609, 0.00025324150919914246, 0.000268787145614624, 0.0002843327820301056, 0.00029987841844558716, 0.0003154240548610687, 0.0003309696912765503, 0.00034651532769203186, 0.00036206096410751343, 0.000377606600522995, 0.00039315223693847656]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 7.0, 9.0, 18.0, 22.0, 25.0, 22.0, 47.0, 64.0, 78.0, 105.0, 182.0, 258.0, 407.0, 721.0, 1637.0, 4807.0, 22138.0, 999603.0, 12154.0, 3354.0, 1205.0, 553.0, 347.0, 241.0, 148.0, 96.0, 84.0, 57.0, 42.0, 28.0, 27.0, 19.0, 10.0, 6.0, 7.0, 7.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0078125, -0.007578253746032715, -0.00734400749206543, -0.0071097612380981445, -0.006875514984130859, -0.006641268730163574, -0.006407022476196289, -0.006172776222229004, -0.005938529968261719, -0.005704283714294434, -0.0054700374603271484, -0.005235791206359863, -0.005001544952392578, -0.004767298698425293, -0.004533052444458008, -0.004298806190490723, -0.0040645599365234375, -0.0038303136825561523, -0.003596067428588867, -0.003361821174621582, -0.003127574920654297, -0.0028933286666870117, -0.0026590824127197266, -0.0024248361587524414, -0.0021905899047851562, -0.001956343650817871, -0.001722097396850586, -0.0014878511428833008, -0.0012536048889160156, -0.0010193586349487305, -0.0007851123809814453, -0.0005508661270141602, -0.000316619873046875, -8.237361907958984e-05, 0.0001518726348876953, 0.00038611888885498047, 0.0006203651428222656, 0.0008546113967895508, 0.001088857650756836, 0.001323103904724121, 0.0015573501586914062, 0.0017915964126586914, 0.0020258426666259766, 0.0022600889205932617, 0.002494335174560547, 0.002728581428527832, 0.002962827682495117, 0.0031970739364624023, 0.0034313201904296875, 0.0036655664443969727, 0.003899812698364258, 0.004134058952331543, 0.004368305206298828, 0.004602551460266113, 0.0048367977142333984, 0.005071043968200684, 0.005305290222167969, 0.005539536476135254, 0.005773782730102539, 0.006008028984069824, 0.006242275238037109, 0.0064765214920043945, 0.00671076774597168, 0.006945013999938965, 0.00717926025390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 12.0, 10.0, 30.0, 86.0, 228.0, 306.0, 197.0, 102.0, 12.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7201527953147888e-06, -1.6521662473678589e-06, -1.584179699420929e-06, -1.516193151473999e-06, -1.448206603527069e-06, -1.3802200555801392e-06, -1.3122335076332092e-06, -1.2442469596862793e-06, -1.1762604117393494e-06, -1.1082738637924194e-06, -1.0402873158454895e-06, -9.723007678985596e-07, -9.043142199516296e-07, -8.363276720046997e-07, -7.683411240577698e-07, -7.003545761108398e-07, -6.323680281639099e-07, -5.6438148021698e-07, -4.9639493227005e-07, -4.284083843231201e-07, -3.604218363761902e-07, -2.9243528842926025e-07, -2.2444874048233032e-07, -1.564621925354004e-07, -8.847564458847046e-08, -2.0489096641540527e-08, 4.7497451305389404e-08, 1.1548399925231934e-07, 1.8347054719924927e-07, 2.514570951461792e-07, 3.1944364309310913e-07, 3.8743019104003906e-07, 4.55416738986969e-07, 5.234032869338989e-07, 5.913898348808289e-07, 6.593763828277588e-07, 7.273629307746887e-07, 7.953494787216187e-07, 8.633360266685486e-07, 9.313225746154785e-07, 9.993091225624084e-07, 1.0672956705093384e-06, 1.1352822184562683e-06, 1.2032687664031982e-06, 1.2712553143501282e-06, 1.339241862297058e-06, 1.407228410243988e-06, 1.475214958190918e-06, 1.543201506137848e-06, 1.6111880540847778e-06, 1.6791746020317078e-06, 1.7471611499786377e-06, 1.8151476979255676e-06, 1.8831342458724976e-06, 1.9511207938194275e-06, 2.0191073417663574e-06, 2.0870938897132874e-06, 2.1550804376602173e-06, 2.2230669856071472e-06, 2.291053533554077e-06, 2.359040081501007e-06, 2.427026629447937e-06, 2.495013177394867e-06, 2.562999725341797e-06]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 14.0, 21.0, 22.0, 25.0, 25.0, 52.0, 52.0, 86.0, 110.0, 123.0, 183.0, 230.0, 334.0, 422.0, 578.0, 802.0, 1042.0, 1572.0, 2441.0, 4142.0, 9326.0, 38474.0, 949320.0, 21451.0, 6927.0, 3459.0, 2064.0, 1398.0, 1005.0, 726.0, 515.0, 390.0, 311.0, 209.0, 183.0, 109.0, 88.0, 73.0, 56.0, 53.0, 40.0, 25.0, 19.0, 15.0, 8.0, 8.0, 5.0, 8.0, 5.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0014104843139648438, -0.0013624131679534912, -0.0013143420219421387, -0.0012662708759307861, -0.0012181997299194336, -0.001170128583908081, -0.0011220574378967285, -0.001073986291885376, -0.0010259151458740234, -0.000977843999862671, -0.0009297728538513184, -0.0008817017078399658, -0.0008336305618286133, -0.0007855594158172607, -0.0007374882698059082, -0.0006894171237945557, -0.0006413459777832031, -0.0005932748317718506, -0.000545203685760498, -0.0004971325397491455, -0.00044906139373779297, -0.00040099024772644043, -0.0003529191017150879, -0.00030484795570373535, -0.0002567768096923828, -0.00020870566368103027, -0.00016063451766967773, -0.0001125633716583252, -6.449222564697266e-05, -1.6421079635620117e-05, 3.165006637573242e-05, 7.972121238708496e-05, 0.0001277923583984375, 0.00017586350440979004, 0.00022393465042114258, 0.0002720057964324951, 0.00032007694244384766, 0.0003681480884552002, 0.00041621923446655273, 0.0004642903804779053, 0.0005123615264892578, 0.0005604326725006104, 0.0006085038185119629, 0.0006565749645233154, 0.000704646110534668, 0.0007527172565460205, 0.000800788402557373, 0.0008488595485687256, 0.0008969306945800781, 0.0009450018405914307, 0.0009930729866027832, 0.0010411441326141357, 0.0010892152786254883, 0.0011372864246368408, 0.0011853575706481934, 0.001233428716659546, 0.0012814998626708984, 0.001329571008682251, 0.0013776421546936035, 0.001425713300704956, 0.0014737844467163086, 0.0015218555927276611, 0.0015699267387390137, 0.0016179978847503662, 0.0016660690307617188]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 28.0, 47.0, 763.0, 59.0, 18.0, 17.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009474754333496094, -0.0009143128991127014, -0.0008811503648757935, -0.0008479878306388855, -0.0008148252964019775, -0.0007816627621650696, -0.0007485002279281616, -0.0007153376936912537, -0.0006821751594543457, -0.0006490126252174377, -0.0006158500909805298, -0.0005826875567436218, -0.0005495250225067139, -0.0005163624882698059, -0.00048319995403289795, -0.00045003741979599, -0.00041687488555908203, -0.00038371235132217407, -0.0003505498170852661, -0.00031738728284835815, -0.0002842247486114502, -0.00025106221437454224, -0.00021789968013763428, -0.00018473714590072632, -0.00015157461166381836, -0.0001184120774269104, -8.524954319000244e-05, -5.208700895309448e-05, -1.8924474716186523e-05, 1.4238059520721436e-05, 4.7400593757629395e-05, 8.056312799453735e-05, 0.00011372566223144531, 0.00014688819646835327, 0.00018005073070526123, 0.0002132132649421692, 0.00024637579917907715, 0.0002795383334159851, 0.00031270086765289307, 0.000345863401889801, 0.000379025936126709, 0.00041218847036361694, 0.0004453510046005249, 0.00047851353883743286, 0.0005116760730743408, 0.0005448386073112488, 0.0005780011415481567, 0.0006111636757850647, 0.0006443262100219727, 0.0006774887442588806, 0.0007106512784957886, 0.0007438138127326965, 0.0007769763469696045, 0.0008101388812065125, 0.0008433014154434204, 0.0008764639496803284, 0.0009096264839172363, 0.0009427890181541443, 0.0009759515523910522, 0.0010091140866279602, 0.0010422766208648682, 0.0010754391551017761, 0.001108601689338684, 0.001141764223575592, 0.0011749267578125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 14.0, 19.0, 53.0, 131.0, 328.0, 254.0, 88.0, 52.0, 19.0, 13.0, 4.0, 3.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.018651174381375313, -0.018261179327964783, -0.017871186137199402, -0.017481191083788872, -0.01709119603037834, -0.01670120283961296, -0.01631120778620243, -0.01592121459543705, -0.01553121954202652, -0.015141225419938564, -0.014751231297850609, -0.014361236244440079, -0.013971242122352123, -0.013581248000264168, -0.013191252946853638, -0.012801258824765682, -0.012411264702677727, -0.012021270580589771, -0.011631276458501816, -0.011241281405091286, -0.01085128728300333, -0.010461293160915375, -0.010071298107504845, -0.00968130398541689, -0.009291309863328934, -0.008901315741240978, -0.008511321619153023, -0.008121326565742493, -0.007731332443654537, -0.007341338321566582, -0.006951343733817339, -0.006561349146068096, -0.006171355489641428, -0.005781360901892185, -0.00539136677980423, -0.005001372657716274, -0.0046113780699670315, -0.004221383482217789, -0.0038313893601298332, -0.003441395005211234, -0.003051400650292635, -0.002661406295374036, -0.0022714119404554367, -0.0018814175855368376, -0.0014914232306182384, -0.0011014288756996393, -0.0007114345207810402, -0.00032144016586244106, 6.855418905615807e-05, 0.0004585485439747572, 0.0008485428988933563, 0.0012385372538119555, 0.0016285316087305546, 0.0020185259636491537, 0.002408520318567753, 0.002798514673486352, 0.003188509028404951, 0.0035785033833235502, 0.003968497738242149, 0.004358491860330105, 0.004748486448079348, 0.00513848103582859, 0.005528475157916546, 0.005918469280004501, 0.006308463867753744]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 7.0, 5.0, 10.0, 9.0, 11.0, 11.0, 15.0, 27.0, 21.0, 31.0, 22.0, 28.0, 30.0, 26.0, 35.0, 39.0, 45.0, 59.0, 48.0, 49.0, 38.0, 46.0, 47.0, 37.0, 45.0, 33.0, 31.0, 23.0, 26.0, 22.0, 26.0, 22.0, 13.0, 10.0, 11.0, 11.0, 7.0, 2.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0010351123055443168, -0.0010026241652667522, -0.0009701360249891877, -0.0009376478847116232, -0.0009051597444340587, -0.0008726716041564941, -0.0008401835220865905, -0.000807695381809026, -0.0007752072415314615, -0.000742719101253897, -0.0007102309609763324, -0.0006777428206987679, -0.0006452547386288643, -0.0006127665983512998, -0.0005802784580737352, -0.0005477903177961707, -0.0005153021775186062, -0.00048281403724104166, -0.00045032589696347713, -0.00041783778578974307, -0.00038534964551217854, -0.000352861505234614, -0.00032037339406087995, -0.0002878852537833154, -0.0002553971135057509, -0.00022290897322818637, -0.00019042084750253707, -0.00015793272177688777, -0.00012544458149932325, -9.295644122175872e-05, -6.0468315496109426e-05, -2.798018977046013e-05, 4.50783409178257e-06, 3.699596709338948e-05, 6.948410009499639e-05, 0.0001019722330966033, 0.00013446036609821022, 0.00016694850637577474, 0.00019943663210142404, 0.00023192475782707334, 0.00026441289810463786, 0.0002969010383822024, 0.0003293891786597669, 0.000361877289833501, 0.0003943654301110655, 0.00042685357038863003, 0.0004593416815623641, 0.0004918298218399286, 0.0005243179621174932, 0.0005568061023950577, 0.0005892942426726222, 0.0006217823829501867, 0.0006542705232277513, 0.0006867586635053158, 0.0007192467455752194, 0.0007517348858527839, 0.0007842230261303484, 0.000816711166407913, 0.0008491993066854775, 0.000881687446963042, 0.0009141755290329456, 0.0009466636693105102, 0.0009791518095880747, 0.0010116399498656392, 0.0010441280901432037]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 11.0, 6.0, 14.0, 26.0, 28.0, 33.0, 56.0, 65.0, 97.0, 100.0, 190.0, 252.0, 349.0, 532.0, 758.0, 1160.0, 1849.0, 3050.0, 5921.0, 14152.0, 202727.0, 3931184.0, 16459.0, 6381.0, 3309.0, 1960.0, 1185.0, 783.0, 504.0, 326.0, 271.0, 166.0, 123.0, 66.0, 48.0, 42.0, 28.0, 26.0, 12.0, 13.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006389617919921875, -0.006202042102813721, -0.006014466285705566, -0.005826890468597412, -0.005639314651489258, -0.0054517388343811035, -0.005264163017272949, -0.005076587200164795, -0.004889011383056641, -0.004701435565948486, -0.004513859748840332, -0.004326283931732178, -0.0041387081146240234, -0.003951132297515869, -0.003763556480407715, -0.0035759806632995605, -0.0033884048461914062, -0.003200829029083252, -0.0030132532119750977, -0.0028256773948669434, -0.002638101577758789, -0.0024505257606506348, -0.0022629499435424805, -0.002075374126434326, -0.0018877983093261719, -0.0017002224922180176, -0.0015126466751098633, -0.001325070858001709, -0.0011374950408935547, -0.0009499192237854004, -0.0007623434066772461, -0.0005747675895690918, -0.0003871917724609375, -0.0001996159553527832, -1.2040138244628906e-05, 0.0001755356788635254, 0.0003631114959716797, 0.000550687313079834, 0.0007382631301879883, 0.0009258389472961426, 0.0011134147644042969, 0.0013009905815124512, 0.0014885663986206055, 0.0016761422157287598, 0.001863718032836914, 0.0020512938499450684, 0.0022388696670532227, 0.002426445484161377, 0.0026140213012695312, 0.0028015971183776855, 0.00298917293548584, 0.003176748752593994, 0.0033643245697021484, 0.0035519003868103027, 0.003739476203918457, 0.003927052021026611, 0.004114627838134766, 0.00430220365524292, 0.004489779472351074, 0.0046773552894592285, 0.004864931106567383, 0.005052506923675537, 0.005240082740783691, 0.005427658557891846, 0.005615234375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 6.0, 9.0, 15.0, 10.0, 14.0, 17.0, 34.0, 65.0, 86.0, 126.0, 172.0, 129.0, 103.0, 71.0, 29.0, 17.0, 14.0, 14.0, 9.0, 6.0, 3.0, 5.0, 5.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.0005068778991699219, -0.0004943571984767914, -0.0004818364977836609, -0.0004693157970905304, -0.0004567950963973999, -0.0004442743957042694, -0.0004317536950111389, -0.0004192329943180084, -0.00040671229362487793, -0.00039419159293174744, -0.00038167089223861694, -0.00036915019154548645, -0.00035662949085235596, -0.00034410879015922546, -0.00033158808946609497, -0.0003190673887729645, -0.000306546688079834, -0.0002940259873867035, -0.000281505286693573, -0.0002689845860004425, -0.000256463885307312, -0.00024394318461418152, -0.00023142248392105103, -0.00021890178322792053, -0.00020638108253479004, -0.00019386038184165955, -0.00018133968114852905, -0.00016881898045539856, -0.00015629827976226807, -0.00014377757906913757, -0.00013125687837600708, -0.00011873617768287659, -0.0001062154769897461, -9.36947762966156e-05, -8.117407560348511e-05, -6.865337491035461e-05, -5.613267421722412e-05, -4.361197352409363e-05, -3.1091272830963135e-05, -1.857057213783264e-05, -6.0498714447021484e-06, 6.470829248428345e-06, 1.8991529941558838e-05, 3.151223063468933e-05, 4.4032931327819824e-05, 5.655363202095032e-05, 6.907433271408081e-05, 8.15950334072113e-05, 9.41157341003418e-05, 0.00010663643479347229, 0.00011915713548660278, 0.00013167783617973328, 0.00014419853687286377, 0.00015671923756599426, 0.00016923993825912476, 0.00018176063895225525, 0.00019428133964538574, 0.00020680204033851624, 0.00021932274103164673, 0.00023184344172477722, 0.0002443641424179077, 0.0002568848431110382, 0.0002694055438041687, 0.0002819262444972992, 0.0002944469451904297]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 3.0, 19.0, 18.0, 32.0, 46.0, 69.0, 116.0, 181.0, 332.0, 632.0, 1215.0, 2756.0, 8315.0, 56704.0, 4091524.0, 22823.0, 5251.0, 2062.0, 990.0, 467.0, 279.0, 164.0, 117.0, 57.0, 36.0, 23.0, 12.0, 13.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00308990478515625, -0.002991199493408203, -0.0028924942016601562, -0.0027937889099121094, -0.0026950836181640625, -0.0025963783264160156, -0.0024976730346679688, -0.002398967742919922, -0.002300262451171875, -0.002201557159423828, -0.0021028518676757812, -0.0020041465759277344, -0.0019054412841796875, -0.0018067359924316406, -0.0017080307006835938, -0.0016093254089355469, -0.0015106201171875, -0.0014119148254394531, -0.0013132095336914062, -0.0012145042419433594, -0.0011157989501953125, -0.0010170936584472656, -0.0009183883666992188, -0.0008196830749511719, -0.000720977783203125, -0.0006222724914550781, -0.0005235671997070312, -0.0004248619079589844, -0.0003261566162109375, -0.00022745132446289062, -0.00012874603271484375, -3.0040740966796875e-05, 6.866455078125e-05, 0.00016736984252929688, 0.00026607513427734375, 0.0003647804260253906, 0.0004634857177734375, 0.0005621910095214844, 0.0006608963012695312, 0.0007596015930175781, 0.000858306884765625, 0.0009570121765136719, 0.0010557174682617188, 0.0011544227600097656, 0.0012531280517578125, 0.0013518333435058594, 0.0014505386352539062, 0.0015492439270019531, 0.00164794921875, 0.0017466545104980469, 0.0018453598022460938, 0.0019440650939941406, 0.0020427703857421875, 0.0021414756774902344, 0.0022401809692382812, 0.002338886260986328, 0.002437591552734375, 0.002536296844482422, 0.0026350021362304688, 0.0027337074279785156, 0.0028324127197265625, 0.0029311180114746094, 0.0030298233032226562, 0.003128528594970703, 0.00322723388671875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 7.0, 17.0, 25.0, 43.0, 355.0, 3456.0, 85.0, 27.0, 13.0, 13.0, 5.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008959770202636719, -0.0008673444390296936, -0.0008387118577957153, -0.0008100792765617371, -0.0007814466953277588, -0.0007528141140937805, -0.0007241815328598022, -0.000695548951625824, -0.0006669163703918457, -0.0006382837891578674, -0.0006096512079238892, -0.0005810186266899109, -0.0005523860454559326, -0.0005237534642219543, -0.0004951208829879761, -0.0004664883017539978, -0.00043785572052001953, -0.00040922313928604126, -0.000380590558052063, -0.0003519579768180847, -0.00032332539558410645, -0.0002946928143501282, -0.0002660602331161499, -0.00023742765188217163, -0.00020879507064819336, -0.0001801624894142151, -0.00015152990818023682, -0.00012289732694625854, -9.426474571228027e-05, -6.5632164478302e-05, -3.699958324432373e-05, -8.367002010345459e-06, 2.0265579223632812e-05, 4.8898160457611084e-05, 7.753074169158936e-05, 0.00010616332292556763, 0.0001347959041595459, 0.00016342848539352417, 0.00019206106662750244, 0.0002206936478614807, 0.000249326229095459, 0.00027795881032943726, 0.00030659139156341553, 0.0003352239727973938, 0.00036385655403137207, 0.00039248913526535034, 0.0004211217164993286, 0.0004497542977333069, 0.00047838687896728516, 0.0005070194602012634, 0.0005356520414352417, 0.00056428462266922, 0.0005929172039031982, 0.0006215497851371765, 0.0006501823663711548, 0.0006788149476051331, 0.0007074475288391113, 0.0007360801100730896, 0.0007647126913070679, 0.0007933452725410461, 0.0008219778537750244, 0.0008506104350090027, 0.000879243016242981, 0.0009078755974769592, 0.0009365081787109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 7.0, 6.0, 14.0, 21.0, 34.0, 44.0, 55.0, 110.0, 167.0, 201.0, 118.0, 66.0, 49.0, 30.0, 23.0, 12.0, 13.0, 11.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019940270576626062, -0.001944428775459528, -0.0018948304932564497, -0.0018452322110533714, -0.0017956339288502932, -0.0017460356466472149, -0.0016964373644441366, -0.0016468390822410583, -0.00159724080003798, -0.0015476425178349018, -0.0014980442356318235, -0.0014484459534287453, -0.001398847671225667, -0.0013492493890225887, -0.0012996511068195105, -0.0012500528246164322, -0.001200454542413354, -0.0011508562602102757, -0.0011012579780071974, -0.0010516596958041191, -0.0010020614136010408, -0.0009524631313979626, -0.0009028648491948843, -0.000853266566991806, -0.0008036684012040496, -0.0007540701190009713, -0.000704471836797893, -0.0006548735545948148, -0.0006052752723917365, -0.0005556769901886582, -0.00050607870798558, -0.00045648045488633215, -0.00040688214357942343, -0.00035728386137634516, -0.0003076855791732669, -0.0002580872969701886, -0.00020848902931902558, -0.00015889076166786253, -0.00010929247946478426, -5.9694197261705995e-05, -1.0095915058627725e-05, 3.950236350647174e-05, 8.91006420715712e-05, 0.00013869891699869186, 0.00018829719920177013, 0.00023789546685293317, 0.00028749374905601144, 0.0003370920312590897, 0.000386690313462168, 0.00043628859566524625, 0.0004858868778683245, 0.0005354851600714028, 0.0005850834422744811, 0.0006346816662698984, 0.0006842799484729767, 0.000733878230676055, 0.0007834765128791332, 0.0008330747950822115, 0.0008826730772852898, 0.000932271359488368, 0.0009818696416914463, 0.0010314679238945246, 0.0010810662060976028, 0.0011306644883006811, 0.0011802627705037594]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 15.0, 12.0, 11.0, 19.0, 16.0, 26.0, 18.0, 24.0, 26.0, 26.0, 34.0, 36.0, 40.0, 56.0, 33.0, 51.0, 37.0, 42.0, 48.0, 45.0, 45.0, 43.0, 45.0, 29.0, 27.0, 19.0, 19.0, 27.0, 21.0, 18.0, 17.0, 12.0, 12.0, 5.0, 9.0, 7.0, 3.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00046261108946055174, -0.00044712526141665876, -0.0004316394333727658, -0.00041615357622504234, -0.00040066774818114936, -0.0003851819201372564, -0.00036969606298953295, -0.00035421023494563997, -0.000338724406901747, -0.000323238578857854, -0.00030775275081396103, -0.0002922668936662376, -0.0002767810656223446, -0.00026129523757845163, -0.0002458093804307282, -0.00023032355238683522, -0.00021483772434294224, -0.00019935189629904926, -0.00018386605370324105, -0.00016838021110743284, -0.00015289438306353986, -0.00013740855501964688, -0.00012192271242383868, -0.00010643687710398808, -9.095104178413749e-05, -7.54652064642869e-05, -5.99793711444363e-05, -4.4493535824585706e-05, -2.9007700504735112e-05, -1.3521865184884518e-05, 1.9639701349660754e-06, 1.744980545481667e-05, 3.2935698982328176e-05, 4.842153430217877e-05, 6.390736962202936e-05, 7.939320494187996e-05, 9.487904026173055e-05, 0.00011036487558158115, 0.00012585071090143174, 0.00014133655349723995, 0.00015682238154113293, 0.0001723082095850259, 0.00018779405218083411, 0.00020327989477664232, 0.0002187657228205353, 0.00023425155086442828, 0.0002497374080121517, 0.0002652232360560447, 0.0002807090640999377, 0.00029619489214383066, 0.00031168072018772364, 0.0003271665773354471, 0.00034265240537934005, 0.00035813823342323303, 0.00037362409057095647, 0.00038910991861484945, 0.00040459574665874243, 0.0004200815747026354, 0.0004355674027465284, 0.0004510532598942518, 0.0004665390879381448, 0.0004820249159820378, 0.0004975107731297612, 0.0005129965720698237, 0.0005284824292175472]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 1.0, 8.0, 7.0, 9.0, 18.0, 16.0, 27.0, 29.0, 49.0, 81.0, 135.0, 154.0, 322.0, 657.0, 1382.0, 3587.0, 11138.0, 47034.0, 433784.0, 485835.0, 46503.0, 11223.0, 3594.0, 1408.0, 667.0, 318.0, 181.0, 123.0, 88.0, 44.0, 36.0, 22.0, 22.0, 15.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.600950241088867e-05, -8.33217054605484e-05, -8.063390851020813e-05, -7.794611155986786e-05, -7.525831460952759e-05, -7.257051765918732e-05, -6.988272070884705e-05, -6.719492375850677e-05, -6.45071268081665e-05, -6.181932985782623e-05, -5.913153290748596e-05, -5.644373595714569e-05, -5.375593900680542e-05, -5.106814205646515e-05, -4.838034510612488e-05, -4.569254815578461e-05, -4.3004751205444336e-05, -4.0316954255104065e-05, -3.7629157304763794e-05, -3.494136035442352e-05, -3.225356340408325e-05, -2.956576645374298e-05, -2.687796950340271e-05, -2.419017255306244e-05, -2.1502375602722168e-05, -1.8814578652381897e-05, -1.6126781702041626e-05, -1.3438984751701355e-05, -1.0751187801361084e-05, -8.063390851020813e-06, -5.375593900680542e-06, -2.687796950340271e-06, 0.0, 2.687796950340271e-06, 5.375593900680542e-06, 8.063390851020813e-06, 1.0751187801361084e-05, 1.3438984751701355e-05, 1.6126781702041626e-05, 1.8814578652381897e-05, 2.1502375602722168e-05, 2.419017255306244e-05, 2.687796950340271e-05, 2.956576645374298e-05, 3.225356340408325e-05, 3.494136035442352e-05, 3.7629157304763794e-05, 4.0316954255104065e-05, 4.3004751205444336e-05, 4.569254815578461e-05, 4.838034510612488e-05, 5.106814205646515e-05, 5.375593900680542e-05, 5.644373595714569e-05, 5.913153290748596e-05, 6.181932985782623e-05, 6.45071268081665e-05, 6.719492375850677e-05, 6.988272070884705e-05, 7.257051765918732e-05, 7.525831460952759e-05, 7.794611155986786e-05, 8.063390851020813e-05, 8.33217054605484e-05, 8.600950241088867e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 4.0, 1.0, 2.0, 6.0, 10.0, 13.0, 14.0, 17.0, 21.0, 21.0, 33.0, 34.0, 30.0, 33.0, 45.0, 56.0, 45.0, 52.0, 55.0, 52.0, 49.0, 65.0, 50.0, 48.0, 30.0, 31.0, 23.0, 33.0, 22.0, 20.0, 14.0, 11.0, 19.0, 8.0, 6.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00045609474182128906, -0.0004422590136528015, -0.00042842328548431396, -0.0004145875573158264, -0.00040075182914733887, -0.0003869161009788513, -0.00037308037281036377, -0.0003592446446418762, -0.00034540891647338867, -0.0003315731883049011, -0.0003177374601364136, -0.000303901731967926, -0.0002900660037994385, -0.00027623027563095093, -0.0002623945474624634, -0.00024855881929397583, -0.00023472309112548828, -0.00022088736295700073, -0.00020705163478851318, -0.00019321590662002563, -0.00017938017845153809, -0.00016554445028305054, -0.000151708722114563, -0.00013787299394607544, -0.0001240372657775879, -0.00011020153760910034, -9.636580944061279e-05, -8.253008127212524e-05, -6.86943531036377e-05, -5.4858624935150146e-05, -4.10228967666626e-05, -2.718716859817505e-05, -1.33514404296875e-05, 4.842877388000488e-07, 1.4320015907287598e-05, 2.8155744075775146e-05, 4.1991472244262695e-05, 5.5827200412750244e-05, 6.966292858123779e-05, 8.349865674972534e-05, 9.733438491821289e-05, 0.00011117011308670044, 0.000125005841255188, 0.00013884156942367554, 0.00015267729759216309, 0.00016651302576065063, 0.00018034875392913818, 0.00019418448209762573, 0.00020802021026611328, 0.00022185593843460083, 0.00023569166660308838, 0.00024952739477157593, 0.0002633631229400635, 0.000277198851108551, 0.0002910345792770386, 0.0003048703074455261, 0.00031870603561401367, 0.0003325417637825012, 0.00034637749195098877, 0.0003602132201194763, 0.00037404894828796387, 0.0003878846764564514, 0.00040172040462493896, 0.0004155561327934265, 0.00042939186096191406]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 16.0, 16.0, 17.0, 31.0, 44.0, 58.0, 84.0, 127.0, 197.0, 445.0, 1479.0, 7014.0, 71165.0, 895888.0, 62867.0, 6505.0, 1504.0, 450.0, 210.0, 128.0, 78.0, 58.0, 47.0, 29.0, 31.0, 12.0, 10.0, 7.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0187110900878906e-05, -4.8772431910037994e-05, -4.735775291919708e-05, -4.594307392835617e-05, -4.452839493751526e-05, -4.311371594667435e-05, -4.1699036955833435e-05, -4.028435796499252e-05, -3.886967897415161e-05, -3.74549999833107e-05, -3.604032099246979e-05, -3.4625642001628876e-05, -3.3210963010787964e-05, -3.179628401994705e-05, -3.038160502910614e-05, -2.8966926038265228e-05, -2.7552247047424316e-05, -2.6137568056583405e-05, -2.4722889065742493e-05, -2.330821007490158e-05, -2.189353108406067e-05, -2.0478852093219757e-05, -1.9064173102378845e-05, -1.7649494111537933e-05, -1.623481512069702e-05, -1.482013612985611e-05, -1.3405457139015198e-05, -1.1990778148174286e-05, -1.0576099157333374e-05, -9.161420166492462e-06, -7.74674117565155e-06, -6.3320621848106384e-06, -4.9173831939697266e-06, -3.5027042031288147e-06, -2.088025212287903e-06, -6.73346221446991e-07, 7.413327693939209e-07, 2.1560117602348328e-06, 3.5706907510757446e-06, 4.9853697419166565e-06, 6.400048732757568e-06, 7.81472772359848e-06, 9.229406714439392e-06, 1.0644085705280304e-05, 1.2058764696121216e-05, 1.3473443686962128e-05, 1.488812267780304e-05, 1.630280166864395e-05, 1.7717480659484863e-05, 1.9132159650325775e-05, 2.0546838641166687e-05, 2.19615176320076e-05, 2.337619662284851e-05, 2.4790875613689423e-05, 2.6205554604530334e-05, 2.7620233595371246e-05, 2.9034912586212158e-05, 3.044959157705307e-05, 3.186427056789398e-05, 3.3278949558734894e-05, 3.4693628549575806e-05, 3.610830754041672e-05, 3.752298653125763e-05, 3.893766552209854e-05, 4.035234451293945e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 11.0, 11.0, 14.0, 15.0, 22.0, 24.0, 28.0, 36.0, 49.0, 56.0, 61.0, 75.0, 54.0, 77.0, 66.0, 57.0, 55.0, 62.0, 43.0, 33.0, 29.0, 28.0, 24.0, 13.0, 14.0, 6.0, 9.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012750625610351562, -0.001238986849784851, -0.001202911138534546, -0.0011668354272842407, -0.0011307597160339355, -0.0010946840047836304, -0.0010586082935333252, -0.00102253258228302, -0.0009864568710327148, -0.0009503811597824097, -0.0009143054485321045, -0.0008782297372817993, -0.0008421540260314941, -0.000806078314781189, -0.0007700026035308838, -0.0007339268922805786, -0.0006978511810302734, -0.0006617754697799683, -0.0006256997585296631, -0.0005896240472793579, -0.0005535483360290527, -0.0005174726247787476, -0.0004813969135284424, -0.0004453212022781372, -0.00040924549102783203, -0.00037316977977752686, -0.0003370940685272217, -0.0003010183572769165, -0.00026494264602661133, -0.00022886693477630615, -0.00019279122352600098, -0.0001567155122756958, -0.00012063980102539062, -8.456408977508545e-05, -4.8488378524780273e-05, -1.2412667274475098e-05, 2.3663043975830078e-05, 5.9738755226135254e-05, 9.581446647644043e-05, 0.0001318901777267456, 0.00016796588897705078, 0.00020404160022735596, 0.00024011731147766113, 0.0002761930227279663, 0.0003122687339782715, 0.00034834444522857666, 0.00038442015647888184, 0.000420495867729187, 0.0004565715789794922, 0.0004926472902297974, 0.0005287230014801025, 0.0005647987127304077, 0.0006008744239807129, 0.0006369501352310181, 0.0006730258464813232, 0.0007091015577316284, 0.0007451772689819336, 0.0007812529802322388, 0.0008173286914825439, 0.0008534044027328491, 0.0008894801139831543, 0.0009255558252334595, 0.0009616315364837646, 0.0009977072477340698, 0.001033782958984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1795.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1045010.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1754.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 50.0, 0.0, 0.0, 81.0, 0.0, 0.0, 118.0, 0.0, 0.0, 133.0, 0.0, 0.0, 0.0, 168.0, 0.0, 0.0, 142.0, 0.0, 0.0, 113.0, 0.0, 0.0, 89.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 10.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 221.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048055.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 234.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3189932107925415e-07, -2.253800630569458e-07, -2.1886080503463745e-07, -2.123415470123291e-07, -2.0582228899002075e-07, -1.993030309677124e-07, -1.9278377294540405e-07, -1.862645149230957e-07, -1.7974525690078735e-07, -1.73225998878479e-07, -1.6670674085617065e-07, -1.601874828338623e-07, -1.5366822481155396e-07, -1.471489667892456e-07, -1.4062970876693726e-07, -1.341104507446289e-07, -1.2759119272232056e-07, -1.210719347000122e-07, -1.1455267667770386e-07, -1.0803341865539551e-07, -1.0151416063308716e-07, -9.499490261077881e-08, -8.847564458847046e-08, -8.195638656616211e-08, -7.543712854385376e-08, -6.891787052154541e-08, -6.239861249923706e-08, -5.587935447692871e-08, -4.936009645462036e-08, -4.284083843231201e-08, -3.632158041000366e-08, -2.9802322387695312e-08, -2.3283064365386963e-08, -1.6763806343078613e-08, -1.0244548320770264e-08, -3.725290298461914e-09, 2.7939677238464355e-09, 9.313225746154785e-09, 1.5832483768463135e-08, 2.2351741790771484e-08, 2.8870999813079834e-08, 3.5390257835388184e-08, 4.190951585769653e-08, 4.842877388000488e-08, 5.494803190231323e-08, 6.146728992462158e-08, 6.798654794692993e-08, 7.450580596923828e-08, 8.102506399154663e-08, 8.754432201385498e-08, 9.406358003616333e-08, 1.0058283805847168e-07, 1.0710209608078003e-07, 1.1362135410308838e-07, 1.2014061212539673e-07, 1.2665987014770508e-07, 1.3317912817001343e-07, 1.3969838619232178e-07, 1.4621764421463013e-07, 1.5273690223693848e-07, 1.5925616025924683e-07, 1.6577541828155518e-07, 1.7229467630386353e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 8.0, 6.0, 13.0, 22.0, 27.0, 38.0, 68.0, 83.0, 136.0, 197.0, 131.0, 78.0, 47.0, 46.0, 25.0, 18.0, 9.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009596081217750907, -0.0009332785266451538, -0.0009069489315152168, -0.0008806193945929408, -0.0008542897994630039, -0.0008279602043330669, -0.0008016306674107909, -0.000775301072280854, -0.000748971477150917, -0.0007226418820209801, -0.0006963122868910432, -0.0006699827499687672, -0.0006436531548388302, -0.0006173235597088933, -0.0005909940227866173, -0.0005646644276566803, -0.0005383348325267434, -0.0005120052373968065, -0.0004856756713707, -0.0004593461053445935, -0.0004330165102146566, -0.00040668691508471966, -0.0003803573490586132, -0.0003540277830325067, -0.00032769818790256977, -0.00030136859277263284, -0.00027503902674652636, -0.0002487094607204199, -0.00022237986559048295, -0.00019605028501246125, -0.00016972070443443954, -0.00014339112385641783, -0.00011706154327839613, -9.073196270037442e-05, -6.440238212235272e-05, -3.8072801544331014e-05, -1.1743220966309309e-05, 1.4586359611712396e-05, 4.09159401897341e-05, 6.72455207677558e-05, 9.357510134577751e-05, 0.00011990468192379922, 0.00014623426250182092, 0.00017256384307984263, 0.00019889342365786433, 0.00022522300423588604, 0.00025155258481390774, 0.0002778821508400142, 0.00030421174596995115, 0.0003305413410998881, 0.00035687090712599456, 0.00038320047315210104, 0.000409530068282038, 0.0004358596634119749, 0.0004621892294380814, 0.0004885187954641879, 0.0005148483905941248, 0.0005411779857240617, 0.0005675075808539987, 0.0005938371177762747, 0.0006201667129062116, 0.0006464963080361485, 0.0006728258449584246, 0.0006991554400883615, 0.0007254850352182984]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 13.0, 8.0, 16.0, 15.0, 23.0, 21.0, 24.0, 21.0, 33.0, 33.0, 36.0, 46.0, 47.0, 40.0, 58.0, 35.0, 47.0, 46.0, 51.0, 56.0, 44.0, 40.0, 34.0, 26.0, 28.0, 17.0, 24.0, 22.0, 22.0, 13.0, 10.0, 9.0, 11.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003391556965652853, -0.0003294508787803352, -0.0003197460318915546, -0.00031004121410660446, -0.00030033636721782386, -0.0002906315494328737, -0.00028092670254409313, -0.000271221884759143, -0.00026151706697419286, -0.0002518122491892427, -0.00024210740230046213, -0.00023240256996359676, -0.0002226977376267314, -0.00021299291984178126, -0.0002032880875049159, -0.00019358325516805053, -0.00018387840827926993, -0.00017417357594240457, -0.0001644687436055392, -0.00015476391126867384, -0.00014505907893180847, -0.00013535426114685833, -0.00012564942880999297, -0.0001159445964731276, -0.00010623976413626224, -9.653493179939687e-05, -8.683009946253151e-05, -7.712527440162376e-05, -6.742044206475839e-05, -5.7715609727893025e-05, -4.8010781029006466e-05, -3.830595233011991e-05, -2.8601149097085e-05, -1.8896318579209037e-05, -9.191488061333075e-06, 5.133424565428868e-07, 1.0218172974418849e-05, 1.9923005311284214e-05, 2.9627834010170773e-05, 3.933266270905733e-05, 4.9037495045922697e-05, 5.874232738278806e-05, 6.844715971965343e-05, 7.815198478056118e-05, 8.785681711742654e-05, 9.756164945429191e-05, 0.00010726647451519966, 0.00011697130685206503, 0.0001266761391889304, 0.00013638097152579576, 0.00014608580386266112, 0.0001557906361995265, 0.00016549546853639185, 0.000175200286321342, 0.00018490511865820736, 0.00019460995099507272, 0.0002043147833319381, 0.00021401961566880345, 0.00022372444800566882, 0.00023342928034253418, 0.00024313409812748432, 0.0002528389450162649, 0.00026254376280121505, 0.0002722485805861652, 0.0002819534274749458]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 7.0, 10.0, 23.0, 15.0, 50.0, 50.0, 109.0, 182.0, 277.0, 465.0, 780.0, 1309.0, 2312.0, 4168.0, 7802.0, 15783.0, 33543.0, 80759.0, 265075.0, 439663.0, 111618.0, 43419.0, 19711.0, 9677.0, 5088.0, 2796.0, 1570.0, 876.0, 561.0, 313.0, 199.0, 119.0, 73.0, 46.0, 31.0, 20.0, 12.0, 11.0, 6.0, 4.0, 4.0, 0.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00045680999755859375, -0.00044214725494384766, -0.00042748451232910156, -0.00041282176971435547, -0.0003981590270996094, -0.0003834962844848633, -0.0003688335418701172, -0.0003541707992553711, -0.000339508056640625, -0.0003248453140258789, -0.0003101825714111328, -0.0002955198287963867, -0.0002808570861816406, -0.00026619434356689453, -0.00025153160095214844, -0.00023686885833740234, -0.00022220611572265625, -0.00020754337310791016, -0.00019288063049316406, -0.00017821788787841797, -0.00016355514526367188, -0.00014889240264892578, -0.0001342296600341797, -0.0001195669174194336, -0.0001049041748046875, -9.02414321899414e-05, -7.557868957519531e-05, -6.091594696044922e-05, -4.6253204345703125e-05, -3.159046173095703e-05, -1.6927719116210938e-05, -2.2649765014648438e-06, 1.239776611328125e-05, 2.7060508728027344e-05, 4.172325134277344e-05, 5.638599395751953e-05, 7.104873657226562e-05, 8.571147918701172e-05, 0.00010037422180175781, 0.0001150369644165039, 0.00012969970703125, 0.0001443624496459961, 0.0001590251922607422, 0.00017368793487548828, 0.00018835067749023438, 0.00020301342010498047, 0.00021767616271972656, 0.00023233890533447266, 0.00024700164794921875, 0.00026166439056396484, 0.00027632713317871094, 0.00029098987579345703, 0.0003056526184082031, 0.0003203153610229492, 0.0003349781036376953, 0.0003496408462524414, 0.0003643035888671875, 0.0003789663314819336, 0.0003936290740966797, 0.0004082918167114258, 0.0004229545593261719, 0.00043761730194091797, 0.00045228004455566406, 0.00046694278717041016, 0.00048160552978515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 10.0, 15.0, 24.0, 25.0, 31.0, 37.0, 41.0, 38.0, 67.0, 64.0, 78.0, 84.0, 65.0, 56.0, 64.0, 65.0, 38.0, 39.0, 28.0, 31.0, 23.0, 18.0, 10.0, 14.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152557373046875e-05, -6.940308958292007e-05, -6.72806054353714e-05, -6.515812128782272e-05, -6.303563714027405e-05, -6.091315299272537e-05, -5.87906688451767e-05, -5.666818469762802e-05, -5.4545700550079346e-05, -5.242321640253067e-05, -5.0300732254981995e-05, -4.817824810743332e-05, -4.6055763959884644e-05, -4.393327981233597e-05, -4.181079566478729e-05, -3.968831151723862e-05, -3.756582736968994e-05, -3.5443343222141266e-05, -3.332085907459259e-05, -3.1198374927043915e-05, -2.907589077949524e-05, -2.6953406631946564e-05, -2.4830922484397888e-05, -2.2708438336849213e-05, -2.0585954189300537e-05, -1.846347004175186e-05, -1.6340985894203186e-05, -1.421850174665451e-05, -1.2096017599105835e-05, -9.97353345155716e-06, -7.851049304008484e-06, -5.728565156459808e-06, -3.606081008911133e-06, -1.4835968613624573e-06, 6.388872861862183e-07, 2.761371433734894e-06, 4.883855581283569e-06, 7.006339728832245e-06, 9.12882387638092e-06, 1.1251308023929596e-05, 1.3373792171478271e-05, 1.5496276319026947e-05, 1.7618760466575623e-05, 1.9741244614124298e-05, 2.1863728761672974e-05, 2.398621290922165e-05, 2.6108697056770325e-05, 2.8231181204319e-05, 3.0353665351867676e-05, 3.247614949941635e-05, 3.459863364696503e-05, 3.67211177945137e-05, 3.884360194206238e-05, 4.0966086089611053e-05, 4.308857023715973e-05, 4.5211054384708405e-05, 4.733353853225708e-05, 4.9456022679805756e-05, 5.157850682735443e-05, 5.370099097490311e-05, 5.582347512245178e-05, 5.794595927000046e-05, 6.006844341754913e-05, 6.219092756509781e-05, 6.431341171264648e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 9.0, 2.0, 5.0, 16.0, 17.0, 22.0, 43.0, 51.0, 103.0, 151.0, 220.0, 325.0, 491.0, 791.0, 1329.0, 2105.0, 3390.0, 5709.0, 9654.0, 17482.0, 32535.0, 65874.0, 159228.0, 424288.0, 177037.0, 69703.0, 34441.0, 18277.0, 10142.0, 5849.0, 3384.0, 2188.0, 1301.0, 846.0, 535.0, 340.0, 228.0, 146.0, 110.0, 52.0, 44.0, 37.0, 33.0, 4.0, 10.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00015056133270263672, -0.00014578737318515778, -0.00014101341366767883, -0.0001362394541501999, -0.00013146549463272095, -0.000126691535115242, -0.00012191757559776306, -0.00011714361608028412, -0.00011236965656280518, -0.00010759569704532623, -0.00010282173752784729, -9.804777801036835e-05, -9.32738184928894e-05, -8.849985897541046e-05, -8.372589945793152e-05, -7.895193994045258e-05, -7.417798042297363e-05, -6.940402090549469e-05, -6.463006138801575e-05, -5.9856101870536804e-05, -5.508214235305786e-05, -5.030818283557892e-05, -4.5534223318099976e-05, -4.076026380062103e-05, -3.598630428314209e-05, -3.121234476566315e-05, -2.6438385248184204e-05, -2.166442573070526e-05, -1.689046621322632e-05, -1.2116506695747375e-05, -7.342547178268433e-06, -2.5685876607894897e-06, 2.205371856689453e-06, 6.979331374168396e-06, 1.1753290891647339e-05, 1.6527250409126282e-05, 2.1301209926605225e-05, 2.6075169444084167e-05, 3.084912896156311e-05, 3.562308847904205e-05, 4.0397047996520996e-05, 4.517100751399994e-05, 4.994496703147888e-05, 5.4718926548957825e-05, 5.949288606643677e-05, 6.426684558391571e-05, 6.904080510139465e-05, 7.38147646188736e-05, 7.858872413635254e-05, 8.336268365383148e-05, 8.813664317131042e-05, 9.291060268878937e-05, 9.768456220626831e-05, 0.00010245852172374725, 0.0001072324812412262, 0.00011200644075870514, 0.00011678040027618408, 0.00012155435979366302, 0.00012632831931114197, 0.0001311022788286209, 0.00013587623834609985, 0.0001406501978635788, 0.00014542415738105774, 0.00015019811689853668, 0.00015497207641601562]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 10.0, 7.0, 13.0, 11.0, 18.0, 22.0, 27.0, 31.0, 36.0, 46.0, 40.0, 43.0, 64.0, 54.0, 61.0, 72.0, 55.0, 52.0, 39.0, 39.0, 48.0, 33.0, 34.0, 32.0, 22.0, 15.0, 17.0, 16.0, 7.0, 5.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.566545486450195e-05, -9.248219430446625e-05, -8.929893374443054e-05, -8.611567318439484e-05, -8.293241262435913e-05, -7.974915206432343e-05, -7.656589150428772e-05, -7.338263094425201e-05, -7.019937038421631e-05, -6.70161098241806e-05, -6.38328492641449e-05, -6.064958870410919e-05, -5.7466328144073486e-05, -5.428306758403778e-05, -5.1099807024002075e-05, -4.791654646396637e-05, -4.4733285903930664e-05, -4.155002534389496e-05, -3.836676478385925e-05, -3.518350422382355e-05, -3.200024366378784e-05, -2.8816983103752136e-05, -2.563372254371643e-05, -2.2450461983680725e-05, -1.926720142364502e-05, -1.6083940863609314e-05, -1.2900680303573608e-05, -9.717419743537903e-06, -6.534159183502197e-06, -3.3508986234664917e-06, -1.6763806343078613e-07, 3.0156224966049194e-06, 6.198883056640625e-06, 9.38214361667633e-06, 1.2565404176712036e-05, 1.5748664736747742e-05, 1.8931925296783447e-05, 2.2115185856819153e-05, 2.529844641685486e-05, 2.8481706976890564e-05, 3.166496753692627e-05, 3.4848228096961975e-05, 3.803148865699768e-05, 4.1214749217033386e-05, 4.439800977706909e-05, 4.75812703371048e-05, 5.07645308971405e-05, 5.394779145717621e-05, 5.7131052017211914e-05, 6.031431257724762e-05, 6.349757313728333e-05, 6.668083369731903e-05, 6.986409425735474e-05, 7.304735481739044e-05, 7.623061537742615e-05, 7.941387593746185e-05, 8.259713649749756e-05, 8.578039705753326e-05, 8.896365761756897e-05, 9.214691817760468e-05, 9.533017873764038e-05, 9.851343929767609e-05, 0.00010169669985771179, 0.0001048799604177475, 0.0001080632209777832]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 12.0, 6.0, 11.0, 16.0, 20.0, 23.0, 35.0, 43.0, 33.0, 63.0, 82.0, 120.0, 133.0, 157.0, 245.0, 336.0, 687.0, 1311.0, 3429.0, 16250.0, 972670.0, 43097.0, 5649.0, 1703.0, 848.0, 420.0, 322.0, 174.0, 120.0, 115.0, 110.0, 62.0, 45.0, 34.0, 26.0, 38.0, 24.0, 18.0, 11.0, 12.0, 9.0, 9.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00013971328735351562, -0.00013556517660617828, -0.00013141706585884094, -0.0001272689551115036, -0.00012312084436416626, -0.00011897273361682892, -0.00011482462286949158, -0.00011067651212215424, -0.0001065284013748169, -0.00010238029062747955, -9.823217988014221e-05, -9.408406913280487e-05, -8.993595838546753e-05, -8.578784763813019e-05, -8.163973689079285e-05, -7.74916261434555e-05, -7.334351539611816e-05, -6.919540464878082e-05, -6.504729390144348e-05, -6.089918315410614e-05, -5.67510724067688e-05, -5.260296165943146e-05, -4.8454850912094116e-05, -4.4306740164756775e-05, -4.0158629417419434e-05, -3.601051867008209e-05, -3.186240792274475e-05, -2.771429717540741e-05, -2.356618642807007e-05, -1.9418075680732727e-05, -1.5269964933395386e-05, -1.1121854186058044e-05, -6.973743438720703e-06, -2.825632691383362e-06, 1.3224780559539795e-06, 5.470588803291321e-06, 9.618699550628662e-06, 1.3766810297966003e-05, 1.7914921045303345e-05, 2.2063031792640686e-05, 2.6211142539978027e-05, 3.035925328731537e-05, 3.450736403465271e-05, 3.865547478199005e-05, 4.280358552932739e-05, 4.6951696276664734e-05, 5.1099807024002075e-05, 5.5247917771339417e-05, 5.939602851867676e-05, 6.35441392660141e-05, 6.769225001335144e-05, 7.184036076068878e-05, 7.598847150802612e-05, 8.013658225536346e-05, 8.42846930027008e-05, 8.843280375003815e-05, 9.258091449737549e-05, 9.672902524471283e-05, 0.00010087713599205017, 0.00010502524673938751, 0.00010917335748672485, 0.0001133214682340622, 0.00011746957898139954, 0.00012161768972873688, 0.00012576580047607422]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 179.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 607.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 202.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 4.0, 9.0, 13.0, 9.0, 14.0, 34.0, 46.0, 55.0, 59.0, 66.0, 103.0, 150.0, 198.0, 229.0, 338.0, 436.0, 662.0, 1049.0, 1828.0, 3623.0, 9587.0, 45866.0, 910043.0, 53863.0, 10848.0, 3972.0, 1952.0, 1111.0, 701.0, 439.0, 316.0, 240.0, 166.0, 126.0, 108.0, 75.0, 59.0, 35.0, 25.0, 27.0, 21.0, 14.0, 12.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.589557647705078e-05, -4.428718239068985e-05, -4.267878830432892e-05, -4.107039421796799e-05, -3.9462000131607056e-05, -3.7853606045246124e-05, -3.624521195888519e-05, -3.463681787252426e-05, -3.302842378616333e-05, -3.14200296998024e-05, -2.9811635613441467e-05, -2.8203241527080536e-05, -2.6594847440719604e-05, -2.4986453354358673e-05, -2.3378059267997742e-05, -2.176966518163681e-05, -2.016127109527588e-05, -1.8552877008914948e-05, -1.6944482922554016e-05, -1.5336088836193085e-05, -1.3727694749832153e-05, -1.2119300663471222e-05, -1.051090657711029e-05, -8.902512490749359e-06, -7.294118404388428e-06, -5.685724318027496e-06, -4.077330231666565e-06, -2.4689361453056335e-06, -8.605420589447021e-07, 7.478520274162292e-07, 2.3562461137771606e-06, 3.964640200138092e-06, 5.5730342864990234e-06, 7.181428372859955e-06, 8.789822459220886e-06, 1.0398216545581818e-05, 1.2006610631942749e-05, 1.361500471830368e-05, 1.5223398804664612e-05, 1.6831792891025543e-05, 1.8440186977386475e-05, 2.0048581063747406e-05, 2.1656975150108337e-05, 2.326536923646927e-05, 2.48737633228302e-05, 2.648215740919113e-05, 2.8090551495552063e-05, 2.9698945581912994e-05, 3.1307339668273926e-05, 3.291573375463486e-05, 3.452412784099579e-05, 3.613252192735672e-05, 3.774091601371765e-05, 3.934931010007858e-05, 4.0957704186439514e-05, 4.2566098272800446e-05, 4.417449235916138e-05, 4.578288644552231e-05, 4.739128053188324e-05, 4.899967461824417e-05, 5.06080687046051e-05, 5.2216462790966034e-05, 5.3824856877326965e-05, 5.54332509636879e-05, 5.704164505004883e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 21.0, 26.0, 47.0, 95.0, 501.0, 186.0, 37.0, 36.0, 10.0, 4.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0279159545898438e-05, -2.922210842370987e-05, -2.81650573015213e-05, -2.7108006179332733e-05, -2.6050955057144165e-05, -2.4993903934955597e-05, -2.393685281276703e-05, -2.287980169057846e-05, -2.1822750568389893e-05, -2.0765699446201324e-05, -1.9708648324012756e-05, -1.8651597201824188e-05, -1.759454607963562e-05, -1.6537494957447052e-05, -1.5480443835258484e-05, -1.4423392713069916e-05, -1.3366341590881348e-05, -1.230929046869278e-05, -1.1252239346504211e-05, -1.0195188224315643e-05, -9.138137102127075e-06, -8.081085979938507e-06, -7.024034857749939e-06, -5.966983735561371e-06, -4.909932613372803e-06, -3.852881491184235e-06, -2.7958303689956665e-06, -1.7387792468070984e-06, -6.817281246185303e-07, 3.7532299757003784e-07, 1.432374119758606e-06, 2.489425241947174e-06, 3.546476364135742e-06, 4.60352748632431e-06, 5.660578608512878e-06, 6.7176297307014465e-06, 7.774680852890015e-06, 8.831731975078583e-06, 9.888783097267151e-06, 1.0945834219455719e-05, 1.2002885341644287e-05, 1.3059936463832855e-05, 1.4116987586021423e-05, 1.5174038708209991e-05, 1.623108983039856e-05, 1.7288140952587128e-05, 1.8345192074775696e-05, 1.9402243196964264e-05, 2.0459294319152832e-05, 2.15163454413414e-05, 2.2573396563529968e-05, 2.3630447685718536e-05, 2.4687498807907104e-05, 2.5744549930095673e-05, 2.680160105228424e-05, 2.785865217447281e-05, 2.8915703296661377e-05, 2.9972754418849945e-05, 3.102980554103851e-05, 3.208685666322708e-05, 3.314390778541565e-05, 3.420095890760422e-05, 3.5258010029792786e-05, 3.6315061151981354e-05, 3.737211227416992e-05]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 2.0, 3.0, 6.0, 10.0, 9.0, 11.0, 14.0, 18.0, 18.0, 25.0, 28.0, 32.0, 58.0, 96.0, 104.0, 127.0, 96.0, 96.0, 68.0, 45.0, 20.0, 26.0, 17.0, 9.0, 15.0, 10.0, 5.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00023013964528217912, -0.00022230246395338327, -0.00021446529717650265, -0.0002066281158477068, -0.00019879094907082617, -0.00019095376774203032, -0.00018311658641323447, -0.00017527941963635385, -0.000167442238307558, -0.00015960505697876215, -0.00015176789020188153, -0.00014393070887308568, -0.00013609352754428983, -0.0001282563607674092, -0.00012041917943861336, -0.00011258200538577512, -0.00010474483133293688, -9.690765728009865e-05, -8.907048322726041e-05, -8.123330189846456e-05, -7.339612784562632e-05, -6.555895379278809e-05, -5.7721776101971045e-05, -4.9884598411154e-05, -4.2047424358315766e-05, -3.421025030547753e-05, -2.6373072614660487e-05, -1.8535896742832847e-05, -1.0698720871005207e-05, -2.861546818166971e-06, 4.975630872650072e-06, 1.2812808563467115e-05, 2.0650011720135808e-05, 2.8487187591963448e-05, 3.632436346379109e-05, 4.416154115460813e-05, 5.1998715207446367e-05, 5.98358892602846e-05, 6.767307058908045e-05, 7.551024464191869e-05, 8.334741869475693e-05, 9.118459274759516e-05, 9.90217668004334e-05, 0.00010685894812922925, 0.00011469612218206748, 0.00012253329623490572, 0.00013037047756370157, 0.00013820765889249742, 0.00014604482566937804, 0.0001538820069981739, 0.00016171917377505451, 0.00016955635510385036, 0.000177393521880731, 0.00018523070320952684, 0.0001930678845383227, 0.0002009050513152033, 0.00020874223264399916, 0.000216579413972795, 0.00022441658074967563, 0.00023225376207847148, 0.00024009094340726733, 0.00024792811018414795, 0.0002557652769610286, 0.00026360247284173965, 0.0002714396396186203]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 14.0, 12.0, 22.0, 22.0, 29.0, 21.0, 33.0, 34.0, 26.0, 41.0, 46.0, 36.0, 49.0, 44.0, 47.0, 65.0, 48.0, 45.0, 41.0, 41.0, 32.0, 33.0, 47.0, 23.0, 21.0, 27.0, 13.0, 20.0, 11.0, 13.0, 6.0, 2.0, 6.0, 6.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00018471140356268734, -0.00017968621978070587, -0.00017466105055063963, -0.00016963586676865816, -0.0001646106829866767, -0.00015958551375661045, -0.00015456032997462898, -0.00014953516074456275, -0.00014450997696258128, -0.0001394847931805998, -0.00013445962395053357, -0.0001294344401685521, -0.00012440927093848586, -0.00011938408715650439, -0.00011435890337452292, -0.00010933372686849907, -0.00010430855036247522, -9.928337385645136e-05, -9.425819735042751e-05, -8.923301356844604e-05, -8.420783706242219e-05, -7.918266055639833e-05, -7.415747677441686e-05, -6.913230026839301e-05, -6.410712376236916e-05, -5.90819472563453e-05, -5.405676711234264e-05, -4.903158696833998e-05, -4.4006410462316126e-05, -3.898123395629227e-05, -3.395605381228961e-05, -2.893087366828695e-05, -2.3905711714178324e-05, -1.8880533389165066e-05, -1.3855355064151809e-05, -8.830176739138551e-06, -3.8049984141252935e-06, 1.220179910887964e-06, 6.245358235901222e-06, 1.1270538379903883e-05, 1.6295714885927737e-05, 2.1320893210940994e-05, 2.6346071535954252e-05, 3.137125167995691e-05, 3.639642818598077e-05, 4.142160469200462e-05, 4.644678483600728e-05, 5.147196498000994e-05, 5.64971414860338e-05, 6.152231799205765e-05, 6.65474944980815e-05, 7.157267828006297e-05, 7.659785478608683e-05, 8.162303129211068e-05, 8.664821507409215e-05, 9.1673391580116e-05, 9.669856808613986e-05, 0.00010172374459216371, 0.00010674892109818757, 0.00011177410488016903, 0.00011679928138619289, 0.00012182445789221674, 0.0001268496416741982, 0.00013187481090426445, 0.00013689999468624592]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 10.0, 13.0, 16.0, 25.0, 30.0, 46.0, 55.0, 90.0, 137.0, 157.0, 226.0, 370.0, 466.0, 746.0, 1033.0, 1625.0, 2572.0, 3906.0, 6597.0, 11584.0, 27129.0, 3811263.0, 282135.0, 19012.0, 9313.0, 5644.0, 3513.0, 2191.0, 1419.0, 1001.0, 628.0, 428.0, 283.0, 185.0, 139.0, 86.0, 72.0, 45.0, 30.0, 20.0, 13.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00023496150970458984, -0.0002284012734889984, -0.00022184103727340698, -0.00021528080105781555, -0.00020872056484222412, -0.0002021603286266327, -0.00019560009241104126, -0.00018903985619544983, -0.0001824796199798584, -0.00017591938376426697, -0.00016935914754867554, -0.0001627989113330841, -0.00015623867511749268, -0.00014967843890190125, -0.00014311820268630981, -0.00013655796647071838, -0.00012999773025512695, -0.00012343749403953552, -0.00011687725782394409, -0.00011031702160835266, -0.00010375678539276123, -9.71965491771698e-05, -9.063631296157837e-05, -8.407607674598694e-05, -7.751584053039551e-05, -7.095560431480408e-05, -6.439536809921265e-05, -5.7835131883621216e-05, -5.1274895668029785e-05, -4.4714659452438354e-05, -3.8154423236846924e-05, -3.159418702125549e-05, -2.5033950805664062e-05, -1.8473714590072632e-05, -1.1913478374481201e-05, -5.3532421588897705e-06, 1.2069940567016602e-06, 7.76723027229309e-06, 1.4327466487884521e-05, 2.0887702703475952e-05, 2.7447938919067383e-05, 3.4008175134658813e-05, 4.0568411350250244e-05, 4.7128647565841675e-05, 5.3688883781433105e-05, 6.0249119997024536e-05, 6.680935621261597e-05, 7.33695924282074e-05, 7.992982864379883e-05, 8.649006485939026e-05, 9.305030107498169e-05, 9.961053729057312e-05, 0.00010617077350616455, 0.00011273100972175598, 0.00011929124593734741, 0.00012585148215293884, 0.00013241171836853027, 0.0001389719545841217, 0.00014553219079971313, 0.00015209242701530457, 0.000158652663230896, 0.00016521289944648743, 0.00017177313566207886, 0.0001783333718776703, 0.00018489360809326172]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 7.0, 9.0, 14.0, 15.0, 16.0, 17.0, 26.0, 24.0, 24.0, 39.0, 32.0, 44.0, 53.0, 36.0, 42.0, 54.0, 44.0, 57.0, 40.0, 30.0, 43.0, 36.0, 41.0, 32.0, 44.0, 31.0, 22.0, 26.0, 15.0, 18.0, 10.0, 16.0, 5.0, 6.0, 2.0, 5.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.866983413696289e-05, -2.7907080948352814e-05, -2.7144327759742737e-05, -2.638157457113266e-05, -2.5618821382522583e-05, -2.4856068193912506e-05, -2.409331500530243e-05, -2.3330561816692352e-05, -2.2567808628082275e-05, -2.18050554394722e-05, -2.104230225086212e-05, -2.0279549062252045e-05, -1.9516795873641968e-05, -1.875404268503189e-05, -1.7991289496421814e-05, -1.7228536307811737e-05, -1.646578311920166e-05, -1.5703029930591583e-05, -1.4940276741981506e-05, -1.417752355337143e-05, -1.3414770364761353e-05, -1.2652017176151276e-05, -1.1889263987541199e-05, -1.1126510798931122e-05, -1.0363757610321045e-05, -9.601004421710968e-06, -8.838251233100891e-06, -8.075498044490814e-06, -7.312744855880737e-06, -6.54999166727066e-06, -5.7872384786605835e-06, -5.024485290050507e-06, -4.26173210144043e-06, -3.4989789128303528e-06, -2.736225724220276e-06, -1.973472535610199e-06, -1.210719347000122e-06, -4.4796615839004517e-07, 3.1478703022003174e-07, 1.0775402188301086e-06, 1.8402934074401855e-06, 2.6030465960502625e-06, 3.3657997846603394e-06, 4.128552973270416e-06, 4.891306161880493e-06, 5.65405935049057e-06, 6.416812539100647e-06, 7.179565727710724e-06, 7.9423189163208e-06, 8.705072104930878e-06, 9.467825293540955e-06, 1.0230578482151031e-05, 1.0993331670761108e-05, 1.1756084859371185e-05, 1.2518838047981262e-05, 1.3281591236591339e-05, 1.4044344425201416e-05, 1.4807097613811493e-05, 1.556985080242157e-05, 1.6332603991031647e-05, 1.7095357179641724e-05, 1.78581103682518e-05, 1.8620863556861877e-05, 1.9383616745471954e-05, 2.014636993408203e-05]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 12.0, 20.0, 33.0, 31.0, 41.0, 36.0, 44.0, 66.0, 94.0, 360.0, 57635.0, 4134854.0, 680.0, 110.0, 56.0, 35.0, 38.0, 31.0, 17.0, 21.0, 15.0, 18.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.0014495849609375, -0.0014181435108184814, -0.0013867020606994629, -0.0013552606105804443, -0.0013238191604614258, -0.0012923777103424072, -0.0012609362602233887, -0.0012294948101043701, -0.0011980533599853516, -0.001166611909866333, -0.0011351704597473145, -0.001103729009628296, -0.0010722875595092773, -0.0010408461093902588, -0.0010094046592712402, -0.0009779632091522217, -0.0009465217590332031, -0.0009150803089141846, -0.000883638858795166, -0.0008521974086761475, -0.0008207559585571289, -0.0007893145084381104, -0.0007578730583190918, -0.0007264316082000732, -0.0006949901580810547, -0.0006635487079620361, -0.0006321072578430176, -0.000600665807723999, -0.0005692243576049805, -0.0005377829074859619, -0.0005063414573669434, -0.0004749000072479248, -0.00044345855712890625, -0.0004120171070098877, -0.00038057565689086914, -0.0003491342067718506, -0.00031769275665283203, -0.0002862513065338135, -0.0002548098564147949, -0.00022336840629577637, -0.0001919269561767578, -0.00016048550605773926, -0.0001290440559387207, -9.760260581970215e-05, -6.61611557006836e-05, -3.471970558166504e-05, -3.2782554626464844e-06, 2.816319465637207e-05, 5.9604644775390625e-05, 9.104609489440918e-05, 0.00012248754501342773, 0.0001539289951324463, 0.00018537044525146484, 0.0002168118953704834, 0.00024825334548950195, 0.0002796947956085205, 0.00031113624572753906, 0.0003425776958465576, 0.00037401914596557617, 0.0004054605960845947, 0.0004369020462036133, 0.00046834349632263184, 0.0004997849464416504, 0.0005312263965606689, 0.0005626678466796875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [8.0, 8.0, 32.0, 66.0, 3506.0, 418.0, 35.0, 14.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9146671295166016e-05, -2.307351678609848e-05, -1.7000362277030945e-05, -1.092720776796341e-05, -4.854053258895874e-06, 1.2191012501716614e-06, 7.292255759239197e-06, 1.3365410268306732e-05, 1.9438564777374268e-05, 2.5511719286441803e-05, 3.158487379550934e-05, 3.7658028304576874e-05, 4.373118281364441e-05, 4.9804337322711945e-05, 5.587749183177948e-05, 6.195064634084702e-05, 6.802380084991455e-05, 7.409695535898209e-05, 8.017010986804962e-05, 8.624326437711716e-05, 9.231641888618469e-05, 9.838957339525223e-05, 0.00010446272790431976, 0.0001105358824133873, 0.00011660903692245483, 0.00012268219143152237, 0.0001287553459405899, 0.00013482850044965744, 0.00014090165495872498, 0.0001469748094677925, 0.00015304796397686005, 0.00015912111848592758, 0.00016519427299499512, 0.00017126742750406265, 0.0001773405820131302, 0.00018341373652219772, 0.00018948689103126526, 0.0001955600455403328, 0.00020163320004940033, 0.00020770635455846786, 0.0002137795090675354, 0.00021985266357660294, 0.00022592581808567047, 0.000231998972594738, 0.00023807212710380554, 0.0002441452816128731, 0.0002502184361219406, 0.00025629159063100815, 0.0002623647451400757, 0.0002684378996491432, 0.00027451105415821075, 0.0002805842086672783, 0.0002866573631763458, 0.00029273051768541336, 0.0002988036721944809, 0.00030487682670354843, 0.00031094998121261597, 0.0003170231357216835, 0.00032309629023075104, 0.0003291694447398186, 0.0003352425992488861, 0.00034131575375795364, 0.0003473889082670212, 0.0003534620627760887, 0.00035953521728515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 10.0, 7.0, 4.0, 7.0, 10.0, 11.0, 16.0, 16.0, 27.0, 34.0, 37.0, 38.0, 69.0, 119.0, 165.0, 127.0, 73.0, 58.0, 27.0, 31.0, 21.0, 17.0, 11.0, 10.0, 7.0, 8.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.00010796772403409705, -0.00010517000191612169, -0.00010237228707410395, -9.95745649561286e-05, -9.677684283815324e-05, -9.39791279961355e-05, -9.118140587816015e-05, -8.838369103614241e-05, -8.558596891816705e-05, -8.27882468001917e-05, -7.999053195817396e-05, -7.71928098401986e-05, -7.439509499818087e-05, -7.159737288020551e-05, -6.879965076223016e-05, -6.60019286442548e-05, -6.320421380223706e-05, -6.0406495322240517e-05, -5.760877684224397e-05, -5.4811054724268615e-05, -5.201333624427207e-05, -4.921561776427552e-05, -4.641789564630017e-05, -4.362017716630362e-05, -4.082245868630707e-05, -3.8024740206310526e-05, -3.522702172631398e-05, -3.2429299608338624e-05, -2.9631581128342077e-05, -2.683386264834553e-05, -2.403614234935958e-05, -2.123842205037363e-05, -1.8440696294419467e-05, -1.564297781442292e-05, -1.284525751543697e-05, -1.004753812594572e-05, -7.249818736454472e-06, -4.452099346963223e-06, -1.6543799574719742e-06, 1.1433403415139765e-06, 3.9410588215105236e-06, 6.7387782110017724e-06, 9.536497600493021e-06, 1.233421698998427e-05, 1.5131936379475519e-05, 1.7929654859472066e-05, 2.0727375158458017e-05, 2.3525095457443967e-05, 2.6322813937440515e-05, 2.912053241743706e-05, 3.191825089743361e-05, 3.471597301540896e-05, 3.751369149540551e-05, 4.031140997540206e-05, 4.310913209337741e-05, 4.590685057337396e-05, 4.8704569053370506e-05, 5.150228753336705e-05, 5.43000060133636e-05, 5.7097728131338954e-05, 5.98954466113355e-05, 6.269316509133205e-05, 6.54908872093074e-05, 6.828860205132514e-05, 7.10863241693005e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 7.0, 17.0, 14.0, 22.0, 20.0, 25.0, 34.0, 35.0, 37.0, 53.0, 52.0, 59.0, 58.0, 56.0, 50.0, 54.0, 54.0, 49.0, 57.0, 41.0, 35.0, 34.0, 30.0, 20.0, 14.0, 17.0, 21.0, 7.0, 8.0, 1.0, 4.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.773056131554767e-05, -7.573180482722819e-05, -7.37330483389087e-05, -7.173429185058922e-05, -6.973552808631212e-05, -6.773677159799263e-05, -6.573801510967314e-05, -6.373925862135366e-05, -6.174050213303417e-05, -5.974174564471468e-05, -5.77429891563952e-05, -5.5744229030096903e-05, -5.374547254177742e-05, -5.174671605345793e-05, -4.974795592715964e-05, -4.774919943884015e-05, -4.5750442950520664e-05, -4.375168646220118e-05, -4.175292997388169e-05, -3.97541698475834e-05, -3.775541335926391e-05, -3.5756656870944425e-05, -3.375789674464613e-05, -3.1759140256326646e-05, -2.976038376800716e-05, -2.7761627279687673e-05, -2.5762868972378783e-05, -2.3764110665069893e-05, -2.1765354176750407e-05, -1.976659768843092e-05, -1.776783938112203e-05, -1.576908107381314e-05, -1.377031730953604e-05, -1.1771559911721852e-05, -9.772802513907664e-06, -7.774045116093475e-06, -5.775287718279287e-06, -3.776530320465099e-06, -1.777772922650911e-06, 2.2098447516327724e-07, 2.2197418729774654e-06, 4.2184992707916535e-06, 6.217256668605842e-06, 8.21601406642003e-06, 1.0214771464234218e-05, 1.2213528862048406e-05, 1.4212286259862594e-05, 1.6211044567171484e-05, 1.820980105549097e-05, 2.0208557543810457e-05, 2.2207315851119347e-05, 2.4206074158428237e-05, 2.6204830646747723e-05, 2.820358713506721e-05, 3.02023454423761e-05, 3.220110374968499e-05, 3.4199860238004476e-05, 3.619861672632396e-05, 3.819737321464345e-05, 4.019613334094174e-05, 4.219488982926123e-05, 4.4193646317580715e-05, 4.619240644387901e-05, 4.8191162932198495e-05, 5.018991942051798e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 10.0, 17.0, 24.0, 29.0, 38.0, 73.0, 113.0, 138.0, 233.0, 432.0, 1038.0, 3241.0, 18557.0, 682070.0, 318677.0, 18458.0, 3219.0, 1031.0, 455.0, 237.0, 154.0, 84.0, 74.0, 45.0, 39.0, 24.0, 15.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6391277313232422e-05, -1.5922822058200836e-05, -1.545436680316925e-05, -1.4985911548137665e-05, -1.4517456293106079e-05, -1.4049001038074493e-05, -1.3580545783042908e-05, -1.3112090528011322e-05, -1.2643635272979736e-05, -1.217518001794815e-05, -1.1706724762916565e-05, -1.123826950788498e-05, -1.0769814252853394e-05, -1.0301358997821808e-05, -9.832903742790222e-06, -9.364448487758636e-06, -8.89599323272705e-06, -8.427537977695465e-06, -7.95908272266388e-06, -7.490627467632294e-06, -7.022172212600708e-06, -6.553716957569122e-06, -6.085261702537537e-06, -5.616806447505951e-06, -5.148351192474365e-06, -4.6798959374427795e-06, -4.211440682411194e-06, -3.742985427379608e-06, -3.2745301723480225e-06, -2.8060749173164368e-06, -2.337619662284851e-06, -1.8691644072532654e-06, -1.4007091522216797e-06, -9.32253897190094e-07, -4.637986421585083e-07, 4.6566128730773926e-09, 4.731118679046631e-07, 9.415671229362488e-07, 1.4100223779678345e-06, 1.8784776329994202e-06, 2.346932888031006e-06, 2.8153881430625916e-06, 3.2838433980941772e-06, 3.752298653125763e-06, 4.220753908157349e-06, 4.689209163188934e-06, 5.15766441822052e-06, 5.626119673252106e-06, 6.094574928283691e-06, 6.563030183315277e-06, 7.031485438346863e-06, 7.4999406933784485e-06, 7.968395948410034e-06, 8.43685120344162e-06, 8.905306458473206e-06, 9.373761713504791e-06, 9.842216968536377e-06, 1.0310672223567963e-05, 1.0779127478599548e-05, 1.1247582733631134e-05, 1.171603798866272e-05, 1.2184493243694305e-05, 1.2652948498725891e-05, 1.3121403753757477e-05, 1.3589859008789062e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 8.0, 6.0, 4.0, 14.0, 22.0, 18.0, 34.0, 34.0, 37.0, 46.0, 56.0, 60.0, 77.0, 79.0, 68.0, 77.0, 59.0, 64.0, 52.0, 40.0, 41.0, 24.0, 24.0, 21.0, 12.0, 8.0, 7.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.526708602905273e-05, -6.350316107273102e-05, -6.17392361164093e-05, -5.9975311160087585e-05, -5.821138620376587e-05, -5.644746124744415e-05, -5.4683536291122437e-05, -5.291961133480072e-05, -5.1155686378479004e-05, -4.939176142215729e-05, -4.762783646583557e-05, -4.5863911509513855e-05, -4.409998655319214e-05, -4.233606159687042e-05, -4.0572136640548706e-05, -3.880821168422699e-05, -3.7044286727905273e-05, -3.528036177158356e-05, -3.351643681526184e-05, -3.1752511858940125e-05, -2.9988586902618408e-05, -2.8224661946296692e-05, -2.6460736989974976e-05, -2.469681203365326e-05, -2.2932887077331543e-05, -2.1168962121009827e-05, -1.940503716468811e-05, -1.7641112208366394e-05, -1.5877187252044678e-05, -1.4113262295722961e-05, -1.2349337339401245e-05, -1.0585412383079529e-05, -8.821487426757812e-06, -7.057562470436096e-06, -5.29363751411438e-06, -3.5297125577926636e-06, -1.7657876014709473e-06, -1.862645149230957e-09, 1.7620623111724854e-06, 3.5259872674942017e-06, 5.289912223815918e-06, 7.053837180137634e-06, 8.81776213645935e-06, 1.0581687092781067e-05, 1.2345612049102783e-05, 1.41095370054245e-05, 1.5873461961746216e-05, 1.7637386918067932e-05, 1.940131187438965e-05, 2.1165236830711365e-05, 2.292916178703308e-05, 2.4693086743354797e-05, 2.6457011699676514e-05, 2.822093665599823e-05, 2.9984861612319946e-05, 3.174878656864166e-05, 3.351271152496338e-05, 3.5276636481285095e-05, 3.704056143760681e-05, 3.880448639392853e-05, 4.0568411350250244e-05, 4.233233630657196e-05, 4.409626126289368e-05, 4.586018621921539e-05, 4.762411117553711e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 5.0, 10.0, 12.0, 23.0, 35.0, 56.0, 69.0, 110.0, 202.0, 407.0, 1433.0, 9052.0, 184331.0, 828542.0, 20543.0, 2474.0, 431.0, 339.0, 169.0, 93.0, 75.0, 49.0, 27.0, 19.0, 19.0, 10.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9141387939453125e-06, -6.738118827342987e-06, -6.562098860740662e-06, -6.386078894138336e-06, -6.210058927536011e-06, -6.034038960933685e-06, -5.85801899433136e-06, -5.6819990277290344e-06, -5.505979061126709e-06, -5.3299590945243835e-06, -5.153939127922058e-06, -4.977919161319733e-06, -4.801899194717407e-06, -4.625879228115082e-06, -4.449859261512756e-06, -4.273839294910431e-06, -4.0978193283081055e-06, -3.92179936170578e-06, -3.7457793951034546e-06, -3.569759428501129e-06, -3.3937394618988037e-06, -3.2177194952964783e-06, -3.041699528694153e-06, -2.8656795620918274e-06, -2.689659595489502e-06, -2.5136396288871765e-06, -2.337619662284851e-06, -2.1615996956825256e-06, -1.9855797290802e-06, -1.8095597624778748e-06, -1.6335397958755493e-06, -1.4575198292732239e-06, -1.2814998626708984e-06, -1.105479896068573e-06, -9.294599294662476e-07, -7.534399628639221e-07, -5.774199962615967e-07, -4.0140002965927124e-07, -2.253800630569458e-07, -4.936009645462036e-08, 1.2665987014770508e-07, 3.026798367500305e-07, 4.78699803352356e-07, 6.547197699546814e-07, 8.307397365570068e-07, 1.0067597031593323e-06, 1.1827796697616577e-06, 1.3587996363639832e-06, 1.5348196029663086e-06, 1.710839569568634e-06, 1.8868595361709595e-06, 2.062879502773285e-06, 2.2388994693756104e-06, 2.414919435977936e-06, 2.5909394025802612e-06, 2.7669593691825867e-06, 2.942979335784912e-06, 3.1189993023872375e-06, 3.295019268989563e-06, 3.4710392355918884e-06, 3.647059202194214e-06, 3.823079168796539e-06, 3.999099135398865e-06, 4.17511910200119e-06, 4.351139068603516e-06]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 4.0, 11.0, 8.0, 19.0, 28.0, 31.0, 42.0, 39.0, 68.0, 60.0, 72.0, 81.0, 89.0, 74.0, 72.0, 60.0, 57.0, 42.0, 35.0, 19.0, 27.0, 13.0, 12.0, 17.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001742839813232422, -0.0001698201522231102, -0.0001653563231229782, -0.00016089249402284622, -0.00015642866492271423, -0.00015196483582258224, -0.00014750100672245026, -0.00014303717762231827, -0.00013857334852218628, -0.0001341095194220543, -0.0001296456903219223, -0.00012518186122179031, -0.00012071803212165833, -0.00011625420302152634, -0.00011179037392139435, -0.00010732654482126236, -0.00010286271572113037, -9.839888662099838e-05, -9.39350575208664e-05, -8.94712284207344e-05, -8.500739932060242e-05, -8.054357022047043e-05, -7.607974112033844e-05, -7.161591202020645e-05, -6.715208292007446e-05, -6.268825381994247e-05, -5.8224424719810486e-05, -5.37605956196785e-05, -4.929676651954651e-05, -4.483293741941452e-05, -4.036910831928253e-05, -3.590527921915054e-05, -3.1441450119018555e-05, -2.6977621018886566e-05, -2.2513791918754578e-05, -1.804996281862259e-05, -1.35861337184906e-05, -9.122304618358612e-06, -4.6584755182266235e-06, -1.94646418094635e-07, 4.2691826820373535e-06, 8.733011782169342e-06, 1.319684088230133e-05, 1.766066998243332e-05, 2.2124499082565308e-05, 2.6588328182697296e-05, 3.1052157282829285e-05, 3.551598638296127e-05, 3.997981548309326e-05, 4.444364458322525e-05, 4.890747368335724e-05, 5.337130278348923e-05, 5.7835131883621216e-05, 6.22989609837532e-05, 6.676279008388519e-05, 7.122661918401718e-05, 7.569044828414917e-05, 8.015427738428116e-05, 8.461810648441315e-05, 8.908193558454514e-05, 9.354576468467712e-05, 9.800959378480911e-05, 0.0001024734228849411, 0.00010693725198507309, 0.00011140108108520508]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [136.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048274.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 166.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 30.0, 0.0, 0.0, 57.0, 0.0, 0.0, 0.0, 111.0, 0.0, 0.0, 181.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 171.0, 0.0, 0.0, 125.0, 0.0, 0.0, 0.0, 63.0, 0.0, 0.0, 24.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.591420292854309e-07, -4.414469003677368e-07, -4.237517714500427e-07, -4.0605664253234863e-07, -3.8836151361465454e-07, -3.7066638469696045e-07, -3.5297125577926636e-07, -3.3527612686157227e-07, -3.175809979438782e-07, -2.998858690261841e-07, -2.8219074010849e-07, -2.644956111907959e-07, -2.468004822731018e-07, -2.2910535335540771e-07, -2.1141022443771362e-07, -1.9371509552001953e-07, -1.7601996660232544e-07, -1.5832483768463135e-07, -1.4062970876693726e-07, -1.2293457984924316e-07, -1.0523945093154907e-07, -8.754432201385498e-08, -6.984919309616089e-08, -5.21540641784668e-08, -3.4458935260772705e-08, -1.6763806343078613e-08, 9.313225746154785e-10, 1.862645149230957e-08, 3.632158041000366e-08, 5.4016709327697754e-08, 7.171183824539185e-08, 8.940696716308594e-08, 1.0710209608078003e-07, 1.2479722499847412e-07, 1.424923539161682e-07, 1.601874828338623e-07, 1.778826117515564e-07, 1.955777406692505e-07, 2.1327286958694458e-07, 2.3096799850463867e-07, 2.4866312742233276e-07, 2.6635825634002686e-07, 2.8405338525772095e-07, 3.0174851417541504e-07, 3.1944364309310913e-07, 3.371387720108032e-07, 3.548339009284973e-07, 3.725290298461914e-07, 3.902241587638855e-07, 4.079192876815796e-07, 4.256144165992737e-07, 4.4330954551696777e-07, 4.6100467443466187e-07, 4.78699803352356e-07, 4.9639493227005e-07, 5.140900611877441e-07, 5.317851901054382e-07, 5.494803190231323e-07, 5.671754479408264e-07, 5.848705768585205e-07, 6.025657057762146e-07, 6.202608346939087e-07, 6.379559636116028e-07, 6.556510925292969e-07]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 8.0, 7.0, 12.0, 17.0, 19.0, 23.0, 27.0, 36.0, 74.0, 89.0, 171.0, 152.0, 100.0, 56.0, 38.0, 47.0, 23.0, 19.0, 10.0, 18.0, 7.0, 6.0, 9.0, 5.0, 2.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.726316157961264e-05, -5.5528271332150325e-05, -5.37933774467092e-05, -5.2058487199246883e-05, -5.0323596951784566e-05, -4.858870670432225e-05, -4.6853812818881124e-05, -4.511892257141881e-05, -4.338403232395649e-05, -4.164914207649417e-05, -3.991424819105305e-05, -3.817935794359073e-05, -3.644446769612841e-05, -3.4709577448666096e-05, -3.297468356322497e-05, -3.1239793315762654e-05, -2.950489943032153e-05, -2.777000736386981e-05, -2.603511711640749e-05, -2.430022504995577e-05, -2.2565334802493453e-05, -2.0830442736041732e-05, -1.909555066959001e-05, -1.7360660422127694e-05, -1.5625768355675973e-05, -1.3890877198718954e-05, -1.2155986041761935e-05, -1.0421093975310214e-05, -8.686202818353195e-06, -6.951311661396176e-06, -5.216419594944455e-06, -3.4815284379874356e-06, -1.7466409190092236e-06, -1.1749534678529017e-08, 1.7231418496521655e-06, 3.4580334613565356e-06, 5.192924618313555e-06, 6.927815775270574e-06, 8.662707841722295e-06, 1.0397598998679314e-05, 1.2132490155636333e-05, 1.3867381312593352e-05, 1.560227246955037e-05, 1.7337164536002092e-05, 1.9072056602453813e-05, 2.080694684991613e-05, 2.254183891636785e-05, 2.4276730982819572e-05, 2.601162123028189e-05, 2.774651329673361e-05, 2.9481403544195928e-05, 3.121629561064765e-05, 3.2951185858109966e-05, 3.468607610557228e-05, 3.642096999101341e-05, 3.8155860238475725e-05, 3.989075048593804e-05, 4.162564073340036e-05, 4.3360534618841484e-05, 4.50954248663038e-05, 4.683031511376612e-05, 4.8565205361228436e-05, 5.030009924666956e-05, 5.203498949413188e-05, 5.3769883379573e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 5.0, 12.0, 27.0, 19.0, 34.0, 32.0, 43.0, 53.0, 64.0, 82.0, 78.0, 78.0, 63.0, 66.0, 77.0, 64.0, 51.0, 37.0, 32.0, 22.0, 19.0, 12.0, 7.0, 6.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.873767440789379e-05, -5.703814895241521e-05, -5.5338623496936634e-05, -5.3639098041458055e-05, -5.1939576223958284e-05, -5.0240050768479705e-05, -4.8540525313001126e-05, -4.684099985752255e-05, -4.514147440204397e-05, -4.344194894656539e-05, -4.174242349108681e-05, -4.004289803560823e-05, -3.834337258012965e-05, -3.6643847124651074e-05, -3.49443253071513e-05, -3.3244799851672724e-05, -3.1545274396194145e-05, -2.9845748940715566e-05, -2.8146223485236987e-05, -2.6446699848747812e-05, -2.4747174393269233e-05, -2.3047648937790655e-05, -2.134812530130148e-05, -1.96485998458229e-05, -1.7949074390344322e-05, -1.6249548934865743e-05, -1.4550024388881866e-05, -1.2850499842897989e-05, -1.115097438741941e-05, -9.451448931940831e-06, -7.751924385956954e-06, -6.052399839973077e-06, -4.352874384494498e-06, -2.6533493837632705e-06, -9.538243830320425e-07, 7.457006176991854e-07, 2.4452256184304133e-06, 4.144751073908992e-06, 5.844275619892869e-06, 7.543800165876746e-06, 9.243325621355325e-06, 1.0942851076833904e-05, 1.264237562281778e-05, 1.4341900168801658e-05, 1.6041425624280237e-05, 1.7740951079758815e-05, 1.944047471624799e-05, 2.114000017172657e-05, 2.283952562720515e-05, 2.4539051082683727e-05, 2.6238576538162306e-05, 2.793810017465148e-05, 2.963762563013006e-05, 3.1337149266619235e-05, 3.3036674722097814e-05, 3.473620017757639e-05, 3.643572563305497e-05, 3.813525108853355e-05, 3.983477654401213e-05, 4.153430199949071e-05, 4.323382745496929e-05, 4.4933352910447866e-05, 4.663287472794764e-05, 4.8332400183426216e-05, 5.0031925638904795e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 5.0, 5.0, 9.0, 11.0, 18.0, 22.0, 25.0, 40.0, 39.0, 80.0, 114.0, 151.0, 249.0, 434.0, 629.0, 1113.0, 1860.0, 3396.0, 6490.0, 13363.0, 31353.0, 86249.0, 395925.0, 371697.0, 79444.0, 29022.0, 12678.0, 6341.0, 3148.0, 1774.0, 1080.0, 633.0, 379.0, 241.0, 176.0, 112.0, 60.0, 48.0, 38.0, 24.0, 21.0, 14.0, 11.0, 11.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1856040954589844e-05, -5.023367702960968e-05, -4.8611313104629517e-05, -4.698894917964935e-05, -4.536658525466919e-05, -4.3744221329689026e-05, -4.212185740470886e-05, -4.04994934797287e-05, -3.8877129554748535e-05, -3.725476562976837e-05, -3.563240170478821e-05, -3.4010037779808044e-05, -3.238767385482788e-05, -3.076530992984772e-05, -2.9142946004867554e-05, -2.752058207988739e-05, -2.5898218154907227e-05, -2.4275854229927063e-05, -2.26534903049469e-05, -2.1031126379966736e-05, -1.9408762454986572e-05, -1.778639853000641e-05, -1.6164034605026245e-05, -1.4541670680046082e-05, -1.2919306755065918e-05, -1.1296942830085754e-05, -9.67457890510559e-06, -8.052214980125427e-06, -6.429851055145264e-06, -4.8074871301651e-06, -3.1851232051849365e-06, -1.562759280204773e-06, 5.960464477539063e-08, 1.6819685697555542e-06, 3.3043324947357178e-06, 4.926696419715881e-06, 6.549060344696045e-06, 8.171424269676208e-06, 9.793788194656372e-06, 1.1416152119636536e-05, 1.30385160446167e-05, 1.4660879969596863e-05, 1.6283243894577026e-05, 1.790560781955719e-05, 1.9527971744537354e-05, 2.1150335669517517e-05, 2.277269959449768e-05, 2.4395063519477844e-05, 2.6017427444458008e-05, 2.763979136943817e-05, 2.9262155294418335e-05, 3.08845192193985e-05, 3.250688314437866e-05, 3.4129247069358826e-05, 3.575161099433899e-05, 3.737397491931915e-05, 3.8996338844299316e-05, 4.061870276927948e-05, 4.2241066694259644e-05, 4.386343061923981e-05, 4.548579454421997e-05, 4.7108158469200134e-05, 4.87305223941803e-05, 5.035288631916046e-05, 5.1975250244140625e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 9.0, 11.0, 9.0, 25.0, 26.0, 24.0, 31.0, 47.0, 51.0, 64.0, 86.0, 79.0, 57.0, 69.0, 68.0, 58.0, 76.0, 47.0, 41.0, 32.0, 22.0, 18.0, 13.0, 12.0, 4.0, 5.0, 7.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4007091522216797e-05, -1.361314207315445e-05, -1.3219192624092102e-05, -1.2825243175029755e-05, -1.2431293725967407e-05, -1.203734427690506e-05, -1.1643394827842712e-05, -1.1249445378780365e-05, -1.0855495929718018e-05, -1.046154648065567e-05, -1.0067597031593323e-05, -9.673647582530975e-06, -9.279698133468628e-06, -8.88574868440628e-06, -8.491799235343933e-06, -8.097849786281586e-06, -7.703900337219238e-06, -7.309950888156891e-06, -6.9160014390945435e-06, -6.522051990032196e-06, -6.128102540969849e-06, -5.734153091907501e-06, -5.340203642845154e-06, -4.946254193782806e-06, -4.552304744720459e-06, -4.1583552956581116e-06, -3.764405846595764e-06, -3.3704563975334167e-06, -2.9765069484710693e-06, -2.582557499408722e-06, -2.1886080503463745e-06, -1.794658601284027e-06, -1.4007091522216797e-06, -1.0067597031593323e-06, -6.128102540969849e-07, -2.1886080503463745e-07, 1.7508864402770996e-07, 5.690380930900574e-07, 9.629875421524048e-07, 1.3569369912147522e-06, 1.7508864402770996e-06, 2.144835889339447e-06, 2.5387853384017944e-06, 2.932734787464142e-06, 3.3266842365264893e-06, 3.7206336855888367e-06, 4.114583134651184e-06, 4.5085325837135315e-06, 4.902482032775879e-06, 5.296431481838226e-06, 5.690380930900574e-06, 6.084330379962921e-06, 6.4782798290252686e-06, 6.872229278087616e-06, 7.266178727149963e-06, 7.66012817621231e-06, 8.054077625274658e-06, 8.448027074337006e-06, 8.841976523399353e-06, 9.2359259724617e-06, 9.629875421524048e-06, 1.0023824870586395e-05, 1.0417774319648743e-05, 1.081172376871109e-05, 1.1205673217773438e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 11.0, 13.0, 20.0, 52.0, 82.0, 136.0, 242.0, 536.0, 1214.0, 3956.0, 15489.0, 90531.0, 740474.0, 164998.0, 22539.0, 5312.0, 1626.0, 594.0, 297.0, 152.0, 106.0, 58.0, 36.0, 22.0, 21.0, 16.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.233287811279297e-05, -5.0290487706661224e-05, -4.824809730052948e-05, -4.6205706894397736e-05, -4.416331648826599e-05, -4.212092608213425e-05, -4.00785356760025e-05, -3.803614526987076e-05, -3.5993754863739014e-05, -3.395136445760727e-05, -3.1908974051475525e-05, -2.986658364534378e-05, -2.7824193239212036e-05, -2.5781802833080292e-05, -2.3739412426948547e-05, -2.1697022020816803e-05, -1.965463161468506e-05, -1.7612241208553314e-05, -1.556985080242157e-05, -1.3527460396289825e-05, -1.1485069990158081e-05, -9.442679584026337e-06, -7.400289177894592e-06, -5.357898771762848e-06, -3.3155083656311035e-06, -1.2731179594993591e-06, 7.692724466323853e-07, 2.8116628527641296e-06, 4.854053258895874e-06, 6.896443665027618e-06, 8.938834071159363e-06, 1.0981224477291107e-05, 1.3023614883422852e-05, 1.5066005289554596e-05, 1.710839569568634e-05, 1.9150786101818085e-05, 2.119317650794983e-05, 2.3235566914081573e-05, 2.5277957320213318e-05, 2.7320347726345062e-05, 2.9362738132476807e-05, 3.140512853860855e-05, 3.3447518944740295e-05, 3.548990935087204e-05, 3.7532299757003784e-05, 3.957469016313553e-05, 4.161708056926727e-05, 4.365947097539902e-05, 4.570186138153076e-05, 4.7744251787662506e-05, 4.978664219379425e-05, 5.1829032599925995e-05, 5.387142300605774e-05, 5.5913813412189484e-05, 5.795620381832123e-05, 5.999859422445297e-05, 6.204098463058472e-05, 6.408337503671646e-05, 6.61257654428482e-05, 6.816815584897995e-05, 7.02105462551117e-05, 7.225293666124344e-05, 7.429532706737518e-05, 7.633771747350693e-05, 7.838010787963867e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 5.0, 9.0, 6.0, 9.0, 16.0, 23.0, 21.0, 32.0, 35.0, 54.0, 66.0, 85.0, 84.0, 90.0, 94.0, 74.0, 75.0, 59.0, 55.0, 39.0, 14.0, 26.0, 16.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.159046173095703e-05, -3.076903522014618e-05, -2.9947608709335327e-05, -2.9126182198524475e-05, -2.8304755687713623e-05, -2.748332917690277e-05, -2.666190266609192e-05, -2.5840476155281067e-05, -2.5019049644470215e-05, -2.4197623133659363e-05, -2.337619662284851e-05, -2.255477011203766e-05, -2.1733343601226807e-05, -2.0911917090415955e-05, -2.0090490579605103e-05, -1.926906406879425e-05, -1.84476375579834e-05, -1.7626211047172546e-05, -1.6804784536361694e-05, -1.5983358025550842e-05, -1.516193151473999e-05, -1.4340505003929138e-05, -1.3519078493118286e-05, -1.2697651982307434e-05, -1.1876225471496582e-05, -1.105479896068573e-05, -1.0233372449874878e-05, -9.411945939064026e-06, -8.590519428253174e-06, -7.769092917442322e-06, -6.94766640663147e-06, -6.126239895820618e-06, -5.304813385009766e-06, -4.4833868741989136e-06, -3.6619603633880615e-06, -2.8405338525772095e-06, -2.0191073417663574e-06, -1.1976808309555054e-06, -3.762543201446533e-07, 4.4517219066619873e-07, 1.2665987014770508e-06, 2.088025212287903e-06, 2.909451723098755e-06, 3.730878233909607e-06, 4.552304744720459e-06, 5.373731255531311e-06, 6.195157766342163e-06, 7.016584277153015e-06, 7.838010787963867e-06, 8.65943729877472e-06, 9.480863809585571e-06, 1.0302290320396423e-05, 1.1123716831207275e-05, 1.1945143342018127e-05, 1.276656985282898e-05, 1.3587996363639832e-05, 1.4409422874450684e-05, 1.5230849385261536e-05, 1.6052275896072388e-05, 1.687370240688324e-05, 1.7695128917694092e-05, 1.8516555428504944e-05, 1.9337981939315796e-05, 2.0159408450126648e-05, 2.09808349609375e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 16.0, 7.0, 14.0, 20.0, 41.0, 31.0, 90.0, 114.0, 87.0, 281.0, 543.0, 437.0, 1734.0, 6119.0, 8534.0, 131219.0, 857603.0, 23664.0, 12448.0, 3174.0, 1124.0, 310.0, 388.0, 202.0, 66.0, 89.0, 66.0, 19.0, 42.0, 21.0, 7.0, 13.0, 7.0, 5.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.039836883544922e-06, -2.93925404548645e-06, -2.8386712074279785e-06, -2.738088369369507e-06, -2.637505531311035e-06, -2.5369226932525635e-06, -2.436339855194092e-06, -2.33575701713562e-06, -2.2351741790771484e-06, -2.1345913410186768e-06, -2.034008502960205e-06, -1.9334256649017334e-06, -1.8328428268432617e-06, -1.73225998878479e-06, -1.6316771507263184e-06, -1.5310943126678467e-06, -1.430511474609375e-06, -1.3299286365509033e-06, -1.2293457984924316e-06, -1.12876296043396e-06, -1.0281801223754883e-06, -9.275972843170166e-07, -8.270144462585449e-07, -7.264316082000732e-07, -6.258487701416016e-07, -5.252659320831299e-07, -4.246830940246582e-07, -3.241002559661865e-07, -2.2351741790771484e-07, -1.2293457984924316e-07, -2.2351741790771484e-08, 7.82310962677002e-08, 1.7881393432617188e-07, 2.7939677238464355e-07, 3.7997961044311523e-07, 4.805624485015869e-07, 5.811452865600586e-07, 6.817281246185303e-07, 7.82310962677002e-07, 8.828938007354736e-07, 9.834766387939453e-07, 1.084059476852417e-06, 1.1846423149108887e-06, 1.2852251529693604e-06, 1.385807991027832e-06, 1.4863908290863037e-06, 1.5869736671447754e-06, 1.687556505203247e-06, 1.7881393432617188e-06, 1.8887221813201904e-06, 1.989305019378662e-06, 2.089887857437134e-06, 2.1904706954956055e-06, 2.291053533554077e-06, 2.391636371612549e-06, 2.4922192096710205e-06, 2.592802047729492e-06, 2.693384885787964e-06, 2.7939677238464355e-06, 2.8945505619049072e-06, 2.995133399963379e-06, 3.0957162380218506e-06, 3.1962990760803223e-06, 3.296881914138794e-06, 3.3974647521972656e-06]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [77.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 867.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 1.0, 16.0, 0.0, 11.0, 34.0, 80.0, 0.0, 152.0, 476.0, 1230.0, 0.0, 3664.0, 14204.0, 89164.0, 0.0, 830605.0, 88989.0, 14115.0, 0.0, 3733.0, 1222.0, 481.0, 0.0, 168.0, 97.0, 43.0, 0.0, 21.0, 18.0, 9.0, 0.0, 14.0, 8.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06, 1.475214958190918e-06, 1.519918441772461e-06, 1.564621925354004e-06, 1.6093254089355469e-06]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 12.0, 0.0, 0.0, 13.0, 0.0, 0.0, 27.0, 0.0, 0.0, 62.0, 0.0, 0.0, 0.0, 173.0, 0.0, 0.0, 435.0, 0.0, 0.0, 175.0, 0.0, 0.0, 64.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.370246410369873e-07, -6.183981895446777e-07, -5.997717380523682e-07, -5.811452865600586e-07, -5.62518835067749e-07, -5.438923835754395e-07, -5.252659320831299e-07, -5.066394805908203e-07, -4.880130290985107e-07, -4.6938657760620117e-07, -4.507601261138916e-07, -4.3213367462158203e-07, -4.1350722312927246e-07, -3.948807716369629e-07, -3.762543201446533e-07, -3.5762786865234375e-07, -3.390014171600342e-07, -3.203749656677246e-07, -3.0174851417541504e-07, -2.8312206268310547e-07, -2.644956111907959e-07, -2.4586915969848633e-07, -2.2724270820617676e-07, -2.086162567138672e-07, -1.8998980522155762e-07, -1.7136335372924805e-07, -1.5273690223693848e-07, -1.341104507446289e-07, -1.1548399925231934e-07, -9.685754776000977e-08, -7.82310962677002e-08, -5.960464477539063e-08, -4.0978193283081055e-08, -2.2351741790771484e-08, -3.725290298461914e-09, 1.4901161193847656e-08, 3.3527612686157227e-08, 5.21540641784668e-08, 7.078051567077637e-08, 8.940696716308594e-08, 1.0803341865539551e-07, 1.2665987014770508e-07, 1.4528632164001465e-07, 1.6391277313232422e-07, 1.825392246246338e-07, 2.0116567611694336e-07, 2.1979212760925293e-07, 2.384185791015625e-07, 2.5704503059387207e-07, 2.7567148208618164e-07, 2.942979335784912e-07, 3.129243850708008e-07, 3.3155083656311035e-07, 3.501772880554199e-07, 3.688037395477295e-07, 3.8743019104003906e-07, 4.0605664253234863e-07, 4.246830940246582e-07, 4.4330954551696777e-07, 4.6193599700927734e-07, 4.805624485015869e-07, 4.991888999938965e-07, 5.178153514862061e-07, 5.364418029785156e-07]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 8.0, 9.0, 11.0, 16.0, 19.0, 30.0, 36.0, 58.0, 101.0, 175.0, 178.0, 92.0, 70.0, 40.0, 33.0, 28.0, 16.0, 13.0, 5.0, 8.0, 11.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.660232611466199e-05, -6.497985305031762e-05, -6.335737271001562e-05, -6.173489964567125e-05, -6.011241930536926e-05, -5.848994624102488e-05, -5.686746590072289e-05, -5.5244992836378515e-05, -5.362251613405533e-05, -5.200003943173215e-05, -5.0377562729408965e-05, -4.875508602708578e-05, -4.71326093247626e-05, -4.5510132622439414e-05, -4.388765955809504e-05, -4.2265182855771855e-05, -4.064270615344867e-05, -3.902022945112549e-05, -3.7397752748802304e-05, -3.577527604647912e-05, -3.415279934415594e-05, -3.253032627981156e-05, -3.090784593950957e-05, -2.9285372875165194e-05, -2.7662892534863204e-05, -2.604041583254002e-05, -2.4417939130216837e-05, -2.2795462427893654e-05, -2.1172987544559874e-05, -1.955051084223669e-05, -1.7928034139913507e-05, -1.6305559256579727e-05, -1.4683082554256544e-05, -1.306060585193336e-05, -1.1438130059104878e-05, -9.815653356781695e-06, -8.193177563953213e-06, -6.57070086163003e-06, -4.9482241593068466e-06, -3.325748366478365e-06, -1.7032716641551815e-06, -8.079530289251124e-08, 1.541681058370159e-06, 3.164157533319667e-06, 4.7866337808954995e-06, 6.409110028471332e-06, 8.031586730794515e-06, 9.654062523622997e-06, 1.127653922594618e-05, 1.2899015928269364e-05, 1.4521491721097846e-05, 1.6143967513926327e-05, 1.776644421624951e-05, 1.9388920918572694e-05, 2.1011397620895877e-05, 2.263387432321906e-05, 2.4256351025542244e-05, 2.5878827727865428e-05, 2.750130443018861e-05, 2.9123781132511795e-05, 3.074625783483498e-05, 3.236873453715816e-05, 3.399120760150254e-05, 3.561368430382572e-05, 3.7236161006148905e-05]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 9.0, 8.0, 7.0, 9.0, 5.0, 8.0, 10.0, 16.0, 15.0, 14.0, 14.0, 19.0, 26.0, 23.0, 27.0, 9.0, 32.0, 30.0, 28.0, 28.0, 28.0, 48.0, 41.0, 40.0, 37.0, 33.0, 38.0, 35.0, 32.0, 22.0, 38.0, 32.0, 33.0, 20.0, 24.0, 20.0, 17.0, 15.0, 18.0, 12.0, 12.0, 9.0, 6.0, 14.0, 15.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.315750862180721e-05, -2.2394540792447515e-05, -2.1631571144098416e-05, -2.086860331473872e-05, -2.0105635485379025e-05, -1.9342665837029926e-05, -1.857969800767023e-05, -1.7816728359321132e-05, -1.7053760529961437e-05, -1.629079270060174e-05, -1.5527823052252643e-05, -1.4764855222892947e-05, -1.400188648403855e-05, -1.3238917745184153e-05, -1.2475949915824458e-05, -1.1712981176970061e-05, -1.0950013347610366e-05, -1.0187044608755969e-05, -9.424076779396273e-06, -8.661108040541876e-06, -7.898139301687479e-06, -7.135171017580433e-06, -6.372202733473387e-06, -5.6092339946189895e-06, -4.846265710511943e-06, -4.083297426404897e-06, -3.3203286875505e-06, -2.557360403443454e-06, -1.7943918919627322e-06, -1.0314233804820105e-06, -2.6845509637496434e-07, 4.945136424794327e-07, 1.257481926586479e-06, 2.0204504380672006e-06, 2.7834189495479222e-06, 3.5463872336549684e-06, 4.3093559725093655e-06, 5.072324256616412e-06, 5.835292540723458e-06, 6.598261279577855e-06, 7.361229563684901e-06, 8.124197847791947e-06, 8.887166586646345e-06, 9.650135325500742e-06, 1.0413103154860437e-05, 1.1176071893714834e-05, 1.1939040632569231e-05, 1.2702008461928926e-05, 1.3464977200783323e-05, 1.422794593963772e-05, 1.4990913768997416e-05, 1.575388159835711e-05, 1.651685124670621e-05, 1.7279819076065905e-05, 1.8042788724415004e-05, 1.88057565537747e-05, 1.9568724383134395e-05, 2.033169221249409e-05, 2.109466186084319e-05, 2.1857629690202884e-05, 2.262059751956258e-05, 2.338356716791168e-05, 2.4146534997271374e-05, 2.490950282663107e-05, 2.5672472474980168e-05]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 8.0, 8.0, 7.0, 17.0, 17.0, 23.0, 19.0, 32.0, 32.0, 51.0, 80.0, 112.0, 157.0, 216.0, 292.0, 479.0, 683.0, 987.0, 1512.0, 2539.0, 4244.0, 13165.0, 3934394.0, 219495.0, 6166.0, 3575.0, 2101.0, 1354.0, 781.0, 528.0, 379.0, 235.0, 169.0, 107.0, 70.0, 64.0, 50.0, 36.0, 25.0, 16.0, 16.0, 14.0, 11.0, 8.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.739927291870117e-05, -5.547143518924713e-05, -5.354359745979309e-05, -5.161575973033905e-05, -4.968792200088501e-05, -4.776008427143097e-05, -4.583224654197693e-05, -4.390440881252289e-05, -4.197657108306885e-05, -4.004873335361481e-05, -3.8120895624160767e-05, -3.6193057894706726e-05, -3.4265220165252686e-05, -3.2337382435798645e-05, -3.0409544706344604e-05, -2.8481706976890564e-05, -2.6553869247436523e-05, -2.4626031517982483e-05, -2.2698193788528442e-05, -2.0770356059074402e-05, -1.884251832962036e-05, -1.691468060016632e-05, -1.498684287071228e-05, -1.305900514125824e-05, -1.11311674118042e-05, -9.203329682350159e-06, -7.275491952896118e-06, -5.347654223442078e-06, -3.419816493988037e-06, -1.4919787645339966e-06, 4.3585896492004395e-07, 2.3636966943740845e-06, 4.291534423828125e-06, 6.2193721532821655e-06, 8.147209882736206e-06, 1.0075047612190247e-05, 1.2002885341644287e-05, 1.3930723071098328e-05, 1.5858560800552368e-05, 1.778639853000641e-05, 1.971423625946045e-05, 2.164207398891449e-05, 2.356991171836853e-05, 2.549774944782257e-05, 2.742558717727661e-05, 2.9353424906730652e-05, 3.128126263618469e-05, 3.320910036563873e-05, 3.5136938095092773e-05, 3.7064775824546814e-05, 3.8992613554000854e-05, 4.0920451283454895e-05, 4.2848289012908936e-05, 4.4776126742362976e-05, 4.6703964471817017e-05, 4.863180220127106e-05, 5.05596399307251e-05, 5.248747766017914e-05, 5.441531538963318e-05, 5.634315311908722e-05, 5.827099084854126e-05, 6.01988285779953e-05, 6.212666630744934e-05, 6.405450403690338e-05, 6.598234176635742e-05]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 5.0, 7.0, 13.0, 7.0, 8.0, 8.0, 11.0, 12.0, 18.0, 17.0, 29.0, 20.0, 21.0, 22.0, 22.0, 37.0, 33.0, 34.0, 43.0, 49.0, 51.0, 48.0, 56.0, 37.0, 27.0, 45.0, 38.0, 26.0, 38.0, 33.0, 29.0, 22.0, 25.0, 17.0, 9.0, 13.0, 12.0, 6.0, 13.0, 12.0, 4.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1086463928222656e-05, -1.0711140930652618e-05, -1.033581793308258e-05, -9.960494935512543e-06, -9.585171937942505e-06, -9.209848940372467e-06, -8.83452594280243e-06, -8.459202945232391e-06, -8.083879947662354e-06, -7.708556950092316e-06, -7.333233952522278e-06, -6.95791095495224e-06, -6.582587957382202e-06, -6.207264959812164e-06, -5.8319419622421265e-06, -5.456618964672089e-06, -5.081295967102051e-06, -4.705972969532013e-06, -4.330649971961975e-06, -3.955326974391937e-06, -3.5800039768218994e-06, -3.2046809792518616e-06, -2.8293579816818237e-06, -2.454034984111786e-06, -2.078711986541748e-06, -1.7033889889717102e-06, -1.3280659914016724e-06, -9.527429938316345e-07, -5.774199962615967e-07, -2.0209699869155884e-07, 1.73225998878479e-07, 5.485489964485168e-07, 9.238719940185547e-07, 1.2991949915885925e-06, 1.6745179891586304e-06, 2.0498409867286682e-06, 2.425163984298706e-06, 2.800486981868744e-06, 3.1758099794387817e-06, 3.5511329770088196e-06, 3.926455974578857e-06, 4.301778972148895e-06, 4.677101969718933e-06, 5.052424967288971e-06, 5.427747964859009e-06, 5.803070962429047e-06, 6.1783939599990845e-06, 6.553716957569122e-06, 6.92903995513916e-06, 7.304362952709198e-06, 7.679685950279236e-06, 8.055008947849274e-06, 8.430331945419312e-06, 8.80565494298935e-06, 9.180977940559387e-06, 9.556300938129425e-06, 9.931623935699463e-06, 1.03069469332695e-05, 1.0682269930839539e-05, 1.1057592928409576e-05, 1.1432915925979614e-05, 1.1808238923549652e-05, 1.218356192111969e-05, 1.2558884918689728e-05, 1.2934207916259766e-05]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 12.0, 3.0, 14.0, 46.0, 39.0, 135.0, 343.0, 1803.0, 42446.0, 4144204.0, 4330.0, 579.0, 155.0, 71.0, 43.0, 20.0, 6.0, 11.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010460615158081055, -9.966734796762466e-05, -9.472854435443878e-05, -8.97897407412529e-05, -8.485093712806702e-05, -7.991213351488113e-05, -7.497332990169525e-05, -7.003452628850937e-05, -6.509572267532349e-05, -6.0156919062137604e-05, -5.521811544895172e-05, -5.027931183576584e-05, -4.5340508222579956e-05, -4.0401704609394073e-05, -3.546290099620819e-05, -3.052409738302231e-05, -2.5585293769836426e-05, -2.0646490156650543e-05, -1.570768654346466e-05, -1.0768882930278778e-05, -5.8300793170928955e-06, -8.912757039070129e-07, 4.04752790927887e-06, 8.986331522464752e-06, 1.3925135135650635e-05, 1.8863938748836517e-05, 2.38027423620224e-05, 2.8741545975208282e-05, 3.3680349588394165e-05, 3.861915320158005e-05, 4.355795681476593e-05, 4.849676042795181e-05, 5.3435564041137695e-05, 5.837436765432358e-05, 6.331317126750946e-05, 6.825197488069534e-05, 7.319077849388123e-05, 7.812958210706711e-05, 8.306838572025299e-05, 8.800718933343887e-05, 9.294599294662476e-05, 9.788479655981064e-05, 0.00010282360017299652, 0.0001077624037861824, 0.00011270120739936829, 0.00011764001101255417, 0.00012257881462574005, 0.00012751761823892593, 0.00013245642185211182, 0.0001373952254652977, 0.00014233402907848358, 0.00014727283269166946, 0.00015221163630485535, 0.00015715043991804123, 0.0001620892435312271, 0.000167028047144413, 0.00017196685075759888, 0.00017690565437078476, 0.00018184445798397064, 0.00018678326159715652, 0.0001917220652103424, 0.0001966608688235283, 0.00020159967243671417, 0.00020653847604990005, 0.00021147727966308594]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 9.0, 5.0, 9.0, 16.0, 70.0, 470.0, 3027.0, 358.0, 51.0, 14.0, 10.0, 8.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1980533599853516e-05, -1.1393800377845764e-05, -1.0807067155838013e-05, -1.0220333933830261e-05, -9.63360071182251e-06, -9.046867489814758e-06, -8.460134267807007e-06, -7.873401045799255e-06, -7.286667823791504e-06, -6.6999346017837524e-06, -6.113201379776001e-06, -5.5264681577682495e-06, -4.939734935760498e-06, -4.353001713752747e-06, -3.766268491744995e-06, -3.1795352697372437e-06, -2.592802047729492e-06, -2.0060688257217407e-06, -1.4193356037139893e-06, -8.326023817062378e-07, -2.4586915969848633e-07, 3.4086406230926514e-07, 9.275972843170166e-07, 1.514330506324768e-06, 2.1010637283325195e-06, 2.687796950340271e-06, 3.2745301723480225e-06, 3.861263394355774e-06, 4.447996616363525e-06, 5.034729838371277e-06, 5.621463060379028e-06, 6.20819628238678e-06, 6.794929504394531e-06, 7.381662726402283e-06, 7.968395948410034e-06, 8.555129170417786e-06, 9.141862392425537e-06, 9.728595614433289e-06, 1.031532883644104e-05, 1.0902062058448792e-05, 1.1488795280456543e-05, 1.2075528502464294e-05, 1.2662261724472046e-05, 1.3248994946479797e-05, 1.3835728168487549e-05, 1.44224613904953e-05, 1.5009194612503052e-05, 1.5595927834510803e-05, 1.6182661056518555e-05, 1.6769394278526306e-05, 1.7356127500534058e-05, 1.794286072254181e-05, 1.852959394454956e-05, 1.9116327166557312e-05, 1.9703060388565063e-05, 2.0289793610572815e-05, 2.0876526832580566e-05, 2.1463260054588318e-05, 2.204999327659607e-05, 2.263672649860382e-05, 2.3223459720611572e-05, 2.3810192942619324e-05, 2.4396926164627075e-05, 2.4983659386634827e-05, 2.5570392608642578e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 3.0, 7.0, 13.0, 24.0, 34.0, 47.0, 82.0, 127.0, 224.0, 175.0, 90.0, 53.0, 30.0, 27.0, 14.0, 17.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04856946261134e-05, -3.943894989788532e-05, -3.8392205169657245e-05, -3.734546044142917e-05, -3.629871571320109e-05, -3.5251970984973013e-05, -3.420522989472374e-05, -3.3158485166495666e-05, -3.211174043826759e-05, -3.106499571003951e-05, -3.0018250981811434e-05, -2.8971506253583357e-05, -2.7924763344344683e-05, -2.6878018616116606e-05, -2.583127388788853e-05, -2.478452915966045e-05, -2.3737784431432374e-05, -2.2691039703204297e-05, -2.164429497497622e-05, -2.0597552065737545e-05, -1.9550807337509468e-05, -1.850406260928139e-05, -1.7457317881053314e-05, -1.6410573152825236e-05, -1.536382842459716e-05, -1.4317083696369082e-05, -1.3270339877635706e-05, -1.2223595149407629e-05, -1.1176851330674253e-05, -1.0130106602446176e-05, -9.083361874218099e-06, -8.036617145990022e-06, -6.989874236751348e-06, -5.943129963270621e-06, -4.896385689789895e-06, -3.849640961561818e-06, -2.8028966880810913e-06, -1.7561524146003649e-06, -7.094076863722876e-07, 3.3733658710843883e-07, 1.3840808605891652e-06, 2.4308251340698916e-06, 3.4775696349242935e-06, 4.524314135778695e-06, 5.571058409259422e-06, 6.617802682740148e-06, 7.664547410968225e-06, 8.711291229701601e-06, 9.758035957929678e-06, 1.0804780686157756e-05, 1.1851524504891131e-05, 1.2898269233119208e-05, 1.3945013051852584e-05, 1.4991757780080661e-05, 1.603850250830874e-05, 1.7085247236536816e-05, 1.8131991964764893e-05, 1.917873669299297e-05, 2.0225481421221048e-05, 2.1272226149449125e-05, 2.23189690586878e-05, 2.3365713786915876e-05, 2.4412458515143953e-05, 2.545920324337203e-05, 2.6505946152610704e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 10.0, 5.0, 12.0, 13.0, 11.0, 19.0, 19.0, 15.0, 20.0, 29.0, 36.0, 36.0, 38.0, 44.0, 40.0, 41.0, 37.0, 46.0, 30.0, 46.0, 54.0, 44.0, 42.0, 39.0, 40.0, 33.0, 26.0, 24.0, 40.0, 19.0, 16.0, 14.0, 11.0, 13.0, 7.0, 10.0, 10.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3450993719743565e-05, -1.3038894394412637e-05, -1.262679597857641e-05, -1.2214697562740184e-05, -1.1802598237409256e-05, -1.1390498912078328e-05, -1.0978400496242102e-05, -1.0566302080405876e-05, -1.0154202755074948e-05, -9.74210342974402e-06, -9.330005013907794e-06, -8.917906598071568e-06, -8.50580727274064e-06, -8.093707947409712e-06, -7.681609531573486e-06, -7.2695106609899085e-06, -6.857411790406331e-06, -6.445312919822754e-06, -6.033214049239177e-06, -5.6211151786556e-06, -5.209016308072023e-06, -4.796917437488446e-06, -4.384818566904869e-06, -3.972719696321292e-06, -3.5606208257377148e-06, -3.1485219551541377e-06, -2.7364230845705606e-06, -2.3243242139869835e-06, -1.9122253434034064e-06, -1.5001264728198294e-06, -1.0880276022362523e-06, -6.759287316526752e-07, -2.638298610690981e-07, 1.4826900951447897e-07, 5.60367880098056e-07, 9.724667506816331e-07, 1.3845656212652102e-06, 1.7966644918487873e-06, 2.2087633624323644e-06, 2.6208622330159415e-06, 3.0329611035995185e-06, 3.4450599741830956e-06, 3.857158844766673e-06, 4.26925771535025e-06, 4.681356585933827e-06, 5.093455456517404e-06, 5.505554327100981e-06, 5.917653197684558e-06, 6.329752068268135e-06, 6.741850938851712e-06, 7.153949809435289e-06, 7.5660486800188664e-06, 7.978147550602444e-06, 8.390246875933371e-06, 8.802345291769598e-06, 9.214443707605824e-06, 9.626543032936752e-06, 1.003864235826768e-05, 1.0450740774103906e-05, 1.0862839189940132e-05, 1.127493851527106e-05, 1.1687037840601988e-05, 1.2099136256438214e-05, 1.251123467227444e-05, 1.2923333997605368e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 1.0, 7.0, 14.0, 33.0, 21.0, 58.0, 136.0, 216.0, 227.0, 773.0, 1849.0, 6142.0, 8411.0, 130611.0, 859689.0, 22652.0, 12275.0, 3244.0, 1143.0, 298.0, 371.0, 172.0, 87.0, 24.0, 38.0, 20.0, 10.0, 5.0, 11.0, 4.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337860107421875e-06, -3.234483301639557e-06, -3.1311064958572388e-06, -3.0277296900749207e-06, -2.9243528842926025e-06, -2.8209760785102844e-06, -2.7175992727279663e-06, -2.614222466945648e-06, -2.51084566116333e-06, -2.407468855381012e-06, -2.304092049598694e-06, -2.2007152438163757e-06, -2.0973384380340576e-06, -1.9939616322517395e-06, -1.8905848264694214e-06, -1.7872080206871033e-06, -1.6838312149047852e-06, -1.580454409122467e-06, -1.477077603340149e-06, -1.3737007975578308e-06, -1.2703239917755127e-06, -1.1669471859931946e-06, -1.0635703802108765e-06, -9.601935744285583e-07, -8.568167686462402e-07, -7.534399628639221e-07, -6.50063157081604e-07, -5.466863512992859e-07, -4.4330954551696777e-07, -3.3993273973464966e-07, -2.3655593395233154e-07, -1.3317912817001343e-07, -2.9802322387695312e-08, 7.35744833946228e-08, 1.7695128917694092e-07, 2.8032809495925903e-07, 3.8370490074157715e-07, 4.870817065238953e-07, 5.904585123062134e-07, 6.938353180885315e-07, 7.972121238708496e-07, 9.005889296531677e-07, 1.0039657354354858e-06, 1.107342541217804e-06, 1.210719347000122e-06, 1.3140961527824402e-06, 1.4174729585647583e-06, 1.5208497643470764e-06, 1.6242265701293945e-06, 1.7276033759117126e-06, 1.8309801816940308e-06, 1.934356987476349e-06, 2.037733793258667e-06, 2.141110599040985e-06, 2.2444874048233032e-06, 2.3478642106056213e-06, 2.4512410163879395e-06, 2.5546178221702576e-06, 2.6579946279525757e-06, 2.761371433734894e-06, 2.864748239517212e-06, 2.96812504529953e-06, 3.071501851081848e-06, 3.1748786568641663e-06, 3.2782554626464844e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 14.0, 10.0, 12.0, 18.0, 23.0, 24.0, 34.0, 48.0, 48.0, 50.0, 71.0, 63.0, 63.0, 84.0, 68.0, 60.0, 65.0, 54.0, 37.0, 49.0, 29.0, 18.0, 13.0, 18.0, 8.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.621246337890625e-05, -1.5815719962120056e-05, -1.5418976545333862e-05, -1.5022233128547668e-05, -1.4625489711761475e-05, -1.422874629497528e-05, -1.3832002878189087e-05, -1.3435259461402893e-05, -1.30385160446167e-05, -1.2641772627830505e-05, -1.2245029211044312e-05, -1.1848285794258118e-05, -1.1451542377471924e-05, -1.105479896068573e-05, -1.0658055543899536e-05, -1.0261312127113342e-05, -9.864568710327148e-06, -9.467825293540955e-06, -9.07108187675476e-06, -8.674338459968567e-06, -8.277595043182373e-06, -7.88085162639618e-06, -7.484108209609985e-06, -7.0873647928237915e-06, -6.690621376037598e-06, -6.293877959251404e-06, -5.89713454246521e-06, -5.500391125679016e-06, -5.103647708892822e-06, -4.706904292106628e-06, -4.3101608753204346e-06, -3.913417458534241e-06, -3.516674041748047e-06, -3.119930624961853e-06, -2.723187208175659e-06, -2.3264437913894653e-06, -1.9297003746032715e-06, -1.5329569578170776e-06, -1.1362135410308838e-06, -7.394701242446899e-07, -3.427267074584961e-07, 5.4016709327697754e-08, 4.507601261138916e-07, 8.475035429000854e-07, 1.2442469596862793e-06, 1.6409903764724731e-06, 2.037733793258667e-06, 2.434477210044861e-06, 2.8312206268310547e-06, 3.2279640436172485e-06, 3.6247074604034424e-06, 4.021450877189636e-06, 4.41819429397583e-06, 4.814937710762024e-06, 5.211681127548218e-06, 5.608424544334412e-06, 6.0051679611206055e-06, 6.401911377906799e-06, 6.798654794692993e-06, 7.195398211479187e-06, 7.592141628265381e-06, 7.988885045051575e-06, 8.385628461837769e-06, 8.782371878623962e-06, 9.179115295410156e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 13.0, 0.0, 0.0, 11.0, 0.0, 0.0, 32.0, 0.0, 0.0, 66.0, 0.0, 0.0, 120.0, 0.0, 0.0, 251.0, 0.0, 0.0, 850.0, 0.0, 0.0, 21562.0, 0.0, 1002767.0, 0.0, 0.0, 21580.0, 0.0, 0.0, 847.0, 0.0, 0.0, 226.0, 0.0, 0.0, 124.0, 0.0, 0.0, 61.0, 0.0, 0.0, 33.0, 0.0, 0.0, 14.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.152557373046875e-07, -6.94766640663147e-07, -6.742775440216064e-07, -6.537884473800659e-07, -6.332993507385254e-07, -6.128102540969849e-07, -5.923211574554443e-07, -5.718320608139038e-07, -5.513429641723633e-07, -5.308538675308228e-07, -5.103647708892822e-07, -4.898756742477417e-07, -4.6938657760620117e-07, -4.4889748096466064e-07, -4.284083843231201e-07, -4.079192876815796e-07, -3.8743019104003906e-07, -3.6694109439849854e-07, -3.46451997756958e-07, -3.259629011154175e-07, -3.0547380447387695e-07, -2.849847078323364e-07, -2.644956111907959e-07, -2.4400651454925537e-07, -2.2351741790771484e-07, -2.0302832126617432e-07, -1.825392246246338e-07, -1.6205012798309326e-07, -1.4156103134155273e-07, -1.210719347000122e-07, -1.0058283805847168e-07, -8.009374141693115e-08, -5.960464477539063e-08, -3.91155481338501e-08, -1.862645149230957e-08, 1.862645149230957e-09, 2.2351741790771484e-08, 4.284083843231201e-08, 6.332993507385254e-08, 8.381903171539307e-08, 1.043081283569336e-07, 1.2479722499847412e-07, 1.4528632164001465e-07, 1.6577541828155518e-07, 1.862645149230957e-07, 2.0675361156463623e-07, 2.2724270820617676e-07, 2.477318048477173e-07, 2.682209014892578e-07, 2.8870999813079834e-07, 3.0919909477233887e-07, 3.296881914138794e-07, 3.501772880554199e-07, 3.7066638469696045e-07, 3.91155481338501e-07, 4.116445779800415e-07, 4.3213367462158203e-07, 4.5262277126312256e-07, 4.731118679046631e-07, 4.936009645462036e-07, 5.140900611877441e-07, 5.345791578292847e-07, 5.550682544708252e-07, 5.755573511123657e-07, 5.960464477539062e-07]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 0.0, 7.0, 6.0, 8.0, 7.0, 10.0, 8.0, 17.0, 21.0, 16.0, 20.0, 21.0, 35.0, 30.0, 19.0, 47.0, 39.0, 48.0, 53.0, 50.0, 42.0, 43.0, 49.0, 45.0, 37.0, 40.0, 32.0, 38.0, 35.0, 22.0, 27.0, 20.0, 18.0, 13.0, 15.0, 15.0, 10.0, 10.0, 10.0, 2.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8715858459472656e-05, -1.8182210624217987e-05, -1.7648562788963318e-05, -1.711491495370865e-05, -1.658126711845398e-05, -1.604761928319931e-05, -1.551397144794464e-05, -1.4980323612689972e-05, -1.4446675777435303e-05, -1.3913027942180634e-05, -1.3379380106925964e-05, -1.2845732271671295e-05, -1.2312084436416626e-05, -1.1778436601161957e-05, -1.1244788765907288e-05, -1.0711140930652618e-05, -1.017749309539795e-05, -9.64384526014328e-06, -9.11019742488861e-06, -8.576549589633942e-06, -8.042901754379272e-06, -7.509253919124603e-06, -6.975606083869934e-06, -6.441958248615265e-06, -5.908310413360596e-06, -5.3746625781059265e-06, -4.841014742851257e-06, -4.307366907596588e-06, -3.773719072341919e-06, -3.2400712370872498e-06, -2.7064234018325806e-06, -2.1727755665779114e-06, -1.6391277313232422e-06, -1.105479896068573e-06, -5.718320608139038e-07, -3.818422555923462e-08, 4.954636096954346e-07, 1.0291114449501038e-06, 1.562759280204773e-06, 2.096407115459442e-06, 2.6300549507141113e-06, 3.1637027859687805e-06, 3.6973506212234497e-06, 4.230998456478119e-06, 4.764646291732788e-06, 5.298294126987457e-06, 5.8319419622421265e-06, 6.365589797496796e-06, 6.899237632751465e-06, 7.432885468006134e-06, 7.966533303260803e-06, 8.500181138515472e-06, 9.033828973770142e-06, 9.56747680902481e-06, 1.010112464427948e-05, 1.063477247953415e-05, 1.1168420314788818e-05, 1.1702068150043488e-05, 1.2235715985298157e-05, 1.2769363820552826e-05, 1.3303011655807495e-05, 1.3836659491062164e-05, 1.4370307326316833e-05, 1.4903955161571503e-05, 1.5437602996826172e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 128.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 633.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 125.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0], "bins": [-2.980232238769531e-07, -2.905726432800293e-07, -2.8312206268310547e-07, -2.7567148208618164e-07, -2.682209014892578e-07, -2.60770320892334e-07, -2.5331974029541016e-07, -2.4586915969848633e-07, -2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 23.0, 51.0, 161.0, 477.0, 181.0, 61.0, 29.0, 11.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.199952960945666e-05, -7.04186677467078e-05, -6.883781315991655e-05, -6.725695129716769e-05, -6.567608943441883e-05, -6.409523484762758e-05, -6.251437298487872e-05, -6.093351112212986e-05, -5.93526528973598e-05, -5.777179467258975e-05, -5.619093280984089e-05, -5.4610074585070834e-05, -5.302921636030078e-05, -5.144835449755192e-05, -4.9867496272781864e-05, -4.828663804801181e-05, -4.670577618526295e-05, -4.5124917960492894e-05, -4.354405609774403e-05, -4.196319787297398e-05, -4.038233601022512e-05, -3.880147778545506e-05, -3.722061956068501e-05, -3.563975769793615e-05, -3.405889947316609e-05, -3.247804124839604e-05, -3.089717938564718e-05, -2.9316321160877123e-05, -2.7735461117117666e-05, -2.6154601073358208e-05, -2.4573742848588154e-05, -2.2992882804828696e-05, -2.1412026399048045e-05, -1.9831166355288588e-05, -1.825030631152913e-05, -1.6669448086759076e-05, -1.5088588042999618e-05, -1.350772799924016e-05, -1.1926868864975404e-05, -1.0346009730710648e-05, -8.76514968695119e-06, -7.184290097939083e-06, -5.6034305089269765e-06, -4.02257091991487e-06, -2.4417113309027627e-06, -8.608512871433049e-07, 7.20007847121451e-07, 2.300866981386207e-06, 3.881727025145665e-06, 5.462586614157772e-06, 7.0434462031698786e-06, 8.624305337434635e-06, 1.0205165381194092e-05, 1.178602542495355e-05, 1.3366884559218306e-05, 1.4947743693483062e-05, 1.652860373724252e-05, 1.8109463781001978e-05, 1.9690323824761435e-05, 2.127118204953149e-05, 2.2852042093290947e-05, 2.4432902137050405e-05, 2.601376036182046e-05, 2.7594620405579917e-05, 2.9175480449339375e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 14.0, 16.0, 18.0, 24.0, 26.0, 32.0, 54.0, 48.0, 55.0, 64.0, 56.0, 57.0, 56.0, 69.0, 69.0, 52.0, 58.0, 42.0, 44.0, 34.0, 35.0, 15.0, 13.0, 18.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.46016491271439e-05, -1.4238306903280318e-05, -1.3874964679416735e-05, -1.3511622455553152e-05, -1.3148279322194867e-05, -1.2784937098331284e-05, -1.24215948744677e-05, -1.2058252650604118e-05, -1.1694910426740535e-05, -1.1331568202876952e-05, -1.0968225979013368e-05, -1.0604883755149785e-05, -1.0241541531286202e-05, -9.878198397927918e-06, -9.514856174064334e-06, -9.151513950200751e-06, -8.788171726337168e-06, -8.424829502473585e-06, -8.061487278610002e-06, -7.69814505474642e-06, -7.334802376135485e-06, -6.971460152271902e-06, -6.608117473660968e-06, -6.244775249797385e-06, -5.881433025933802e-06, -5.518090802070219e-06, -5.154748578206636e-06, -4.791405899595702e-06, -4.428063675732119e-06, -4.064721451868536e-06, -3.7013790006312774e-06, -3.338036549394019e-06, -2.9746952350251377e-06, -2.6113530111615546e-06, -2.248010559924296e-06, -1.8846682223738753e-06, -1.5213258848234545e-06, -1.1579835472730338e-06, -7.94641209722613e-07, -4.312987584853545e-07, -6.795653462177143e-08, 2.9538580292864935e-07, 6.587281404790701e-07, 1.022070478029491e-06, 1.3854128155799117e-06, 1.7487551531303325e-06, 2.1120974906807533e-06, 2.4754399419180118e-06, 2.838782165781595e-06, 3.202124389645178e-06, 3.5654668408824364e-06, 3.928809292119695e-06, 4.292151515983278e-06, 4.655493739846861e-06, 5.018836418457795e-06, 5.382178642321378e-06, 5.745520866184961e-06, 6.108863090048544e-06, 6.472205313912127e-06, 6.835547992523061e-06, 7.198890216386644e-06, 7.562232440250227e-06, 7.925575118861161e-06, 8.288917342724744e-06, 8.652259566588327e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 12.0, 15.0, 21.0, 28.0, 46.0, 47.0, 95.0, 127.0, 266.0, 598.0, 1289.0, 3699.0, 9890.0, 37870.0, 235824.0, 646562.0, 83587.0, 18248.0, 6442.0, 2221.0, 794.0, 371.0, 163.0, 123.0, 50.0, 33.0, 36.0, 33.0, 23.0, 9.0, 10.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.300739288330078e-05, -2.231542021036148e-05, -2.162344753742218e-05, -2.093147486448288e-05, -2.023950219154358e-05, -1.954752951860428e-05, -1.8855556845664978e-05, -1.8163584172725677e-05, -1.7471611499786377e-05, -1.6779638826847076e-05, -1.6087666153907776e-05, -1.5395693480968475e-05, -1.4703720808029175e-05, -1.4011748135089874e-05, -1.3319775462150574e-05, -1.2627802789211273e-05, -1.1935830116271973e-05, -1.1243857443332672e-05, -1.0551884770393372e-05, -9.859912097454071e-06, -9.16793942451477e-06, -8.47596675157547e-06, -7.78399407863617e-06, -7.092021405696869e-06, -6.400048732757568e-06, -5.708076059818268e-06, -5.016103386878967e-06, -4.324130713939667e-06, -3.632158041000366e-06, -2.9401853680610657e-06, -2.248212695121765e-06, -1.5562400221824646e-06, -8.642673492431641e-07, -1.7229467630386353e-07, 5.19677996635437e-07, 1.2116506695747375e-06, 1.903623342514038e-06, 2.5955960154533386e-06, 3.287568688392639e-06, 3.97954136133194e-06, 4.67151403427124e-06, 5.363486707210541e-06, 6.055459380149841e-06, 6.747432053089142e-06, 7.439404726028442e-06, 8.131377398967743e-06, 8.823350071907043e-06, 9.515322744846344e-06, 1.0207295417785645e-05, 1.0899268090724945e-05, 1.1591240763664246e-05, 1.2283213436603546e-05, 1.2975186109542847e-05, 1.3667158782482147e-05, 1.4359131455421448e-05, 1.5051104128360748e-05, 1.574307680130005e-05, 1.643504947423935e-05, 1.712702214717865e-05, 1.781899482011795e-05, 1.851096749305725e-05, 1.920294016599655e-05, 1.9894912838935852e-05, 2.0586885511875153e-05, 2.1278858184814453e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 10.0, 12.0, 12.0, 21.0, 23.0, 25.0, 31.0, 36.0, 49.0, 53.0, 46.0, 59.0, 67.0, 75.0, 59.0, 70.0, 65.0, 41.0, 48.0, 25.0, 31.0, 24.0, 25.0, 14.0, 17.0, 16.0, 8.0, 11.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.614757537841797e-05, -5.441159009933472e-05, -5.2675604820251465e-05, -5.093961954116821e-05, -4.920363426208496e-05, -4.746764898300171e-05, -4.573166370391846e-05, -4.3995678424835205e-05, -4.225969314575195e-05, -4.05237078666687e-05, -3.878772258758545e-05, -3.70517373085022e-05, -3.5315752029418945e-05, -3.357976675033569e-05, -3.184378147125244e-05, -3.010779619216919e-05, -2.8371810913085938e-05, -2.6635825634002686e-05, -2.4899840354919434e-05, -2.316385507583618e-05, -2.142786979675293e-05, -1.9691884517669678e-05, -1.7955899238586426e-05, -1.6219913959503174e-05, -1.4483928680419922e-05, -1.274794340133667e-05, -1.1011958122253418e-05, -9.275972843170166e-06, -7.539987564086914e-06, -5.804002285003662e-06, -4.06801700592041e-06, -2.332031726837158e-06, -5.960464477539062e-07, 1.1399388313293457e-06, 2.8759241104125977e-06, 4.61190938949585e-06, 6.3478946685791016e-06, 8.083879947662354e-06, 9.819865226745605e-06, 1.1555850505828857e-05, 1.329183578491211e-05, 1.5027821063995361e-05, 1.6763806343078613e-05, 1.8499791622161865e-05, 2.0235776901245117e-05, 2.197176218032837e-05, 2.370774745941162e-05, 2.5443732738494873e-05, 2.7179718017578125e-05, 2.8915703296661377e-05, 3.065168857574463e-05, 3.238767385482788e-05, 3.412365913391113e-05, 3.5859644412994385e-05, 3.759562969207764e-05, 3.933161497116089e-05, 4.106760025024414e-05, 4.280358552932739e-05, 4.4539570808410645e-05, 4.6275556087493896e-05, 4.801154136657715e-05, 4.97475266456604e-05, 5.148351192474365e-05, 5.3219497203826904e-05, 5.4955482482910156e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 1.0, 10.0, 11.0, 9.0, 12.0, 16.0, 18.0, 26.0, 20.0, 29.0, 42.0, 59.0, 96.0, 149.0, 410.0, 2076.0, 1042823.0, 1835.0, 405.0, 152.0, 94.0, 49.0, 35.0, 38.0, 22.0, 17.0, 22.0, 15.0, 11.0, 5.0, 7.0, 14.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00013518333435058594, -0.0001313723623752594, -0.00012756139039993286, -0.00012375041842460632, -0.00011993944644927979, -0.00011612847447395325, -0.00011231750249862671, -0.00010850653052330017, -0.00010469555854797363, -0.0001008845865726471, -9.707361459732056e-05, -9.326264262199402e-05, -8.945167064666748e-05, -8.564069867134094e-05, -8.18297266960144e-05, -7.801875472068787e-05, -7.420778274536133e-05, -7.039681077003479e-05, -6.658583879470825e-05, -6.277486681938171e-05, -5.8963894844055176e-05, -5.515292286872864e-05, -5.13419508934021e-05, -4.753097891807556e-05, -4.3720006942749023e-05, -3.9909034967422485e-05, -3.609806299209595e-05, -3.228709101676941e-05, -2.847611904144287e-05, -2.4665147066116333e-05, -2.0854175090789795e-05, -1.7043203115463257e-05, -1.3232231140136719e-05, -9.42125916481018e-06, -5.610287189483643e-06, -1.7993152141571045e-06, 2.0116567611694336e-06, 5.822628736495972e-06, 9.63360071182251e-06, 1.3444572687149048e-05, 1.7255544662475586e-05, 2.1066516637802124e-05, 2.4877488613128662e-05, 2.86884605884552e-05, 3.249943256378174e-05, 3.6310404539108276e-05, 4.0121376514434814e-05, 4.393234848976135e-05, 4.774332046508789e-05, 5.155429244041443e-05, 5.536526441574097e-05, 5.9176236391067505e-05, 6.298720836639404e-05, 6.679818034172058e-05, 7.060915231704712e-05, 7.442012429237366e-05, 7.82310962677002e-05, 8.204206824302673e-05, 8.585304021835327e-05, 8.966401219367981e-05, 9.347498416900635e-05, 9.728595614433289e-05, 0.00010109692811965942, 0.00010490790009498596, 0.0001087188720703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 13.0, 9.0, 4.0, 5.0, 11.0, 24.0, 15.0, 23.0, 27.0, 23.0, 47.0, 43.0, 48.0, 42.0, 63.0, 65.0, 52.0, 64.0, 62.0, 49.0, 62.0, 44.0, 30.0, 20.0, 32.0, 20.0, 19.0, 16.0, 11.0, 11.0, 5.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.226799011230469e-05, -8.966494351625443e-05, -8.706189692020416e-05, -8.44588503241539e-05, -8.185580372810364e-05, -7.925275713205338e-05, -7.664971053600311e-05, -7.404666393995285e-05, -7.144361734390259e-05, -6.884057074785233e-05, -6.623752415180206e-05, -6.36344775557518e-05, -6.103143095970154e-05, -5.8428384363651276e-05, -5.582533776760101e-05, -5.322229117155075e-05, -5.061924457550049e-05, -4.8016197979450226e-05, -4.541315138339996e-05, -4.28101047873497e-05, -4.020705819129944e-05, -3.7604011595249176e-05, -3.5000964999198914e-05, -3.239791840314865e-05, -2.979487180709839e-05, -2.7191825211048126e-05, -2.4588778614997864e-05, -2.19857320189476e-05, -1.938268542289734e-05, -1.6779638826847076e-05, -1.4176592230796814e-05, -1.1573545634746552e-05, -8.970499038696289e-06, -6.367452442646027e-06, -3.764405846595764e-06, -1.1613592505455017e-06, 1.4416873455047607e-06, 4.044733941555023e-06, 6.647780537605286e-06, 9.250827133655548e-06, 1.185387372970581e-05, 1.4456920325756073e-05, 1.7059966921806335e-05, 1.9663013517856598e-05, 2.226606011390686e-05, 2.4869106709957123e-05, 2.7472153306007385e-05, 3.0075199902057648e-05, 3.267824649810791e-05, 3.528129309415817e-05, 3.7884339690208435e-05, 4.04873862862587e-05, 4.309043288230896e-05, 4.569347947835922e-05, 4.8296526074409485e-05, 5.089957267045975e-05, 5.350261926651001e-05, 5.610566586256027e-05, 5.8708712458610535e-05, 6.13117590546608e-05, 6.391480565071106e-05, 6.651785224676132e-05, 6.912089884281158e-05, 7.172394543886185e-05, 7.432699203491211e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 10.0, 6.0, 39.0, 25.0, 120.0, 386.0, 3289.0, 1041297.0, 2825.0, 311.0, 117.0, 0.0, 26.0, 38.0, 8.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.4938414096832275e-06, -1.4379620552062988e-06, -1.3820827007293701e-06, -1.3262033462524414e-06, -1.2703239917755127e-06, -1.214444637298584e-06, -1.1585652828216553e-06, -1.1026859283447266e-06, -1.0468065738677979e-06, -9.909272193908691e-07, -9.350478649139404e-07, -8.791685104370117e-07, -8.23289155960083e-07, -7.674098014831543e-07, -7.115304470062256e-07, -6.556510925292969e-07, -5.997717380523682e-07, -5.438923835754395e-07, -4.880130290985107e-07, -4.3213367462158203e-07, -3.762543201446533e-07, -3.203749656677246e-07, -2.644956111907959e-07, -2.086162567138672e-07, -1.5273690223693848e-07, -9.685754776000977e-08, -4.0978193283081055e-08, 1.4901161193847656e-08, 7.078051567077637e-08, 1.2665987014770508e-07, 1.825392246246338e-07, 2.384185791015625e-07, 2.942979335784912e-07, 3.501772880554199e-07, 4.0605664253234863e-07, 4.6193599700927734e-07, 5.178153514862061e-07, 5.736947059631348e-07, 6.295740604400635e-07, 6.854534149169922e-07, 7.413327693939209e-07, 7.972121238708496e-07, 8.530914783477783e-07, 9.08970832824707e-07, 9.648501873016357e-07, 1.0207295417785645e-06, 1.0766088962554932e-06, 1.1324882507324219e-06, 1.1883676052093506e-06, 1.2442469596862793e-06, 1.300126314163208e-06, 1.3560056686401367e-06, 1.4118850231170654e-06, 1.4677643775939941e-06, 1.5236437320709229e-06, 1.5795230865478516e-06, 1.6354024410247803e-06, 1.691281795501709e-06, 1.7471611499786377e-06, 1.8030405044555664e-06, 1.8589198589324951e-06, 1.914799213409424e-06, 1.9706785678863525e-06, 2.0265579223632812e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [28.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 985.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.0, 0.0, 0.0, 0.0, 0.0, 0.0, 591.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7062.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1032816.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7238.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 673.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0], "bins": [-3.5762786865234375e-07, -3.4831464290618896e-07, -3.390014171600342e-07, -3.296881914138794e-07, -3.203749656677246e-07, -3.110617399215698e-07, -3.0174851417541504e-07, -2.9243528842926025e-07, -2.8312206268310547e-07, -2.738088369369507e-07, -2.644956111907959e-07, -2.551823854446411e-07, -2.4586915969848633e-07, -2.3655593395233154e-07, -2.2724270820617676e-07, -2.1792948246002197e-07, -2.086162567138672e-07, -1.993030309677124e-07, -1.8998980522155762e-07, -1.8067657947540283e-07, -1.7136335372924805e-07, -1.6205012798309326e-07, -1.5273690223693848e-07, -1.434236764907837e-07, -1.341104507446289e-07, -1.2479722499847412e-07, -1.1548399925231934e-07, -1.0617077350616455e-07, -9.685754776000977e-08, -8.754432201385498e-08, -7.82310962677002e-08, -6.891787052154541e-08, -5.960464477539063e-08, -5.029141902923584e-08, -4.0978193283081055e-08, -3.166496753692627e-08, -2.2351741790771484e-08, -1.30385160446167e-08, -3.725290298461914e-09, 5.587935447692871e-09, 1.4901161193847656e-08, 2.421438694000244e-08, 3.3527612686157227e-08, 4.284083843231201e-08, 5.21540641784668e-08, 6.146728992462158e-08, 7.078051567077637e-08, 8.009374141693115e-08, 8.940696716308594e-08, 9.872019290924072e-08, 1.0803341865539551e-07, 1.1734664440155029e-07, 1.2665987014770508e-07, 1.3597309589385986e-07, 1.4528632164001465e-07, 1.5459954738616943e-07, 1.6391277313232422e-07, 1.73225998878479e-07, 1.825392246246338e-07, 1.9185245037078857e-07, 2.0116567611694336e-07, 2.1047890186309814e-07, 2.1979212760925293e-07, 2.2910535335540771e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 915.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1009.0, 12.0, 2.0], "bins": [-0.0013530079741030931, -0.0013311069924384356, -0.0013092058943584561, -0.0012873049126937985, -0.001265403931029141, -0.0012435028329491615, -0.001221601851284504, -0.0011997008696198463, -0.0011777998879551888, -0.0011558989062905312, -0.0011339978082105517, -0.0011120968265458941, -0.0010901958448812366, -0.0010682947468012571, -0.0010463937651365995, -0.001024492783471942, -0.0010025916853919625, -0.000980690703727305, -0.0009587896638549864, -0.0009368886239826679, -0.0009149876423180103, -0.0008930866024456918, -0.0008711855625733733, -0.0008492845809087157, -0.0008273835410363972, -0.0008054825011640787, -0.0007835815194994211, -0.0007616804796271026, -0.0007397794397547841, -0.0007178784580901265, -0.000695977418217808, -0.0006740763783454895, -0.0006521753966808319, -0.0006302743568085134, -0.0006083733751438558, -0.0005864723352715373, -0.0005645713536068797, -0.0005426703137345612, -0.0005207692738622427, -0.0004988682921975851, -0.00047696728142909706, -0.000455066270660609, -0.0004331652307882905, -0.00041126422001980245, -0.0003893632092513144, -0.00036746219848282635, -0.0003455611877143383, -0.0003236601478420198, -0.00030175913707353175, -0.0002798581263050437, -0.0002579570864327252, -0.00023605607566423714, -0.0002141550648957491, -0.00019225405412726104, -0.00017035302880685776, -0.0001484520034864545, -0.00012655099271796644, -0.00010464997467352077, -8.274895662907511e-05, -6.0847938584629446e-05, -3.894692054018378e-05, -1.704590249573812e-05, 4.855115548707545e-06, 2.6756140869110823e-05, 4.865715163759887e-05]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 1.0, 3.0, 7.0, 2.0, 6.0, 7.0, 10.0, 12.0, 21.0, 13.0, 16.0, 25.0, 32.0, 16.0, 33.0, 37.0, 42.0, 39.0, 33.0, 38.0, 40.0, 41.0, 46.0, 37.0, 40.0, 43.0, 35.0, 37.0, 37.0, 23.0, 24.0, 30.0, 28.0, 23.0, 21.0, 14.0, 19.0, 8.0, 12.0, 10.0, 6.0, 17.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00014106053276918828, -0.00013702278374694288, -0.00013298503472469747, -0.00012894728570245206, -0.00012490953668020666, -0.00012087178038200364, -0.00011683402408380061, -0.0001127962750615552, -0.0001087585260393098, -0.00010472077701706439, -0.00010068302799481899, -9.664527169661596e-05, -9.260752267437056e-05, -8.856977365212515e-05, -8.453201735392213e-05, -8.049426833167672e-05, -7.645651930943131e-05, -7.241877028718591e-05, -6.83810212649405e-05, -6.434326496673748e-05, -6.030551594449207e-05, -5.6267766922246665e-05, -5.223001426202245e-05, -4.8192261601798236e-05, -4.415451257955283e-05, -4.011676355730742e-05, -3.607901089708321e-05, -3.2041258236858994e-05, -2.8003509214613587e-05, -2.3965758373378776e-05, -1.9928007532143965e-05, -1.5890256690909155e-05, -1.1852520401589572e-05, -7.814769560354762e-06, -3.777018719119951e-06, 2.607321221148595e-07, 4.29848296334967e-06, 8.33623380458448e-06, 1.2373984645819291e-05, 1.6411735487054102e-05, 2.0449486328288913e-05, 2.4487237169523723e-05, 2.8524988010758534e-05, 3.256274067098275e-05, 3.6600489693228155e-05, 4.063823871547356e-05, 4.467599137569778e-05, 4.871374403592199e-05, 5.27514930581674e-05, 5.6789242080412805e-05, 6.082699474063702e-05, 6.486474740086123e-05, 6.890249642310664e-05, 7.294024544535205e-05, 7.697800174355507e-05, 8.101575076580048e-05, 8.505349978804588e-05, 8.909124881029129e-05, 9.31289978325367e-05, 9.716675413073972e-05, 0.00010120450315298513, 0.00010524225217523053, 0.00010928000847343355, 0.00011331775749567896, 0.00011735550651792437]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 12.0, 2.0, 13.0, 2.0, 10.0, 4.0, 15.0, 14.0, 30.0, 9.0, 42.0, 9.0, 51.0, 27.0, 70.0, 68.0, 173.0, 345.0, 3939282.0, 253240.0, 308.0, 195.0, 71.0, 67.0, 21.0, 43.0, 21.0, 34.0, 9.0, 18.0, 11.0, 17.0, 5.0, 14.0, 9.0, 14.0, 3.0, 8.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011599063873291016, -0.00011212378740310669, -0.00010825693607330322, -0.00010439008474349976, -0.00010052323341369629, -9.665638208389282e-05, -9.278953075408936e-05, -8.892267942428589e-05, -8.505582809448242e-05, -8.118897676467896e-05, -7.732212543487549e-05, -7.345527410507202e-05, -6.958842277526855e-05, -6.572157144546509e-05, -6.185472011566162e-05, -5.7987868785858154e-05, -5.412101745605469e-05, -5.025416612625122e-05, -4.6387314796447754e-05, -4.252046346664429e-05, -3.865361213684082e-05, -3.4786760807037354e-05, -3.091990947723389e-05, -2.705305814743042e-05, -2.3186206817626953e-05, -1.9319355487823486e-05, -1.545250415802002e-05, -1.1585652828216553e-05, -7.718801498413086e-06, -3.851950168609619e-06, 1.4901161193847656e-08, 3.8817524909973145e-06, 7.748603820800781e-06, 1.1615455150604248e-05, 1.5482306480407715e-05, 1.934915781021118e-05, 2.321600914001465e-05, 2.7082860469818115e-05, 3.094971179962158e-05, 3.481656312942505e-05, 3.8683414459228516e-05, 4.255026578903198e-05, 4.641711711883545e-05, 5.0283968448638916e-05, 5.415081977844238e-05, 5.801767110824585e-05, 6.188452243804932e-05, 6.575137376785278e-05, 6.961822509765625e-05, 7.348507642745972e-05, 7.735192775726318e-05, 8.121877908706665e-05, 8.508563041687012e-05, 8.895248174667358e-05, 9.281933307647705e-05, 9.668618440628052e-05, 0.00010055303573608398, 0.00010441988706588745, 0.00010828673839569092, 0.00011215358972549438, 0.00011602044105529785, 0.00011988729238510132, 0.00012375414371490479, 0.00012762099504470825, 0.00013148784637451172]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 8.0, 10.0, 12.0, 25.0, 24.0, 41.0, 50.0, 0.0, 62.0, 80.0, 68.0, 77.0, 90.0, 78.0, 79.0, 68.0, 55.0, 0.0, 47.0, 24.0, 29.0, 20.0, 18.0, 10.0, 6.0, 11.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3764947652816772e-06, -1.3224780559539795e-06, -1.2684613466262817e-06, -1.214444637298584e-06, -1.1604279279708862e-06, -1.1064112186431885e-06, -1.0523945093154907e-06, -9.98377799987793e-07, -9.443610906600952e-07, -8.903443813323975e-07, -8.363276720046997e-07, -7.82310962677002e-07, -7.282942533493042e-07, -6.742775440216064e-07, -6.202608346939087e-07, -5.662441253662109e-07, -5.122274160385132e-07, -4.5821070671081543e-07, -4.041939973831177e-07, -3.501772880554199e-07, -2.9616057872772217e-07, -2.421438694000244e-07, -1.8812716007232666e-07, -1.341104507446289e-07, -8.009374141693115e-08, -2.60770320892334e-08, 2.7939677238464355e-08, 8.195638656616211e-08, 1.3597309589385986e-07, 1.8998980522155762e-07, 2.4400651454925537e-07, 2.980232238769531e-07, 3.520399332046509e-07, 4.0605664253234863e-07, 4.600733518600464e-07, 5.140900611877441e-07, 5.681067705154419e-07, 6.221234798431396e-07, 6.761401891708374e-07, 7.301568984985352e-07, 7.841736078262329e-07, 8.381903171539307e-07, 8.922070264816284e-07, 9.462237358093262e-07, 1.000240445137024e-06, 1.0542571544647217e-06, 1.1082738637924194e-06, 1.1622905731201172e-06, 1.216307282447815e-06, 1.2703239917755127e-06, 1.3243407011032104e-06, 1.3783574104309082e-06, 1.432374119758606e-06, 1.4863908290863037e-06, 1.5404075384140015e-06, 1.5944242477416992e-06, 1.648440957069397e-06, 1.7024576663970947e-06, 1.7564743757247925e-06, 1.8104910850524902e-06, 1.864507794380188e-06, 1.9185245037078857e-06, 1.9725412130355835e-06, 2.0265579223632812e-06]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 10.0, 1.0, 5.0, 21.0, 4.0, 72.0, 28.0, 961.0, 4191419.0, 1597.0, 43.0, 81.0, 3.0, 5.0, 14.0, 1.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.777576446533203e-05, -2.6768073439598083e-05, -2.5760382413864136e-05, -2.4752691388130188e-05, -2.374500036239624e-05, -2.2737309336662292e-05, -2.1729618310928345e-05, -2.0721927285194397e-05, -1.971423625946045e-05, -1.87065452337265e-05, -1.7698854207992554e-05, -1.6691163182258606e-05, -1.5683472156524658e-05, -1.467578113079071e-05, -1.3668090105056763e-05, -1.2660399079322815e-05, -1.1652708053588867e-05, -1.064501702785492e-05, -9.637326002120972e-06, -8.629634976387024e-06, -7.621943950653076e-06, -6.614252924919128e-06, -5.606561899185181e-06, -4.598870873451233e-06, -3.591179847717285e-06, -2.5834888219833374e-06, -1.5757977962493896e-06, -5.681067705154419e-07, 4.3958425521850586e-07, 1.4472752809524536e-06, 2.4549663066864014e-06, 3.462657332420349e-06, 4.470348358154297e-06, 5.478039383888245e-06, 6.485730409622192e-06, 7.49342143535614e-06, 8.501112461090088e-06, 9.508803486824036e-06, 1.0516494512557983e-05, 1.1524185538291931e-05, 1.2531876564025879e-05, 1.3539567589759827e-05, 1.4547258615493774e-05, 1.5554949641227722e-05, 1.656264066696167e-05, 1.7570331692695618e-05, 1.8578022718429565e-05, 1.9585713744163513e-05, 2.059340476989746e-05, 2.160109579563141e-05, 2.2608786821365356e-05, 2.3616477847099304e-05, 2.4624168872833252e-05, 2.56318598985672e-05, 2.6639550924301147e-05, 2.7647241950035095e-05, 2.8654932975769043e-05, 2.966262400150299e-05, 3.067031502723694e-05, 3.1678006052970886e-05, 3.2685697078704834e-05, 3.369338810443878e-05, 3.470107913017273e-05, 3.570877015590668e-05, 3.6716461181640625e-05]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 5.0, 0.0, 6.0, 0.0, 0.0, 4.0, 0.0, 22.0, 0.0, 0.0, 42.0, 0.0, 274.0, 0.0, 0.0, 3342.0, 0.0, 282.0, 0.0, 0.0, 43.0, 0.0, 16.0, 0.0, 15.0, 0.0, 0.0, 8.0, 0.0, 2.0, 0.0, 0.0, 7.0, 0.0, 6.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.314367055892944e-07, -6.07222318649292e-07, -5.830079317092896e-07, -5.587935447692871e-07, -5.345791578292847e-07, -5.103647708892822e-07, -4.861503839492798e-07, -4.6193599700927734e-07, -4.377216100692749e-07, -4.1350722312927246e-07, -3.8929283618927e-07, -3.650784492492676e-07, -3.4086406230926514e-07, -3.166496753692627e-07, -2.9243528842926025e-07, -2.682209014892578e-07, -2.4400651454925537e-07, -2.1979212760925293e-07, -1.955777406692505e-07, -1.7136335372924805e-07, -1.471489667892456e-07, -1.2293457984924316e-07, -9.872019290924072e-08, -7.450580596923828e-08, -5.029141902923584e-08, -2.60770320892334e-08, -1.862645149230957e-09, 2.2351741790771484e-08, 4.6566128730773926e-08, 7.078051567077637e-08, 9.499490261077881e-08, 1.1920928955078125e-07, 1.434236764907837e-07, 1.6763806343078613e-07, 1.9185245037078857e-07, 2.1606683731079102e-07, 2.4028122425079346e-07, 2.644956111907959e-07, 2.8870999813079834e-07, 3.129243850708008e-07, 3.371387720108032e-07, 3.6135315895080566e-07, 3.855675458908081e-07, 4.0978193283081055e-07, 4.33996319770813e-07, 4.5821070671081543e-07, 4.824250936508179e-07, 5.066394805908203e-07, 5.308538675308228e-07, 5.550682544708252e-07, 5.792826414108276e-07, 6.034970283508301e-07, 6.277114152908325e-07, 6.51925802230835e-07, 6.761401891708374e-07, 7.003545761108398e-07, 7.245689630508423e-07, 7.487833499908447e-07, 7.729977369308472e-07, 7.972121238708496e-07, 8.21426510810852e-07, 8.456408977508545e-07, 8.698552846908569e-07, 8.940696716308594e-07]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 23.0, 20.0, 53.0, 73.0, 115.0, 232.0, 173.0, 128.0, 74.0, 27.0, 25.0, 18.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55933855441981e-06, -2.446863845761982e-06, -2.334389364477829e-06, -2.221914655820001e-06, -2.109440174535848e-06, -1.99696546587802e-06, -1.8844907572201919e-06, -1.7720161622492014e-06, -1.659541567278211e-06, -1.5470669723072206e-06, -1.4345923773362301e-06, -1.322117668678402e-06, -1.2096430737074115e-06, -1.097168478736421e-06, -9.84693770078593e-07, -8.722191751076025e-07, -7.597445801366121e-07, -6.472699851656216e-07, -5.347953333512123e-07, -4.2232070995851245e-07, -3.098460865658126e-07, -1.9737149159482215e-07, -8.489683978041285e-08, 2.757781203399645e-08, 1.400524070049869e-07, 2.5252703039768676e-07, 3.6500165379038663e-07, 4.774763056047959e-07, 5.899509005757864e-07, 7.024254955467768e-07, 8.149001473611861e-07, 9.273747991755954e-07, 1.0398493941465858e-06, 1.1523239891175763e-06, 1.2647985840885667e-06, 1.3772732927463949e-06, 1.4897478877173853e-06, 1.6022224826883757e-06, 1.714697191346204e-06, 1.8271717863171943e-06, 1.9396463812881848e-06, 2.052121089946013e-06, 2.1645955712301657e-06, 2.277070279887994e-06, 2.389544988545822e-06, 2.5020194698299747e-06, 2.614494178487803e-06, 2.726968887145631e-06, 2.8394433684297837e-06, 2.951918077087612e-06, 3.0643925583717646e-06, 3.1768672670295928e-06, 3.2893417483137455e-06, 3.4018164569715736e-06, 3.514291165629402e-06, 3.6267656469135545e-06, 3.7392403555713827e-06, 3.851715064229211e-06, 3.9641895455133636e-06, 4.076664026797516e-06, 4.18913896282902e-06, 4.301613444113173e-06, 4.414087925397325e-06, 4.526562861428829e-06, 4.639037342712982e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 13.0, 13.0, 18.0, 15.0, 20.0, 21.0, 31.0, 24.0, 27.0, 33.0, 48.0, 54.0, 35.0, 49.0, 47.0, 44.0, 31.0, 43.0, 45.0, 47.0, 26.0, 30.0, 36.0, 23.0, 22.0, 22.0, 26.0, 18.0, 20.0, 21.0, 17.0, 12.0, 6.0, 9.0, 4.0, 8.0, 7.0, 7.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2638087127925246e-06, -1.227200868925138e-06, -1.190593138744589e-06, -1.1539852948772023e-06, -1.1173775646966533e-06, -1.0807697208292666e-06, -1.0441619906487176e-06, -1.007554146781331e-06, -9.709463029139442e-07, -9.343385158899764e-07, -8.977307288660086e-07, -8.611229418420407e-07, -8.245151548180729e-07, -7.879073109506862e-07, -7.512995239267184e-07, -7.146917369027506e-07, -6.780840067222016e-07, -6.414762196982338e-07, -6.048684326742659e-07, -5.682606456502981e-07, -5.316528586263303e-07, -4.950450147589436e-07, -4.5843722773497575e-07, -4.218294407110079e-07, -3.852216536870401e-07, -3.4861386666307226e-07, -3.1200607963910443e-07, -2.7539826419342717e-07, -2.3879047716945934e-07, -2.021826901454915e-07, -1.6557488891066896e-07, -1.2896708767584641e-07, -9.23594143387163e-08, -5.575162020932112e-08, -1.914382607992593e-08, 1.746396804946926e-08, 5.4071762178864446e-08, 9.067954920283228e-08, 1.2728735043765482e-07, 1.6389515167247737e-07, 2.005029386964452e-07, 2.3711072572041303e-07, 2.7371851274438086e-07, 3.103263281900581e-07, 3.4693411521402595e-07, 3.835419022379938e-07, 4.2014971768367104e-07, 4.5675750470763887e-07, 4.933652917316067e-07, 5.299730787555745e-07, 5.665808657795424e-07, 6.031886528035102e-07, 6.39796439827478e-07, 6.764042836948647e-07, 7.130120707188325e-07, 7.496198577428004e-07, 7.862276447667682e-07, 8.22835431790736e-07, 8.594432188147039e-07, 8.960510058386717e-07, 9.326588497060584e-07, 9.692665798866074e-07, 1.005874423753994e-06, 1.042482153934543e-06, 1.0790899978019297e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 10.0, 0.0, 26.0, 0.0, 110.0, 0.0, 592.0, 0.0, 6503.0, 0.0, 1034101.0, 0.0, 6473.0, 0.0, 0.0, 586.0, 0.0, 117.0, 0.0, 31.0, 0.0, 10.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.055940270423889e-07, -7.767230272293091e-07, -7.478520274162292e-07, -7.189810276031494e-07, -6.901100277900696e-07, -6.612390279769897e-07, -6.323680281639099e-07, -6.034970283508301e-07, -5.746260285377502e-07, -5.457550287246704e-07, -5.168840289115906e-07, -4.880130290985107e-07, -4.591420292854309e-07, -4.302710294723511e-07, -4.0140002965927124e-07, -3.725290298461914e-07, -3.4365803003311157e-07, -3.1478703022003174e-07, -2.859160304069519e-07, -2.5704503059387207e-07, -2.2817403078079224e-07, -1.993030309677124e-07, -1.7043203115463257e-07, -1.4156103134155273e-07, -1.126900315284729e-07, -8.381903171539307e-08, -5.494803190231323e-08, -2.60770320892334e-08, 2.7939677238464355e-09, 3.166496753692627e-08, 6.05359673500061e-08, 8.940696716308594e-08, 1.1827796697616577e-07, 1.471489667892456e-07, 1.7601996660232544e-07, 2.0489096641540527e-07, 2.337619662284851e-07, 2.6263296604156494e-07, 2.915039658546448e-07, 3.203749656677246e-07, 3.4924596548080444e-07, 3.781169652938843e-07, 4.069879651069641e-07, 4.3585896492004395e-07, 4.647299647331238e-07, 4.936009645462036e-07, 5.224719643592834e-07, 5.513429641723633e-07, 5.802139639854431e-07, 6.09084963798523e-07, 6.379559636116028e-07, 6.668269634246826e-07, 6.956979632377625e-07, 7.245689630508423e-07, 7.534399628639221e-07, 7.82310962677002e-07, 8.111819624900818e-07, 8.400529623031616e-07, 8.689239621162415e-07, 8.977949619293213e-07, 9.266659617424011e-07, 9.55536961555481e-07, 9.844079613685608e-07, 1.0132789611816406e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 20.0, 28.0, 28.0, 46.0, 53.0, 0.0, 61.0, 99.0, 110.0, 112.0, 99.0, 91.0, 58.0, 46.0, 43.0, 33.0, 26.0, 15.0, 13.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5657936930656433e-06, -2.508983016014099e-06, -2.452172338962555e-06, -2.3953616619110107e-06, -2.3385509848594666e-06, -2.2817403078079224e-06, -2.224929630756378e-06, -2.168118953704834e-06, -2.11130827665329e-06, -2.0544975996017456e-06, -1.9976869225502014e-06, -1.9408762454986572e-06, -1.884065568447113e-06, -1.8272548913955688e-06, -1.7704442143440247e-06, -1.7136335372924805e-06, -1.6568228602409363e-06, -1.600012183189392e-06, -1.543201506137848e-06, -1.4863908290863037e-06, -1.4295801520347595e-06, -1.3727694749832153e-06, -1.3159587979316711e-06, -1.259148120880127e-06, -1.2023374438285828e-06, -1.1455267667770386e-06, -1.0887160897254944e-06, -1.0319054126739502e-06, -9.75094735622406e-07, -9.182840585708618e-07, -8.614733815193176e-07, -8.046627044677734e-07, -7.478520274162292e-07, -6.910413503646851e-07, -6.342306733131409e-07, -5.774199962615967e-07, -5.206093192100525e-07, -4.637986421585083e-07, -4.069879651069641e-07, -3.501772880554199e-07, -2.9336661100387573e-07, -2.3655593395233154e-07, -1.7974525690078735e-07, -1.2293457984924316e-07, -6.612390279769897e-08, -9.313225746154785e-09, 4.7497451305389404e-08, 1.043081283569336e-07, 1.6111880540847778e-07, 2.1792948246002197e-07, 2.7474015951156616e-07, 3.3155083656311035e-07, 3.8836151361465454e-07, 4.4517219066619873e-07, 5.019828677177429e-07, 5.587935447692871e-07, 6.156042218208313e-07, 6.724148988723755e-07, 7.292255759239197e-07, 7.860362529754639e-07, 8.428469300270081e-07, 8.996576070785522e-07, 9.564682841300964e-07, 1.0132789611816406e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048189.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 207.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 13.0, 2.0, 3.0, 4.0, 2.0, 11.0, 27.0, 31.0, 20.0, 12.0, 2.0, 3.0, 13.0, 164.0, 31.0, 16.0, 5.0, 29.0, 30.0, 181.0, 36.0, 16.0, 6.0, 16.0, 22.0, 70.0, 102.0, 7.0, 2.0, 10.0, 24.0, 29.0, 28.0, 7.0, 6.0, 2.0, 3.0, 7.0, 10.0, 10.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-06, -2.2510066628456116e-06, -2.1774321794509888e-06, -2.103857696056366e-06, -2.030283212661743e-06, -1.9567087292671204e-06, -1.8831342458724976e-06, -1.8095597624778748e-06, -1.735985279083252e-06, -1.6624107956886292e-06, -1.5888363122940063e-06, -1.5152618288993835e-06, -1.4416873455047607e-06, -1.368112862110138e-06, -1.2945383787155151e-06, -1.2209638953208923e-06, -1.1473894119262695e-06, -1.0738149285316467e-06, -1.000240445137024e-06, -9.266659617424011e-07, -8.530914783477783e-07, -7.795169949531555e-07, -7.059425115585327e-07, -6.323680281639099e-07, -5.587935447692871e-07, -4.852190613746643e-07, -4.116445779800415e-07, -3.380700945854187e-07, -2.644956111907959e-07, -1.909211277961731e-07, -1.1734664440155029e-07, -4.377216100692749e-08, 2.9802322387695312e-08, 1.0337680578231812e-07, 1.7695128917694092e-07, 2.505257725715637e-07, 3.241002559661865e-07, 3.976747393608093e-07, 4.7124922275543213e-07, 5.448237061500549e-07, 6.183981895446777e-07, 6.919726729393005e-07, 7.655471563339233e-07, 8.391216397285461e-07, 9.126961231231689e-07, 9.862706065177917e-07, 1.0598450899124146e-06, 1.1334195733070374e-06, 1.2069940567016602e-06, 1.280568540096283e-06, 1.3541430234909058e-06, 1.4277175068855286e-06, 1.5012919902801514e-06, 1.5748664736747742e-06, 1.648440957069397e-06, 1.7220154404640198e-06, 1.7955899238586426e-06, 1.8691644072532654e-06, 1.942738890647888e-06, 2.016313374042511e-06, 2.089887857437134e-06, 2.1634623408317566e-06, 2.2370368242263794e-06, 2.310611307621002e-06, 2.384185791015625e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 968.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 12.0, 30.0, 72.0, 198.0, 455.0, 179.0, 39.0, 16.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4630641089752316e-06, -1.2887580851383973e-06, -1.114452061301563e-06, -9.401460374647286e-07, -7.658400136278942e-07, -5.915339897910599e-07, -4.172279659542255e-07, -2.4292194211739115e-07, -6.86159182805568e-08, 1.0569010555627756e-07, 2.799961293931119e-07, 4.5430215322994627e-07, 6.286081770667806e-07, 8.02914200903615e-07, 9.772202247404493e-07, 1.1515262485772837e-06, 1.325832272414118e-06, 1.5001382962509524e-06, 1.6744443200877868e-06, 1.8487503439246211e-06, 2.0230563677614555e-06, 2.19736239159829e-06, 2.371668415435124e-06, 2.5459744392719585e-06, 2.720280463108793e-06, 2.8945864869456273e-06, 3.0688925107824616e-06, 3.243198534619296e-06, 3.4175045584561303e-06, 3.5918105822929647e-06, 3.766116606129799e-06, 3.940422629966633e-06, 4.114728653803468e-06, 4.289034677640302e-06, 4.4633407014771365e-06, 4.637646725313971e-06, 4.811952749150805e-06, 4.9862587729876395e-06, 5.160564796824474e-06, 5.334870820661308e-06, 5.509176844498143e-06, 5.683482868334977e-06, 5.857788892171811e-06, 6.032094916008646e-06, 6.20640093984548e-06, 6.380706963682314e-06, 6.555012987519149e-06, 6.729319011355983e-06, 6.9036250351928174e-06, 7.077931059029652e-06, 7.252237082866486e-06, 7.4265431067033205e-06, 7.600849130540155e-06, 7.77515560912434e-06, 7.949461178213824e-06, 8.123766747303307e-06, 8.298073225887492e-06, 8.472379704471678e-06, 8.646685273561161e-06, 8.820990842650644e-06, 8.99529732123483e-06, 9.169603799819015e-06, 9.343909368908498e-06, 9.518214937997982e-06, 9.692521416582167e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 6.0, 18.0, 22.0, 32.0, 41.0, 40.0, 51.0, 74.0, 95.0, 79.0, 84.0, 72.0, 69.0, 59.0, 50.0, 41.0, 45.0, 31.0, 31.0, 11.0, 17.0, 11.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.033006012425176e-06, -1.986451252378174e-06, -1.9398964923311723e-06, -1.8933416185973329e-06, -1.8467867448634934e-06, -1.8002319848164916e-06, -1.7536772247694898e-06, -1.7071223510356504e-06, -1.6605674773018109e-06, -1.614012717254809e-06, -1.5674578435209696e-06, -1.5209030834739679e-06, -1.4743482097401284e-06, -1.4277934496931266e-06, -1.3812386896461248e-06, -1.3346838159122854e-06, -1.2881290558652836e-06, -1.2415742958182818e-06, -1.1950194220844423e-06, -1.1484646620374406e-06, -1.101909788303601e-06, -1.0553550282565993e-06, -1.0088001545227598e-06, -9.62245394475758e-07, -9.156905775853375e-07, -8.691357606949168e-07, -8.225809438044962e-07, -7.760261269140756e-07, -7.294713668670738e-07, -6.829164931332343e-07, -6.363617330862326e-07, -5.898069161958119e-07, -5.432521561488102e-07, -4.966973392583895e-07, -4.501425223679689e-07, -4.0358773389925773e-07, -3.570329170088371e-07, -3.104781001184165e-07, -2.639233116497053e-07, -2.1736849475928466e-07, -1.7081367786886403e-07, -1.242588609784434e-07, -7.77040582988775e-08, -3.114925561931159e-08, 1.5405561271109036e-08, 6.196037816152966e-08, 1.0851516663024086e-07, 1.5506998352066148e-07, 2.016248004110821e-07, 2.4817961730150273e-07, 2.9473443419192336e-07, 3.4128922266063455e-07, 3.878440395510552e-07, 4.343988564414758e-07, 4.80953644910187e-07, 5.275084618006076e-07, 5.740632786910282e-07, 6.206180955814489e-07, 6.671729124718695e-07, 7.137276725188713e-07, 7.602825462527107e-07, 8.068373062997125e-07, 8.533921231901331e-07, 8.999469400805538e-07, 9.465017569709744e-07]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 3.0, 3.0, 7.0, 15.0, 7.0, 9.0, 16.0, 20.0, 33.0, 36.0, 41.0, 46.0, 123.0, 135.0, 286.0, 718.0, 2562.0, 122157.0, 795885.0, 108318.0, 13976.0, 2649.0, 972.0, 137.0, 88.0, 60.0, 76.0, 34.0, 33.0, 16.0, 18.0, 20.0, 12.0, 16.0, 5.0, 9.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.0135194063186646e-06, -1.9408762454986572e-06, -1.86823308467865e-06, -1.7955899238586426e-06, -1.7229467630386353e-06, -1.650303602218628e-06, -1.5776604413986206e-06, -1.5050172805786133e-06, -1.432374119758606e-06, -1.3597309589385986e-06, -1.2870877981185913e-06, -1.214444637298584e-06, -1.1418014764785767e-06, -1.0691583156585693e-06, -9.96515154838562e-07, -9.238719940185547e-07, -8.512288331985474e-07, -7.7858567237854e-07, -7.059425115585327e-07, -6.332993507385254e-07, -5.606561899185181e-07, -4.880130290985107e-07, -4.153698682785034e-07, -3.427267074584961e-07, -2.7008354663848877e-07, -1.9744038581848145e-07, -1.2479722499847412e-07, -5.21540641784668e-08, 2.0489096641540527e-08, 9.313225746154785e-08, 1.6577541828155518e-07, 2.384185791015625e-07, 3.110617399215698e-07, 3.8370490074157715e-07, 4.5634806156158447e-07, 5.289912223815918e-07, 6.016343832015991e-07, 6.742775440216064e-07, 7.469207048416138e-07, 8.195638656616211e-07, 8.922070264816284e-07, 9.648501873016357e-07, 1.037493348121643e-06, 1.1101365089416504e-06, 1.1827796697616577e-06, 1.255422830581665e-06, 1.3280659914016724e-06, 1.4007091522216797e-06, 1.473352313041687e-06, 1.5459954738616943e-06, 1.6186386346817017e-06, 1.691281795501709e-06, 1.7639249563217163e-06, 1.8365681171417236e-06, 1.909211277961731e-06, 1.9818544387817383e-06, 2.0544975996017456e-06, 2.127140760421753e-06, 2.1997839212417603e-06, 2.2724270820617676e-06, 2.345070242881775e-06, 2.4177134037017822e-06, 2.4903565645217896e-06, 2.562999725341797e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 3.0, 4.0, 6.0, 14.0, 5.0, 9.0, 19.0, 15.0, 16.0, 30.0, 28.0, 43.0, 28.0, 29.0, 59.0, 34.0, 75.0, 46.0, 54.0, 59.0, 44.0, 54.0, 51.0, 35.0, 40.0, 28.0, 16.0, 33.0, 28.0, 14.0, 20.0, 9.0, 16.0, 13.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.91155481338501e-06, -3.769993782043457e-06, -3.6284327507019043e-06, -3.4868717193603516e-06, -3.345310688018799e-06, -3.203749656677246e-06, -3.0621886253356934e-06, -2.9206275939941406e-06, -2.779066562652588e-06, -2.637505531311035e-06, -2.4959444999694824e-06, -2.3543834686279297e-06, -2.212822437286377e-06, -2.0712614059448242e-06, -1.9297003746032715e-06, -1.7881393432617188e-06, -1.646578311920166e-06, -1.5050172805786133e-06, -1.3634562492370605e-06, -1.2218952178955078e-06, -1.080334186553955e-06, -9.387731552124023e-07, -7.972121238708496e-07, -6.556510925292969e-07, -5.140900611877441e-07, -3.725290298461914e-07, -2.3096799850463867e-07, -8.940696716308594e-08, 5.21540641784668e-08, 1.9371509552001953e-07, 3.3527612686157227e-07, 4.76837158203125e-07, 6.183981895446777e-07, 7.599592208862305e-07, 9.015202522277832e-07, 1.043081283569336e-06, 1.1846423149108887e-06, 1.3262033462524414e-06, 1.4677643775939941e-06, 1.6093254089355469e-06, 1.7508864402770996e-06, 1.8924474716186523e-06, 2.034008502960205e-06, 2.175569534301758e-06, 2.3171305656433105e-06, 2.4586915969848633e-06, 2.600252628326416e-06, 2.7418136596679688e-06, 2.8833746910095215e-06, 3.0249357223510742e-06, 3.166496753692627e-06, 3.3080577850341797e-06, 3.4496188163757324e-06, 3.591179847717285e-06, 3.732740879058838e-06, 3.874301910400391e-06, 4.015862941741943e-06, 4.157423973083496e-06, 4.298985004425049e-06, 4.4405460357666016e-06, 4.582107067108154e-06, 4.723668098449707e-06, 4.86522912979126e-06, 5.0067901611328125e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 4.0, 5.0, 3.0, 6.0, 11.0, 8.0, 16.0, 14.0, 19.0, 37.0, 34.0, 41.0, 37.0, 75.0, 103.0, 245.0, 534.0, 2567.0, 1042907.0, 1032.0, 332.0, 140.0, 92.0, 47.0, 41.0, 43.0, 25.0, 36.0, 17.0, 15.0, 19.0, 4.0, 4.0, 3.0, 6.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.9252300262451172e-05, -1.873541623353958e-05, -1.821853220462799e-05, -1.77016481757164e-05, -1.718476414680481e-05, -1.666788011789322e-05, -1.615099608898163e-05, -1.5634112060070038e-05, -1.5117228031158447e-05, -1.4600344002246857e-05, -1.4083459973335266e-05, -1.3566575944423676e-05, -1.3049691915512085e-05, -1.2532807886600494e-05, -1.2015923857688904e-05, -1.1499039828777313e-05, -1.0982155799865723e-05, -1.0465271770954132e-05, -9.948387742042542e-06, -9.431503713130951e-06, -8.91461968421936e-06, -8.39773565530777e-06, -7.88085162639618e-06, -7.363967597484589e-06, -6.847083568572998e-06, -6.3301995396614075e-06, -5.813315510749817e-06, -5.296431481838226e-06, -4.779547452926636e-06, -4.262663424015045e-06, -3.7457793951034546e-06, -3.228895366191864e-06, -2.7120113372802734e-06, -2.195127308368683e-06, -1.6782432794570923e-06, -1.1613592505455017e-06, -6.444752216339111e-07, -1.2759119272232056e-07, 3.8929283618927e-07, 9.061768651008606e-07, 1.4230608940124512e-06, 1.9399449229240417e-06, 2.4568289518356323e-06, 2.973712980747223e-06, 3.4905970096588135e-06, 4.007481038570404e-06, 4.524365067481995e-06, 5.041249096393585e-06, 5.558133125305176e-06, 6.075017154216766e-06, 6.591901183128357e-06, 7.1087852120399475e-06, 7.625669240951538e-06, 8.142553269863129e-06, 8.65943729877472e-06, 9.17632132768631e-06, 9.6932053565979e-06, 1.0210089385509491e-05, 1.0726973414421082e-05, 1.1243857443332672e-05, 1.1760741472244263e-05, 1.2277625501155853e-05, 1.2794509530067444e-05, 1.3311393558979034e-05, 1.3828277587890625e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 4.0, 5.0, 9.0, 6.0, 6.0, 16.0, 19.0, 12.0, 20.0, 28.0, 37.0, 27.0, 25.0, 46.0, 35.0, 61.0, 64.0, 67.0, 49.0, 59.0, 54.0, 49.0, 43.0, 45.0, 32.0, 34.0, 25.0, 26.0, 23.0, 15.0, 12.0, 4.0, 6.0, 5.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.761882781982422e-06, -8.52532684803009e-06, -8.288770914077759e-06, -8.052214980125427e-06, -7.815659046173096e-06, -7.579103112220764e-06, -7.342547178268433e-06, -7.105991244316101e-06, -6.8694353103637695e-06, -6.632879376411438e-06, -6.3963234424591064e-06, -6.159767508506775e-06, -5.923211574554443e-06, -5.686655640602112e-06, -5.45009970664978e-06, -5.213543772697449e-06, -4.976987838745117e-06, -4.740431904792786e-06, -4.503875970840454e-06, -4.2673200368881226e-06, -4.030764102935791e-06, -3.7942081689834595e-06, -3.557652235031128e-06, -3.3210963010787964e-06, -3.084540367126465e-06, -2.8479844331741333e-06, -2.6114284992218018e-06, -2.3748725652694702e-06, -2.1383166313171387e-06, -1.9017606973648071e-06, -1.6652047634124756e-06, -1.428648829460144e-06, -1.1920928955078125e-06, -9.55536961555481e-07, -7.189810276031494e-07, -4.824250936508179e-07, -2.4586915969848633e-07, -9.313225746154785e-09, 2.2724270820617676e-07, 4.637986421585083e-07, 7.003545761108398e-07, 9.369105100631714e-07, 1.173466444015503e-06, 1.4100223779678345e-06, 1.646578311920166e-06, 1.8831342458724976e-06, 2.119690179824829e-06, 2.3562461137771606e-06, 2.592802047729492e-06, 2.8293579816818237e-06, 3.0659139156341553e-06, 3.302469849586487e-06, 3.5390257835388184e-06, 3.77558171749115e-06, 4.0121376514434814e-06, 4.248693585395813e-06, 4.4852495193481445e-06, 4.721805453300476e-06, 4.958361387252808e-06, 5.194917321205139e-06, 5.431473255157471e-06, 5.668029189109802e-06, 5.904585123062134e-06, 6.141141057014465e-06, 6.377696990966797e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1798.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1044967.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1747.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 111.0, 0.0, 0.0, 0.0, 0.0, 1989.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1044306.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2003.0, 0.0, 0.0, 0.0, 0.0, 0.0, 130.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.069879651069641e-07, -3.9674341678619385e-07, -3.864988684654236e-07, -3.762543201446533e-07, -3.6600977182388306e-07, -3.557652235031128e-07, -3.4552067518234253e-07, -3.3527612686157227e-07, -3.25031578540802e-07, -3.1478703022003174e-07, -3.045424818992615e-07, -2.942979335784912e-07, -2.8405338525772095e-07, -2.738088369369507e-07, -2.635642886161804e-07, -2.5331974029541016e-07, -2.430751919746399e-07, -2.3283064365386963e-07, -2.2258609533309937e-07, -2.123415470123291e-07, -2.0209699869155884e-07, -1.9185245037078857e-07, -1.816079020500183e-07, -1.7136335372924805e-07, -1.6111880540847778e-07, -1.5087425708770752e-07, -1.4062970876693726e-07, -1.30385160446167e-07, -1.2014061212539673e-07, -1.0989606380462646e-07, -9.96515154838562e-08, -8.940696716308594e-08, -7.916241884231567e-08, -6.891787052154541e-08, -5.8673322200775146e-08, -4.842877388000488e-08, -3.818422555923462e-08, -2.7939677238464355e-08, -1.7695128917694092e-08, -7.450580596923828e-09, 2.7939677238464355e-09, 1.30385160446167e-08, 2.3283064365386963e-08, 3.3527612686157227e-08, 4.377216100692749e-08, 5.4016709327697754e-08, 6.426125764846802e-08, 7.450580596923828e-08, 8.475035429000854e-08, 9.499490261077881e-08, 1.0523945093154907e-07, 1.1548399925231934e-07, 1.257285475730896e-07, 1.3597309589385986e-07, 1.4621764421463013e-07, 1.564621925354004e-07, 1.6670674085617065e-07, 1.7695128917694092e-07, 1.8719583749771118e-07, 1.9744038581848145e-07, 2.076849341392517e-07, 2.1792948246002197e-07, 2.2817403078079224e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1004.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07, 1.2293457984924316e-07, 1.2665987014770508e-07, 1.30385160446167e-07, 1.341104507446289e-07, 1.3783574104309082e-07, 1.4156103134155273e-07, 1.4528632164001465e-07, 1.4901161193847656e-07, 1.5273690223693848e-07, 1.564621925354004e-07, 1.601874828338623e-07, 1.6391277313232422e-07, 1.6763806343078613e-07, 1.7136335372924805e-07, 1.7508864402770996e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 28.0, 118.0, 617.0, 200.0, 28.0, 5.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3572526768257376e-05, -1.3168772966309916e-05, -1.2765020073857158e-05, -1.2361266271909699e-05, -1.195751246996224e-05, -1.1553759577509481e-05, -1.1150005775562022e-05, -1.0746252883109264e-05, -1.0342499081161804e-05, -9.938745279214345e-06, -9.534992386761587e-06, -9.131238584814128e-06, -8.72748569236137e-06, -8.32373189041391e-06, -7.91997808846645e-06, -7.516224741266342e-06, -7.112471394066233e-06, -6.7087180468661245e-06, -6.304964699666016e-06, -5.901210897718556e-06, -5.4974575505184475e-06, -5.093704203318339e-06, -4.689950401370879e-06, -4.2861970541707706e-06, -3.882443706970662e-06, -3.478690359770553e-06, -3.074936785196769e-06, -2.671183210622985e-06, -2.2674298634228762e-06, -1.8636765162227675e-06, -1.4599229416489834e-06, -1.0561693670751993e-06, -6.524169293697923e-07, -2.4866346848284593e-07, 1.5508999240410049e-07, 5.588434532910469e-07, 9.625969141779933e-07, 1.366350261378102e-06, 1.7701038359518861e-06, 2.1738574105256703e-06, 2.577610757725779e-06, 2.9813641049258877e-06, 3.385117679499672e-06, 3.788871254073456e-06, 4.192624601273565e-06, 4.596377948473673e-06, 5.000131750421133e-06, 5.403885097621242e-06, 5.80763844482135e-06, 6.211391792021459e-06, 6.615145139221568e-06, 7.018898941169027e-06, 7.422652288369136e-06, 7.826405635569245e-06, 8.230159437516704e-06, 8.633913239464164e-06, 9.037666131916922e-06, 9.441419933864381e-06, 9.845172826317139e-06, 1.0248926628264599e-05, 1.0652680430212058e-05, 1.1056433322664816e-05, 1.1460187124612276e-05, 1.1863940017065033e-05, 1.2267693819012493e-05]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 13.0, 11.0, 12.0, 21.0, 15.0, 16.0, 28.0, 11.0, 17.0, 27.0, 39.0, 42.0, 48.0, 35.0, 31.0, 47.0, 41.0, 42.0, 39.0, 43.0, 43.0, 27.0, 34.0, 32.0, 36.0, 28.0, 39.0, 19.0, 26.0, 16.0, 13.0, 15.0, 15.0, 13.0, 11.0, 10.0, 7.0, 7.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0561513590801042e-05, -1.0213060704700183e-05, -9.864607818599325e-06, -9.516154023003764e-06, -9.167701136902906e-06, -8.819248250802048e-06, -8.470795364701189e-06, -8.12234247860033e-06, -7.773889592499472e-06, -7.425436706398614e-06, -7.076983365550404e-06, -6.728530479449546e-06, -6.3800775933486875e-06, -6.031624252500478e-06, -5.68317136639962e-06, -5.334718480298761e-06, -4.986265139450552e-06, -4.6378122533496935e-06, -4.289358912501484e-06, -3.940906026400626e-06, -3.5924531402997673e-06, -3.2440000268252334e-06, -2.8955469133506995e-06, -2.547094027249841e-06, -2.198640913775307e-06, -1.850187913987611e-06, -1.5017349141999148e-06, -1.1532818007253809e-06, -8.048288009376847e-07, -4.5637580114998855e-07, -1.0792268767545465e-07, 2.405301984254038e-07, 5.889833118999377e-07, 9.374363116876339e-07, 1.28588931147533e-06, 1.634342424949864e-06, 1.9827953110507224e-06, 2.3312484245252563e-06, 2.67970153799979e-06, 3.0281544241006486e-06, 3.3766075375751825e-06, 3.7250606510497164e-06, 4.073513537150575e-06, 4.421966877998784e-06, 4.770419764099643e-06, 5.118872650200501e-06, 5.4673255363013595e-06, 5.815778422402218e-06, 6.164231763250427e-06, 6.512684649351286e-06, 6.861137990199495e-06, 7.2095908763003536e-06, 7.558043762401212e-06, 7.90649664850207e-06, 8.25495044409763e-06, 8.603403330198489e-06, 8.951856216299348e-06, 9.300309102400206e-06, 9.648761988501064e-06, 9.997214874601923e-06, 1.0345668670197483e-05, 1.0694121556298342e-05, 1.10425744423992e-05, 1.1391027328500059e-05, 1.1739480214600917e-05]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 33.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 7.0, 1.0, 10.0, 27.0, 9.0, 25.0, 58.0, 64.0, 179.0, 387.0, 560.0, 2051.0, 114829.0, 4072595.0, 1929.0, 612.0, 381.0, 208.0, 65.0, 59.0, 19.0, 5.0, 19.0, 8.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0], "bins": [-6.139278411865234e-06, -5.947425961494446e-06, -5.755573511123657e-06, -5.563721060752869e-06, -5.37186861038208e-06, -5.1800161600112915e-06, -4.988163709640503e-06, -4.796311259269714e-06, -4.604458808898926e-06, -4.412606358528137e-06, -4.220753908157349e-06, -4.02890145778656e-06, -3.8370490074157715e-06, -3.645196557044983e-06, -3.4533441066741943e-06, -3.2614916563034058e-06, -3.069639205932617e-06, -2.8777867555618286e-06, -2.68593430519104e-06, -2.4940818548202515e-06, -2.302229404449463e-06, -2.1103769540786743e-06, -1.9185245037078857e-06, -1.7266720533370972e-06, -1.5348196029663086e-06, -1.34296715259552e-06, -1.1511147022247314e-06, -9.592622518539429e-07, -7.674098014831543e-07, -5.755573511123657e-07, -3.8370490074157715e-07, -1.9185245037078857e-07, 0.0, 1.9185245037078857e-07, 3.8370490074157715e-07, 5.755573511123657e-07, 7.674098014831543e-07, 9.592622518539429e-07, 1.1511147022247314e-06, 1.34296715259552e-06, 1.5348196029663086e-06, 1.7266720533370972e-06, 1.9185245037078857e-06, 2.1103769540786743e-06, 2.302229404449463e-06, 2.4940818548202515e-06, 2.68593430519104e-06, 2.8777867555618286e-06, 3.069639205932617e-06, 3.2614916563034058e-06, 3.4533441066741943e-06, 3.645196557044983e-06, 3.8370490074157715e-06, 4.02890145778656e-06, 4.220753908157349e-06, 4.412606358528137e-06, 4.604458808898926e-06, 4.796311259269714e-06, 4.988163709640503e-06, 5.1800161600112915e-06, 5.37186861038208e-06, 5.563721060752869e-06, 5.755573511123657e-06, 5.947425961494446e-06, 6.139278411865234e-06]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 0.0, 5.0, 0.0, 0.0, 12.0, 0.0, 0.0, 1.0, 0.0, 0.0, 29.0, 0.0, 48.0, 0.0, 0.0, 116.0, 0.0, 0.0, 149.0, 0.0, 0.0, 280.0, 0.0, 132.0, 0.0, 0.0, 106.0, 0.0, 0.0, 76.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.534399628639221e-07, -7.320195436477661e-07, -7.105991244316101e-07, -6.891787052154541e-07, -6.677582859992981e-07, -6.463378667831421e-07, -6.249174475669861e-07, -6.034970283508301e-07, -5.820766091346741e-07, -5.606561899185181e-07, -5.392357707023621e-07, -5.178153514862061e-07, -4.9639493227005e-07, -4.7497451305389404e-07, -4.5355409383773804e-07, -4.3213367462158203e-07, -4.10713255405426e-07, -3.8929283618927e-07, -3.67872416973114e-07, -3.46451997756958e-07, -3.25031578540802e-07, -3.03611159324646e-07, -2.8219074010849e-07, -2.60770320892334e-07, -2.39349901676178e-07, -2.1792948246002197e-07, -1.9650906324386597e-07, -1.7508864402770996e-07, -1.5366822481155396e-07, -1.3224780559539795e-07, -1.1082738637924194e-07, -8.940696716308594e-08, -6.798654794692993e-08, -4.6566128730773926e-08, -2.514570951461792e-08, -3.725290298461914e-09, 1.7695128917694092e-08, 3.91155481338501e-08, 6.05359673500061e-08, 8.195638656616211e-08, 1.0337680578231812e-07, 1.2479722499847412e-07, 1.4621764421463013e-07, 1.6763806343078613e-07, 1.8905848264694214e-07, 2.1047890186309814e-07, 2.3189932107925415e-07, 2.5331974029541016e-07, 2.7474015951156616e-07, 2.9616057872772217e-07, 3.175809979438782e-07, 3.390014171600342e-07, 3.604218363761902e-07, 3.818422555923462e-07, 4.032626748085022e-07, 4.246830940246582e-07, 4.461035132408142e-07, 4.675239324569702e-07, 4.889443516731262e-07, 5.103647708892822e-07, 5.317851901054382e-07, 5.532056093215942e-07, 5.746260285377502e-07, 5.960464477539062e-07]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 8.0, 3.0, 10.0, 17.0, 23.0, 46.0, 55.0, 113.0, 79.0, 383.0, 733.0, 1956.0, 6461.0, 86319.0, 4077794.0, 14712.0, 3349.0, 1190.0, 271.0, 361.0, 193.0, 92.0, 45.0, 28.0, 18.0, 10.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0994415283203125e-06, -2.985820174217224e-06, -2.8721988201141357e-06, -2.7585774660110474e-06, -2.644956111907959e-06, -2.5313347578048706e-06, -2.4177134037017822e-06, -2.304092049598694e-06, -2.1904706954956055e-06, -2.076849341392517e-06, -1.9632279872894287e-06, -1.8496066331863403e-06, -1.735985279083252e-06, -1.6223639249801636e-06, -1.5087425708770752e-06, -1.3951212167739868e-06, -1.2814998626708984e-06, -1.16787850856781e-06, -1.0542571544647217e-06, -9.406358003616333e-07, -8.270144462585449e-07, -7.133930921554565e-07, -5.997717380523682e-07, -4.861503839492798e-07, -3.725290298461914e-07, -2.5890767574310303e-07, -1.4528632164001465e-07, -3.166496753692627e-08, 8.195638656616211e-08, 1.955777406692505e-07, 3.0919909477233887e-07, 4.2282044887542725e-07, 5.364418029785156e-07, 6.50063157081604e-07, 7.636845111846924e-07, 8.773058652877808e-07, 9.909272193908691e-07, 1.1045485734939575e-06, 1.218169927597046e-06, 1.3317912817001343e-06, 1.4454126358032227e-06, 1.559033989906311e-06, 1.6726553440093994e-06, 1.7862766981124878e-06, 1.8998980522155762e-06, 2.0135194063186646e-06, 2.127140760421753e-06, 2.2407621145248413e-06, 2.3543834686279297e-06, 2.468004822731018e-06, 2.5816261768341064e-06, 2.695247530937195e-06, 2.808868885040283e-06, 2.9224902391433716e-06, 3.03611159324646e-06, 3.1497329473495483e-06, 3.2633543014526367e-06, 3.376975655555725e-06, 3.4905970096588135e-06, 3.604218363761902e-06, 3.7178397178649902e-06, 3.831461071968079e-06, 3.945082426071167e-06, 4.058703780174255e-06, 4.172325134277344e-06]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 7.0, 0.0, 9.0, 0.0, 0.0, 25.0, 0.0, 206.0, 0.0, 3594.0, 0.0, 178.0, 0.0, 0.0, 30.0, 0.0, 12.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 8.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.275972843170166e-07, -9.015202522277832e-07, -8.754432201385498e-07, -8.493661880493164e-07, -8.23289155960083e-07, -7.972121238708496e-07, -7.711350917816162e-07, -7.450580596923828e-07, -7.189810276031494e-07, -6.92903995513916e-07, -6.668269634246826e-07, -6.407499313354492e-07, -6.146728992462158e-07, -5.885958671569824e-07, -5.62518835067749e-07, -5.364418029785156e-07, -5.103647708892822e-07, -4.842877388000488e-07, -4.5821070671081543e-07, -4.3213367462158203e-07, -4.0605664253234863e-07, -3.7997961044311523e-07, -3.5390257835388184e-07, -3.2782554626464844e-07, -3.0174851417541504e-07, -2.7567148208618164e-07, -2.4959444999694824e-07, -2.2351741790771484e-07, -1.9744038581848145e-07, -1.7136335372924805e-07, -1.4528632164001465e-07, -1.1920928955078125e-07, -9.313225746154785e-08, -6.705522537231445e-08, -4.0978193283081055e-08, -1.4901161193847656e-08, 1.1175870895385742e-08, 3.725290298461914e-08, 6.332993507385254e-08, 8.940696716308594e-08, 1.1548399925231934e-07, 1.4156103134155273e-07, 1.6763806343078613e-07, 1.9371509552001953e-07, 2.1979212760925293e-07, 2.4586915969848633e-07, 2.7194619178771973e-07, 2.980232238769531e-07, 3.241002559661865e-07, 3.501772880554199e-07, 3.762543201446533e-07, 4.023313522338867e-07, 4.284083843231201e-07, 4.544854164123535e-07, 4.805624485015869e-07, 5.066394805908203e-07, 5.327165126800537e-07, 5.587935447692871e-07, 5.848705768585205e-07, 6.109476089477539e-07, 6.370246410369873e-07, 6.631016731262207e-07, 6.891787052154541e-07, 7.152557373046875e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 4.0, 2.0, 8.0, 4.0, 7.0, 14.0, 14.0, 18.0, 22.0, 28.0, 46.0, 65.0, 89.0, 191.0, 178.0, 89.0, 56.0, 34.0, 29.0, 23.0, 15.0, 18.0, 15.0, 9.0, 2.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0840711865967023e-06, -1.0436781394673744e-06, -1.0032849786512088e-06, -9.62891931521881e-07, -9.22498884392553e-07, -8.821057804198063e-07, -8.417126764470595e-07, -8.013196293177316e-07, -7.609265253449848e-07, -7.205334213722381e-07, -6.801403742429102e-07, -6.397472702701634e-07, -5.993541662974167e-07, -5.589611191680888e-07, -5.18568015195342e-07, -4.781749112225953e-07, -4.3778186409326736e-07, -3.9738878854223003e-07, -3.569957129911927e-07, -3.1660260901844595e-07, -2.762095334674086e-07, -2.358164579163713e-07, -1.9542335394362453e-07, -1.550302783925872e-07, -1.1463720284154988e-07, -7.42441201850852e-08, -3.385103752862051e-08, 6.542052233271534e-09, 4.693512778430886e-08, 8.732820333534619e-08, 1.2772130730809295e-07, 1.6811438285913027e-07, 2.0850757209700532e-07, 2.4890064764804265e-07, 2.8929372319908e-07, 3.2968682717182674e-07, 3.7007990272286406e-07, 4.104729782739014e-07, 4.5086608224664815e-07, 4.91259129375976e-07, 5.316522333487228e-07, 5.720453373214696e-07, 6.124383844507975e-07, 6.528314884235442e-07, 6.93224592396291e-07, 7.336176395256189e-07, 7.740107434983656e-07, 8.144038474711124e-07, 8.547968946004403e-07, 8.95189998573187e-07, 9.355830457025149e-07, 9.759761496752617e-07, 1.0163691968045896e-06, 1.0567623576207552e-06, 1.0971554047500831e-06, 1.137548451879411e-06, 1.1779416126955766e-06, 1.2183346598249045e-06, 1.2587278206410701e-06, 1.299120867770398e-06, 1.339513914899726e-06, 1.3799069620290538e-06, 1.4203001228452194e-06, 1.4606931699745473e-06, 1.5010862171038752e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 6.0, 12.0, 12.0, 17.0, 15.0, 18.0, 19.0, 22.0, 24.0, 34.0, 31.0, 38.0, 50.0, 42.0, 48.0, 52.0, 33.0, 50.0, 45.0, 34.0, 34.0, 45.0, 31.0, 37.0, 33.0, 22.0, 27.0, 22.0, 18.0, 18.0, 19.0, 18.0, 12.0, 16.0, 5.0, 12.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.104455335138482e-07, -6.891527846164536e-07, -6.678600925624778e-07, -6.46567400508502e-07, -6.252746516111074e-07, -6.039819027137128e-07, -5.82689210659737e-07, -5.613965186057612e-07, -5.401037697083666e-07, -5.18811020810972e-07, -4.975183287569962e-07, -4.76225608281311e-07, -4.549328878056258e-07, -4.336401673299406e-07, -4.123474468542554e-07, -3.910547263785702e-07, -3.69762005902885e-07, -3.484692854271998e-07, -3.271765649515146e-07, -3.058838444758294e-07, -2.845911240001442e-07, -2.63298403524459e-07, -2.420056830487738e-07, -2.207129625730886e-07, -1.994202420974034e-07, -1.781275216217182e-07, -1.56834801146033e-07, -1.3554208067034779e-07, -1.1424936019466259e-07, -9.295663971897739e-08, -7.166391924329218e-08, -5.0371198767606984e-08, -2.9078535135340644e-08, -7.785814659655443e-09, 1.3506905816029757e-08, 3.479962629171496e-08, 5.609234676740016e-08, 7.738506724308536e-08, 9.867778771877056e-08, 1.1997050819445576e-07, 1.4126322867014096e-07, 1.6255594914582616e-07, 1.8384866962151136e-07, 2.0514139009719656e-07, 2.2643411057288176e-07, 2.4772683104856696e-07, 2.6901955152425217e-07, 2.9031227199993737e-07, 3.1160499247562257e-07, 3.3289771295130777e-07, 3.5419043342699297e-07, 3.7548315390267817e-07, 3.9677587437836337e-07, 4.1806859485404857e-07, 4.3936131532973377e-07, 4.6065403580541897e-07, 4.819467562811042e-07, 5.032394483350799e-07, 5.245321972324746e-07, 5.458249461298692e-07, 5.67117638183845e-07, 5.884103302378207e-07, 6.097030791352154e-07, 6.3099582803261e-07, 6.522885200865858e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1244.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1045982.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1268.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-2.980232238769531e-07, -2.905726432800293e-07, -2.8312206268310547e-07, -2.7567148208618164e-07, -2.682209014892578e-07, -2.60770320892334e-07, -2.5331974029541016e-07, -2.4586915969848633e-07, -2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 26.0, 0.0, 0.0, 51.0, 0.0, 98.0, 0.0, 0.0, 189.0, 0.0, 0.0, 280.0, 0.0, 0.0, 163.0, 0.0, 0.0, 105.0, 0.0, 0.0, 62.0, 0.0, 0.0, 23.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-8.344650268554688e-07, -8.139759302139282e-07, -7.934868335723877e-07, -7.729977369308472e-07, -7.525086402893066e-07, -7.320195436477661e-07, -7.115304470062256e-07, -6.910413503646851e-07, -6.705522537231445e-07, -6.50063157081604e-07, -6.295740604400635e-07, -6.09084963798523e-07, -5.885958671569824e-07, -5.681067705154419e-07, -5.476176738739014e-07, -5.271285772323608e-07, -5.066394805908203e-07, -4.861503839492798e-07, -4.6566128730773926e-07, -4.4517219066619873e-07, -4.246830940246582e-07, -4.041939973831177e-07, -3.8370490074157715e-07, -3.632158041000366e-07, -3.427267074584961e-07, -3.2223761081695557e-07, -3.0174851417541504e-07, -2.812594175338745e-07, -2.60770320892334e-07, -2.4028122425079346e-07, -2.1979212760925293e-07, -1.993030309677124e-07, -1.7881393432617188e-07, -1.5832483768463135e-07, -1.3783574104309082e-07, -1.1734664440155029e-07, -9.685754776000977e-08, -7.636845111846924e-08, -5.587935447692871e-08, -3.5390257835388184e-08, -1.4901161193847656e-08, 5.587935447692871e-09, 2.60770320892334e-08, 4.6566128730773926e-08, 6.705522537231445e-08, 8.754432201385498e-08, 1.0803341865539551e-07, 1.2852251529693604e-07, 1.4901161193847656e-07, 1.695007085800171e-07, 1.8998980522155762e-07, 2.1047890186309814e-07, 2.3096799850463867e-07, 2.514570951461792e-07, 2.7194619178771973e-07, 2.9243528842926025e-07, 3.129243850708008e-07, 3.334134817123413e-07, 3.5390257835388184e-07, 3.7439167499542236e-07, 3.948807716369629e-07, 4.153698682785034e-07, 4.3585896492004395e-07, 4.5634806156158447e-07, 4.76837158203125e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048564.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0, 0.0, 83.0, 0.0, 19.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 668.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 18.0, 0.0, 88.0, 0.0, 50.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 7.0, 2.0, 5.0, 8.0, 13.0, 14.0, 19.0, 25.0, 30.0, 50.0, 76.0, 132.0, 268.0, 141.0, 40.0, 53.0, 25.0, 25.0, 20.0, 10.0, 12.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204548981258995e-07, -5.927315100962005e-07, -5.650081220665015e-07, -5.372847340368025e-07, -5.095613460071036e-07, -4.818379011339857e-07, -4.5411451310428674e-07, -4.2639112507458776e-07, -3.986677370448888e-07, -3.709443490151898e-07, -3.432209609854908e-07, -3.154975445340824e-07, -2.8777415650438343e-07, -2.6005076847468445e-07, -2.3232736623413075e-07, -2.0460396399357705e-07, -1.7688057596387807e-07, -1.491571879341791e-07, -1.214337856936254e-07, -9.371039055849906e-08, -6.598699542337272e-08, -3.826360739367374e-08, -1.0540205153120041e-08, 1.7183197087433655e-08, 4.4906585117132636e-08, 7.262998025225897e-08, 1.0035337538738531e-07, 1.28076777627939e-07, 1.55800165657638e-07, 1.8352355368733697e-07, 2.1124695592789067e-07, 2.3897035816844436e-07, 2.6669374619814334e-07, 2.944171342278423e-07, 3.221405222575413e-07, 3.498639387089497e-07, 3.775873267386487e-07, 4.053107147683477e-07, 4.330341312197561e-07, 4.6075751924945507e-07, 4.884809072791541e-07, 5.16204295308853e-07, 5.43927683338552e-07, 5.71651071368251e-07, 5.993745162413688e-07, 6.27097847427649e-07, 6.548212923007668e-07, 6.825446803304658e-07, 7.102680683601648e-07, 7.379914563898637e-07, 7.657148444195627e-07, 7.934382324492617e-07, 8.211616204789607e-07, 8.488850653520785e-07, 8.766084533817775e-07, 9.043318414114765e-07, 9.320552294411755e-07, 9.597786174708745e-07, 9.875020623439923e-07, 1.0152253935302724e-06, 1.0429488384033903e-06, 1.0706721695896704e-06, 1.0983956144627882e-06, 1.126119059335906e-06, 1.1538423905221862e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 14.0, 11.0, 15.0, 15.0, 23.0, 29.0, 34.0, 51.0, 40.0, 67.0, 78.0, 63.0, 68.0, 74.0, 56.0, 55.0, 51.0, 48.0, 36.0, 36.0, 34.0, 22.0, 21.0, 24.0, 14.0, 8.0, 6.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.523396448050335e-07, -7.335418672482774e-07, -7.147440896915214e-07, -6.959463121347653e-07, -6.771485345780093e-07, -6.583507570212532e-07, -6.395529794644972e-07, -6.207552019077411e-07, -6.019574243509851e-07, -5.83159646794229e-07, -5.64361869237473e-07, -5.45564091680717e-07, -5.267663141239609e-07, -5.079685365672049e-07, -4.891707590104488e-07, -4.7037298145369277e-07, -4.515751754752273e-07, -4.3277739791847125e-07, -4.139796203617152e-07, -3.9518184280495916e-07, -3.763840652482031e-07, -3.5758628769144707e-07, -3.387884817129816e-07, -3.1999070415622555e-07, -3.011929265994695e-07, -2.8239514904271346e-07, -2.635973714859574e-07, -2.4479959392920136e-07, -2.2600181637244532e-07, -2.0720403881568927e-07, -1.884062470480785e-07, -1.6960846949132247e-07, -1.5081070614542114e-07, -1.320129285886651e-07, -1.1321515103190904e-07, -9.441736636972564e-08, -7.56195888129696e-08, -5.682181125621355e-08, -3.802402659403015e-08, -1.92262490372741e-08, -4.284714805180556e-10, 1.836930785259483e-08, 3.7167087185707715e-08, 5.596486829517744e-08, 7.476264585193348e-08, 9.356042340868953e-08, 1.1235820807087293e-07, 1.3115598562762898e-07, 1.4995376318438502e-07, 1.6875154074114107e-07, 1.8754931829789712e-07, 2.0634709585465316e-07, 2.251448734114092e-07, 2.4394265096816525e-07, 2.6274045694663073e-07, 2.815382345033868e-07, 3.003360120601428e-07, 3.1913378961689887e-07, 3.379315671736549e-07, 3.5672934473041096e-07, 3.75527122287167e-07, 3.9432489984392305e-07, 4.131226774006791e-07, 4.3192045495743514e-07, 4.507182325141912e-07]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 86.0, 0.0, 0.0, 0.0, 405.0, 0.0, 0.0, 0.0, 10756.0, 0.0, 0.0, 0.0, 1026002.0, 0.0, 0.0, 0.0, 10762.0, 0.0, 0.0, 0.0, 403.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.364418029785156e-07, -5.21540641784668e-07, -5.066394805908203e-07, -4.917383193969727e-07, -4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 0.0, 6.0, 8.0, 0.0, 22.0, 30.0, 0.0, 33.0, 37.0, 45.0, 0.0, 72.0, 94.0, 0.0, 102.0, 119.0, 95.0, 0.0, 73.0, 66.0, 0.0, 50.0, 32.0, 0.0, 31.0, 25.0, 22.0, 0.0, 21.0, 5.0, 0.0, 3.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.4901161193847656e-06, -1.448206603527069e-06, -1.4062970876693726e-06, -1.364387571811676e-06, -1.3224780559539795e-06, -1.280568540096283e-06, -1.2386590242385864e-06, -1.1967495083808899e-06, -1.1548399925231934e-06, -1.1129304766654968e-06, -1.0710209608078003e-06, -1.0291114449501038e-06, -9.872019290924072e-07, -9.452924132347107e-07, -9.033828973770142e-07, -8.614733815193176e-07, -8.195638656616211e-07, -7.776543498039246e-07, -7.35744833946228e-07, -6.938353180885315e-07, -6.51925802230835e-07, -6.100162863731384e-07, -5.681067705154419e-07, -5.261972546577454e-07, -4.842877388000488e-07, -4.423782229423523e-07, -4.0046870708465576e-07, -3.5855919122695923e-07, -3.166496753692627e-07, -2.7474015951156616e-07, -2.3283064365386963e-07, -1.909211277961731e-07, -1.4901161193847656e-07, -1.0710209608078003e-07, -6.51925802230835e-08, -2.3283064365386963e-08, 1.862645149230957e-08, 6.05359673500061e-08, 1.0244548320770264e-07, 1.4435499906539917e-07, 1.862645149230957e-07, 2.2817403078079224e-07, 2.7008354663848877e-07, 3.119930624961853e-07, 3.5390257835388184e-07, 3.9581209421157837e-07, 4.377216100692749e-07, 4.796311259269714e-07, 5.21540641784668e-07, 5.634501576423645e-07, 6.05359673500061e-07, 6.472691893577576e-07, 6.891787052154541e-07, 7.310882210731506e-07, 7.729977369308472e-07, 8.149072527885437e-07, 8.568167686462402e-07, 8.987262845039368e-07, 9.406358003616333e-07, 9.825453162193298e-07, 1.0244548320770264e-06, 1.066364347934723e-06, 1.1082738637924194e-06, 1.150183379650116e-06, 1.1920928955078125e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 0.0, 6.0, 8.0, 15.0, 19.0, 0.0, 31.0, 22.0, 56.0, 0.0, 60.0, 83.0, 149.0, 207.0, 0.0, 406.0, 945.0, 10667.0, 0.0, 1023279.0, 10618.0, 924.0, 370.0, 0.0, 227.0, 142.0, 86.0, 60.0, 0.0, 55.0, 15.0, 30.0, 0.0, 21.0, 16.0, 8.0, 6.0, 0.0, 6.0, 2.0, 4.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4435499906539917e-06, -1.3969838619232178e-06, -1.3504177331924438e-06, -1.30385160446167e-06, -1.257285475730896e-06, -1.210719347000122e-06, -1.1641532182693481e-06, -1.1175870895385742e-06, -1.0710209608078003e-06, -1.0244548320770264e-06, -9.778887033462524e-07, -9.313225746154785e-07, -8.847564458847046e-07, -8.381903171539307e-07, -7.916241884231567e-07, -7.450580596923828e-07, -6.984919309616089e-07, -6.51925802230835e-07, -6.05359673500061e-07, -5.587935447692871e-07, -5.122274160385132e-07, -4.6566128730773926e-07, -4.1909515857696533e-07, -3.725290298461914e-07, -3.259629011154175e-07, -2.7939677238464355e-07, -2.3283064365386963e-07, -1.862645149230957e-07, -1.3969838619232178e-07, -9.313225746154785e-08, -4.6566128730773926e-08, 0.0, 4.6566128730773926e-08, 9.313225746154785e-08, 1.3969838619232178e-07, 1.862645149230957e-07, 2.3283064365386963e-07, 2.7939677238464355e-07, 3.259629011154175e-07, 3.725290298461914e-07, 4.1909515857696533e-07, 4.6566128730773926e-07, 5.122274160385132e-07, 5.587935447692871e-07, 6.05359673500061e-07, 6.51925802230835e-07, 6.984919309616089e-07, 7.450580596923828e-07, 7.916241884231567e-07, 8.381903171539307e-07, 8.847564458847046e-07, 9.313225746154785e-07, 9.778887033462524e-07, 1.0244548320770264e-06, 1.0710209608078003e-06, 1.1175870895385742e-06, 1.1641532182693481e-06, 1.210719347000122e-06, 1.257285475730896e-06, 1.30385160446167e-06, 1.3504177331924438e-06, 1.3969838619232178e-06, 1.4435499906539917e-06, 1.4901161193847656e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 4.0, 8.0, 6.0, 16.0, 10.0, 21.0, 25.0, 35.0, 44.0, 0.0, 48.0, 43.0, 54.0, 70.0, 77.0, 84.0, 80.0, 66.0, 53.0, 56.0, 32.0, 35.0, 0.0, 25.0, 28.0, 21.0, 7.0, 12.0, 12.0, 4.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6735866665840149e-06, -1.6186386346817017e-06, -1.5636906027793884e-06, -1.5087425708770752e-06, -1.453794538974762e-06, -1.3988465070724487e-06, -1.3438984751701355e-06, -1.2889504432678223e-06, -1.234002411365509e-06, -1.1790543794631958e-06, -1.1241063475608826e-06, -1.0691583156585693e-06, -1.014210283756256e-06, -9.592622518539429e-07, -9.043142199516296e-07, -8.493661880493164e-07, -7.944181561470032e-07, -7.394701242446899e-07, -6.845220923423767e-07, -6.295740604400635e-07, -5.746260285377502e-07, -5.19677996635437e-07, -4.647299647331238e-07, -4.0978193283081055e-07, -3.548339009284973e-07, -2.998858690261841e-07, -2.4493783712387085e-07, -1.8998980522155762e-07, -1.3504177331924438e-07, -8.009374141693115e-08, -2.514570951461792e-08, 2.9802322387695312e-08, 8.475035429000854e-08, 1.3969838619232178e-07, 1.94646418094635e-07, 2.4959444999694824e-07, 3.045424818992615e-07, 3.594905138015747e-07, 4.1443854570388794e-07, 4.6938657760620117e-07, 5.243346095085144e-07, 5.792826414108276e-07, 6.342306733131409e-07, 6.891787052154541e-07, 7.441267371177673e-07, 7.990747690200806e-07, 8.540228009223938e-07, 9.08970832824707e-07, 9.639188647270203e-07, 1.0188668966293335e-06, 1.0738149285316467e-06, 1.12876296043396e-06, 1.1837109923362732e-06, 1.2386590242385864e-06, 1.2936070561408997e-06, 1.3485550880432129e-06, 1.4035031199455261e-06, 1.4584511518478394e-06, 1.5133991837501526e-06, 1.5683472156524658e-06, 1.623295247554779e-06, 1.6782432794570923e-06, 1.7331913113594055e-06, 1.7881393432617188e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [372.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1047808.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 396.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1020.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [396.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1047808.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 372.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1020.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 12.0, 10.0, 16.0, 38.0, 86.0, 231.0, 429.0, 94.0, 48.0, 27.0, 9.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.958729510282865e-06, -2.8189538170408923e-06, -2.67917812379892e-06, -2.5394024305569474e-06, -2.3996269646886503e-06, -2.259851271446678e-06, -2.1200755782047054e-06, -1.9803001123364083e-06, -1.8405243054075981e-06, -1.7007486121656257e-06, -1.560973032610491e-06, -1.4211973393685184e-06, -1.281421646126546e-06, -1.1416460665714112e-06, -1.0018703733294387e-06, -8.62094793774304e-07, -7.223191005323315e-07, -5.825434641337779e-07, -4.4276779931351484e-07, -3.029921344932518e-07, -1.6321649809469818e-07, -2.3440861696144566e-08, 1.1633483154582791e-07, 2.5611041110096266e-07, 3.9588610434293514e-07, 5.356617407414888e-07, 6.754373771400424e-07, 8.152130703820148e-07, 9.549887636239873e-07, 1.094764343179122e-06, 1.2345400364210946e-06, 1.3743156159762293e-06, 1.5140913092182018e-06, 1.6538670024601743e-06, 1.793642582015309e-06, 1.9334183889441192e-06, 2.0731938548124162e-06, 2.2129695480543887e-06, 2.352745241296361e-06, 2.4925207071646582e-06, 2.6322964004066307e-06, 2.772072093648603e-06, 2.9118477868905757e-06, 3.051623480132548e-06, 3.191398946000845e-06, 3.3311746392428176e-06, 3.47095033248479e-06, 3.610725798353087e-06, 3.750501718968735e-06, 3.890277184837032e-06, 4.030052878079005e-06, 4.169828571320977e-06, 4.3096042645629495e-06, 4.449379957804922e-06, 4.5891556510468945e-06, 4.728931344288867e-06, 4.8687070375308394e-06, 5.008482730772812e-06, 5.148258424014784e-06, 5.288034117256757e-06, 5.427809810498729e-06, 5.567585503740702e-06, 5.707361196982674e-06, 5.847136435477296e-06, 5.986912128719268e-06]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 7.0, 5.0, 10.0, 6.0, 14.0, 11.0, 11.0, 16.0, 23.0, 29.0, 25.0, 25.0, 29.0, 38.0, 35.0, 27.0, 49.0, 45.0, 43.0, 20.0, 44.0, 40.0, 46.0, 38.0, 39.0, 35.0, 30.0, 34.0, 31.0, 32.0, 23.0, 22.0, 13.0, 15.0, 11.0, 12.0, 11.0, 16.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.1512869352591224e-06, -2.088512019327027e-06, -2.0257373307686066e-06, -1.962962414836511e-06, -1.9001874989044154e-06, -1.8374126966591575e-06, -1.7746378944138996e-06, -1.711862978481804e-06, -1.6490881762365461e-06, -1.5863133739912882e-06, -1.5235384580591926e-06, -1.4607636558139347e-06, -1.3979888535686769e-06, -1.3352139376365812e-06, -1.2724391353913234e-06, -1.2096643331460655e-06, -1.1468894172139699e-06, -1.084114614968712e-06, -1.0213396990366164e-06, -9.585648967913585e-07, -8.957900377026817e-07, -8.33015178614005e-07, -7.702403763687471e-07, -7.074655172800703e-07, -6.446906581913936e-07, -5.819157991027168e-07, -5.191409400140401e-07, -4.563661377687822e-07, -3.9359127868010546e-07, -3.308164195914287e-07, -2.680415889244614e-07, -2.0526675825749408e-07, -1.424917854819796e-07, -7.971694060415757e-08, -1.6942095726335538e-08, 4.5832749151486496e-08, 1.0860759402930853e-07, 1.7138245311798528e-07, 2.341572837849526e-07, 2.969321144519199e-07, 3.5970697354059666e-07, 4.224818326292734e-07, 4.852566917179502e-07, 5.48031493963208e-07, 6.108063530518848e-07, 6.735812121405615e-07, 7.363560143858194e-07, 7.991308734744962e-07, 8.619057325631729e-07, 9.246805916518497e-07, 9.874554507405264e-07, 1.0502302529857843e-06, 1.1130050552310422e-06, 1.1757799711631378e-06, 1.2385547734083957e-06, 1.3013295756536536e-06, 1.3641044915857492e-06, 1.426879293831007e-06, 1.4896542097631027e-06, 1.5524290120083606e-06, 1.6152039279404562e-06, 1.677978730185714e-06, 1.740753532430972e-06, 1.8035284483630676e-06, 1.8663032506083255e-06]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 9.0, 0.0, 5.0, 11.0, 21.0, 5.0, 28.0, 54.0, 111.0, 42.0, 349.0, 298.0, 165.0, 484.0, 2243.0, 1735.0, 3945.0, 50192.0, 4125198.0, 3876.0, 1687.0, 2177.0, 478.0, 169.0, 307.0, 359.0, 50.0, 116.0, 61.0, 29.0, 6.0, 23.0, 13.0, 6.0, 0.0, 13.0, 4.0, 0.0, 2.0, 5.0, 4.0, 0.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3674219846725464e-06, -2.291053533554077e-06, -2.214685082435608e-06, -2.1383166313171387e-06, -2.0619481801986694e-06, -1.9855797290802e-06, -1.909211277961731e-06, -1.8328428268432617e-06, -1.7564743757247925e-06, -1.6801059246063232e-06, -1.603737473487854e-06, -1.5273690223693848e-06, -1.4510005712509155e-06, -1.3746321201324463e-06, -1.298263669013977e-06, -1.2218952178955078e-06, -1.1455267667770386e-06, -1.0691583156585693e-06, -9.927898645401e-07, -9.164214134216309e-07, -8.400529623031616e-07, -7.636845111846924e-07, -6.873160600662231e-07, -6.109476089477539e-07, -5.345791578292847e-07, -4.5821070671081543e-07, -3.818422555923462e-07, -3.0547380447387695e-07, -2.2910535335540771e-07, -1.5273690223693848e-07, -7.636845111846924e-08, 0.0, 7.636845111846924e-08, 1.5273690223693848e-07, 2.2910535335540771e-07, 3.0547380447387695e-07, 3.818422555923462e-07, 4.5821070671081543e-07, 5.345791578292847e-07, 6.109476089477539e-07, 6.873160600662231e-07, 7.636845111846924e-07, 8.400529623031616e-07, 9.164214134216309e-07, 9.927898645401e-07, 1.0691583156585693e-06, 1.1455267667770386e-06, 1.2218952178955078e-06, 1.298263669013977e-06, 1.3746321201324463e-06, 1.4510005712509155e-06, 1.5273690223693848e-06, 1.603737473487854e-06, 1.6801059246063232e-06, 1.7564743757247925e-06, 1.8328428268432617e-06, 1.909211277961731e-06, 1.9855797290802e-06, 2.0619481801986694e-06, 2.1383166313171387e-06, 2.214685082435608e-06, 2.291053533554077e-06, 2.3674219846725464e-06, 2.4437904357910156e-06]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 0.0, 381.0, 0.0, 0.0, 0.0, 195.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 11.0, 11.0, 11.0, 63.0, 108.0, 106.0, 321.0, 727.0, 1084.0, 9850.0, 4112516.0, 57411.0, 9664.0, 1560.0, 208.0, 332.0, 154.0, 49.0, 49.0, 23.0, 4.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.5762786865234375e-06, -3.4766271710395813e-06, -3.376975655555725e-06, -3.277324140071869e-06, -3.1776726245880127e-06, -3.0780211091041565e-06, -2.9783695936203003e-06, -2.878718078136444e-06, -2.779066562652588e-06, -2.6794150471687317e-06, -2.5797635316848755e-06, -2.4801120162010193e-06, -2.380460500717163e-06, -2.280808985233307e-06, -2.1811574697494507e-06, -2.0815059542655945e-06, -1.9818544387817383e-06, -1.882202923297882e-06, -1.7825514078140259e-06, -1.6828998923301697e-06, -1.5832483768463135e-06, -1.4835968613624573e-06, -1.383945345878601e-06, -1.2842938303947449e-06, -1.1846423149108887e-06, -1.0849907994270325e-06, -9.853392839431763e-07, -8.856877684593201e-07, -7.860362529754639e-07, -6.863847374916077e-07, -5.867332220077515e-07, -4.870817065238953e-07, -3.8743019104003906e-07, -2.8777867555618286e-07, -1.8812716007232666e-07, -8.847564458847046e-08, 1.1175870895385742e-08, 1.1082738637924194e-07, 2.1047890186309814e-07, 3.1013041734695435e-07, 4.0978193283081055e-07, 5.094334483146667e-07, 6.09084963798523e-07, 7.087364792823792e-07, 8.083879947662354e-07, 9.080395102500916e-07, 1.0076910257339478e-06, 1.107342541217804e-06, 1.2069940567016602e-06, 1.3066455721855164e-06, 1.4062970876693726e-06, 1.5059486031532288e-06, 1.605600118637085e-06, 1.7052516341209412e-06, 1.8049031496047974e-06, 1.9045546650886536e-06, 2.0042061805725098e-06, 2.103857696056366e-06, 2.203509211540222e-06, 2.3031607270240784e-06, 2.4028122425079346e-06, 2.5024637579917908e-06, 2.602115273475647e-06, 2.701766788959503e-06, 2.8014183044433594e-06]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 11.0, 0.0, 0.0, 27.0, 0.0, 137.0, 0.0, 0.0, 3734.0, 0.0, 126.0, 0.0, 0.0, 34.0, 0.0, 13.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.323680281639099e-07, -6.09084963798523e-07, -5.85801899433136e-07, -5.62518835067749e-07, -5.392357707023621e-07, -5.159527063369751e-07, -4.926696419715881e-07, -4.6938657760620117e-07, -4.461035132408142e-07, -4.2282044887542725e-07, -3.995373845100403e-07, -3.762543201446533e-07, -3.5297125577926636e-07, -3.296881914138794e-07, -3.0640512704849243e-07, -2.8312206268310547e-07, -2.598389983177185e-07, -2.3655593395233154e-07, -2.1327286958694458e-07, -1.8998980522155762e-07, -1.6670674085617065e-07, -1.434236764907837e-07, -1.2014061212539673e-07, -9.685754776000977e-08, -7.35744833946228e-08, -5.029141902923584e-08, -2.7008354663848877e-08, -3.725290298461914e-09, 1.955777406692505e-08, 4.284083843231201e-08, 6.612390279769897e-08, 8.940696716308594e-08, 1.126900315284729e-07, 1.3597309589385986e-07, 1.5925616025924683e-07, 1.825392246246338e-07, 2.0582228899002075e-07, 2.2910535335540771e-07, 2.523884177207947e-07, 2.7567148208618164e-07, 2.989545464515686e-07, 3.2223761081695557e-07, 3.4552067518234253e-07, 3.688037395477295e-07, 3.9208680391311646e-07, 4.153698682785034e-07, 4.386529326438904e-07, 4.6193599700927734e-07, 4.852190613746643e-07, 5.085021257400513e-07, 5.317851901054382e-07, 5.550682544708252e-07, 5.783513188362122e-07, 6.016343832015991e-07, 6.249174475669861e-07, 6.48200511932373e-07, 6.7148357629776e-07, 6.94766640663147e-07, 7.180497050285339e-07, 7.413327693939209e-07, 7.646158337593079e-07, 7.878988981246948e-07, 8.111819624900818e-07, 8.344650268554688e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 7.0, 5.0, 10.0, 10.0, 15.0, 20.0, 27.0, 27.0, 43.0, 70.0, 107.0, 203.0, 140.0, 68.0, 59.0, 43.0, 25.0, 22.0, 17.0, 11.0, 14.0, 11.0, 9.0, 11.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.0946599786620936e-06, -1.0689774398997542e-06, -1.0432947874505771e-06, -1.0176122486882377e-06, -9.919297099258984e-07, -9.66247171163559e-07, -9.405645187143818e-07, -9.148819799520425e-07, -8.891993843462842e-07, -8.63516788740526e-07, -8.378342499781866e-07, -8.121516543724283e-07, -7.864690587666701e-07, -7.607865200043307e-07, -7.351039243985724e-07, -7.094213287928142e-07, -6.837387900304748e-07, -6.580561944247165e-07, -6.323736556623771e-07, -6.066910600566189e-07, -5.810085212942795e-07, -5.553259256885212e-07, -5.29643330082763e-07, -5.039607913204236e-07, -4.782781957146653e-07, -4.525956285306165e-07, -4.269130613465677e-07, -4.0123046574080945e-07, -3.7554789855676063e-07, -3.498653313727118e-07, -3.2418273576695356e-07, -2.9850016858290473e-07, -2.728176013988559e-07, -2.471350342148071e-07, -2.2145245281990356e-07, -1.9576987142500002e-07, -1.700873042409512e-07, -1.4440473705690238e-07, -1.1872215566199884e-07, -9.30395742670953e-08, -6.735700708304648e-08, -4.1674432793570304e-08, -1.5991858504094125e-08, 9.690715785382054e-09, 3.537329007485823e-08, 6.105585725890705e-08, 8.673843865381059e-08, 1.1242102004871413e-07, 1.3810358723276295e-07, 1.6378615441681177e-07, 1.894687358117153e-07, 2.1515131720661884e-07, 2.4083388439066766e-07, 2.665164515747165e-07, 2.9219904718047474e-07, 3.1788161436452356e-07, 3.435641815485724e-07, 3.692467487326212e-07, 3.9492931591667e-07, 4.2061191152242827e-07, 4.462944787064771e-07, 4.719770458905259e-07, 4.976596414962842e-07, 5.233422371020424e-07, 5.490247758643818e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 9.0, 4.0, 8.0, 10.0, 13.0, 20.0, 23.0, 19.0, 23.0, 33.0, 27.0, 28.0, 43.0, 40.0, 40.0, 33.0, 39.0, 50.0, 47.0, 35.0, 38.0, 43.0, 31.0, 37.0, 39.0, 24.0, 33.0, 16.0, 22.0, 20.0, 23.0, 22.0, 15.0, 14.0, 15.0, 7.0, 10.0, 9.0, 5.0, 2.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.360576610906719e-07, -4.214798252633045e-07, -4.0690198943593714e-07, -3.9232415360856976e-07, -3.777463462029118e-07, -3.6316851037554443e-07, -3.4859067454817705e-07, -3.3401283872080967e-07, -3.194350028934423e-07, -3.048571670660749e-07, -2.9027933123870753e-07, -2.7570149541134015e-07, -2.6112365958397277e-07, -2.465458237566054e-07, -2.3196801635094744e-07, -2.1739018052358006e-07, -2.0281234469621268e-07, -1.882345088688453e-07, -1.7365667304147792e-07, -1.5907885142496525e-07, -1.4450101559759787e-07, -1.299231797702305e-07, -1.1534535104829047e-07, -1.0076752232635044e-07, -8.618968649898306e-08, -7.161185067161568e-08, -5.703402194967566e-08, -4.245618967502196e-08, -2.787835740036826e-08, -1.3300521573000879e-08, 1.277307148939144e-09, 1.5855135870879167e-08, 3.043300011995598e-08, 4.501083239460968e-08, 5.958866466926338e-08, 7.41664933912034e-08, 8.874432921857078e-08, 1.0332216504593816e-07, 1.1789999376787819e-07, 1.324778224898182e-07, 1.470556583171856e-07, 1.6163349414455297e-07, 1.7621132997192035e-07, 1.9078915158843301e-07, 2.053669874158004e-07, 2.1994482324316778e-07, 2.3452264485968044e-07, 2.491004806870478e-07, 2.636783165144152e-07, 2.782561523417826e-07, 2.9283398816914996e-07, 3.0741182399651734e-07, 3.219896598238847e-07, 3.365674956512521e-07, 3.5114530305691005e-07, 3.6572313888427743e-07, 3.803009747116448e-07, 3.948788105390122e-07, 4.0945664636637957e-07, 4.2403448219374695e-07, 4.386122895994049e-07, 4.531901254267723e-07, 4.6776796125413966e-07, 4.82345797081507e-07, 4.969236329088744e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 939.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1046662.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 900.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 0.0, 207.0, 0.0, 0.0, 0.0, 0.0, 346.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 0.0, 0.0, 109.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048572.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.0, 0.0, 65.0, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 671.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 68.0, 0.0, 61.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1013.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 14.0, 13.0, 11.0, 28.0, 21.0, 34.0, 50.0, 83.0, 143.0, 228.0, 99.0, 58.0, 49.0, 32.0, 23.0, 25.0, 19.0, 18.0, 4.0, 5.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.604514055652544e-07, -6.435934096771234e-07, -6.267354137889924e-07, -6.098774179008615e-07, -5.930194220127305e-07, -5.761614829680184e-07, -5.593034302364686e-07, -5.424454911917564e-07, -5.255874953036255e-07, -5.087294994154945e-07, -4.918715035273635e-07, -4.7501350763923256e-07, -4.58155540172811e-07, -4.4129754428468004e-07, -4.2443954839654907e-07, -4.075815525084181e-07, -3.9072355662028713e-07, -3.7386556073215615e-07, -3.570075648440252e-07, -3.4014959737760364e-07, -3.2329160148947267e-07, -3.064336056013417e-07, -2.895756097132107e-07, -2.7271761382507975e-07, -2.558596179369488e-07, -2.390016220488178e-07, -2.2214364037154155e-07, -2.0528564448341058e-07, -1.8842766280613432e-07, -1.7156966691800335e-07, -1.5471167102987238e-07, -1.378536751417414e-07, -1.2099570767531986e-07, -1.0413771889261625e-07, -8.727973010991263e-08, -7.042173422178166e-08, -5.356374543907805e-08, -3.670575665637443e-08, -1.984776076824346e-08, -2.9897719855398464e-09, 1.3868216797163768e-08, 3.072620557986738e-08, 4.7584197915284676e-08, 6.444219025070197e-08, 8.130017903340558e-08, 9.81581678161092e-08, 1.1501616370424017e-07, 1.3187414538151643e-07, 1.487321412696474e-07, 1.6559013715777837e-07, 1.8244811883505463e-07, 1.993061147231856e-07, 2.1616409640046186e-07, 2.3302209228859283e-07, 2.498800881767238e-07, 2.667380840648548e-07, 2.8359607995298575e-07, 3.004540758411167e-07, 3.173120717292477e-07, 3.3417006761737866e-07, 3.510280350838002e-07, 3.678860309719312e-07, 3.8474402686006215e-07, 4.016020227481931e-07, 4.1845999021461466e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 3.0, 9.0, 10.0, 7.0, 12.0, 26.0, 20.0, 21.0, 32.0, 42.0, 35.0, 48.0, 45.0, 48.0, 42.0, 58.0, 66.0, 44.0, 40.0, 47.0, 43.0, 44.0, 38.0, 29.0, 19.0, 24.0, 36.0, 19.0, 19.0, 14.0, 12.0, 8.0, 9.0, 3.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.631908498391567e-07, -3.5214796412219584e-07, -3.4110504998352553e-07, -3.3006216426656465e-07, -3.1901925012789434e-07, -3.0797636441093346e-07, -2.969334786939726e-07, -2.8589056455530226e-07, -2.748476788383414e-07, -2.638047931213805e-07, -2.527618789827102e-07, -2.417189932657493e-07, -2.306760933379337e-07, -2.196331934101181e-07, -2.0859029348230251e-07, -1.9754739355448692e-07, -1.8650449362667132e-07, -1.7546159369885572e-07, -1.6441869377104013e-07, -1.5337579384322453e-07, -1.4233290812626365e-07, -1.3129000819844805e-07, -1.2024710827063245e-07, -1.0920421544824421e-07, -9.816131552042862e-08, -8.711841559261302e-08, -7.607552277022478e-08, -6.503262284240918e-08, -5.3989726467307264e-08, -4.2946830092205346e-08, -3.190393016438975e-08, -2.086103734200151e-08, -9.818137414185912e-09, 1.2247598490944256e-09, 1.2267657112374764e-08, 2.331055526383352e-08, 3.435345163893544e-08, 4.539634801403736e-08, 5.6439247941852955e-08, 6.74821407642412e-08, 7.852504069205679e-08, 8.956794061987239e-08, 1.0061083344226063e-07, 1.1165373337007622e-07, 1.2269663329789182e-07, 1.337395190148527e-07, 1.4478243315352302e-07, 1.558253188704839e-07, 1.668682187982995e-07, 1.779111187261151e-07, 1.889540186539307e-07, 1.9999691858174629e-07, 2.1103980429870717e-07, 2.2208270422652276e-07, 2.3312560415433836e-07, 2.4416848987129924e-07, 2.5521140400996956e-07, 2.6625428972693044e-07, 2.7729720386560075e-07, 2.8834008958256163e-07, 2.9938300372123194e-07, 3.104258894381928e-07, 3.2146880357686314e-07, 3.32511689293824e-07, 3.435545750107849e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 7.0, 0.0, 0.0, 18.0, 0.0, 24.0, 0.0, 32.0, 0.0, 0.0, 135.0, 0.0, 397.0, 0.0, 0.0, 1703.0, 0.0, 22752.0, 0.0, 998642.0, 0.0, 0.0, 22598.0, 0.0, 1658.0, 0.0, 375.0, 0.0, 0.0, 132.0, 0.0, 31.0, 0.0, 0.0, 34.0, 0.0, 14.0, 0.0, 13.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.497146725654602e-07, -7.245689630508423e-07, -6.994232535362244e-07, -6.742775440216064e-07, -6.491318345069885e-07, -6.239861249923706e-07, -5.988404154777527e-07, -5.736947059631348e-07, -5.485489964485168e-07, -5.234032869338989e-07, -4.98257577419281e-07, -4.731118679046631e-07, -4.4796615839004517e-07, -4.2282044887542725e-07, -3.976747393608093e-07, -3.725290298461914e-07, -3.473833203315735e-07, -3.2223761081695557e-07, -2.9709190130233765e-07, -2.7194619178771973e-07, -2.468004822731018e-07, -2.2165477275848389e-07, -1.9650906324386597e-07, -1.7136335372924805e-07, -1.4621764421463013e-07, -1.210719347000122e-07, -9.592622518539429e-08, -7.078051567077637e-08, -4.563480615615845e-08, -2.0489096641540527e-08, 4.6566128730773926e-09, 2.9802322387695312e-08, 5.494803190231323e-08, 8.009374141693115e-08, 1.0523945093154907e-07, 1.30385160446167e-07, 1.555308699607849e-07, 1.8067657947540283e-07, 2.0582228899002075e-07, 2.3096799850463867e-07, 2.561137080192566e-07, 2.812594175338745e-07, 3.0640512704849243e-07, 3.3155083656311035e-07, 3.5669654607772827e-07, 3.818422555923462e-07, 4.069879651069641e-07, 4.3213367462158203e-07, 4.5727938413619995e-07, 4.824250936508179e-07, 5.075708031654358e-07, 5.327165126800537e-07, 5.578622221946716e-07, 5.830079317092896e-07, 6.081536412239075e-07, 6.332993507385254e-07, 6.584450602531433e-07, 6.835907697677612e-07, 7.087364792823792e-07, 7.338821887969971e-07, 7.59027898311615e-07, 7.841736078262329e-07, 8.093193173408508e-07, 8.344650268554688e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 17.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 70.0, 0.0, 0.0, 117.0, 0.0, 126.0, 0.0, 253.0, 0.0, 0.0, 118.0, 0.0, 85.0, 0.0, 70.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 11.0, 0.0, 13.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.497146725654602e-07, -7.245689630508423e-07, -6.994232535362244e-07, -6.742775440216064e-07, -6.491318345069885e-07, -6.239861249923706e-07, -5.988404154777527e-07, -5.736947059631348e-07, -5.485489964485168e-07, -5.234032869338989e-07, -4.98257577419281e-07, -4.731118679046631e-07, -4.4796615839004517e-07, -4.2282044887542725e-07, -3.976747393608093e-07, -3.725290298461914e-07, -3.473833203315735e-07, -3.2223761081695557e-07, -2.9709190130233765e-07, -2.7194619178771973e-07, -2.468004822731018e-07, -2.2165477275848389e-07, -1.9650906324386597e-07, -1.7136335372924805e-07, -1.4621764421463013e-07, -1.210719347000122e-07, -9.592622518539429e-08, -7.078051567077637e-08, -4.563480615615845e-08, -2.0489096641540527e-08, 4.6566128730773926e-09, 2.9802322387695312e-08, 5.494803190231323e-08, 8.009374141693115e-08, 1.0523945093154907e-07, 1.30385160446167e-07, 1.555308699607849e-07, 1.8067657947540283e-07, 2.0582228899002075e-07, 2.3096799850463867e-07, 2.561137080192566e-07, 2.812594175338745e-07, 3.0640512704849243e-07, 3.3155083656311035e-07, 3.5669654607772827e-07, 3.818422555923462e-07, 4.069879651069641e-07, 4.3213367462158203e-07, 4.5727938413619995e-07, 4.824250936508179e-07, 5.075708031654358e-07, 5.327165126800537e-07, 5.578622221946716e-07, 5.830079317092896e-07, 6.081536412239075e-07, 6.332993507385254e-07, 6.584450602531433e-07, 6.835907697677612e-07, 7.087364792823792e-07, 7.338821887969971e-07, 7.59027898311615e-07, 7.841736078262329e-07, 8.093193173408508e-07, 8.344650268554688e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 13.0, 15.0, 13.0, 39.0, 93.0, 227.0, 463.0, 1490.0, 12470.0, 1019571.0, 11903.0, 1377.0, 423.0, 245.0, 105.0, 48.0, 27.0, 11.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.0265579223632812e-06, -1.9669532775878906e-06, -1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 0.0, 17.0, 28.0, 39.0, 72.0, 88.0, 103.0, 0.0, 293.0, 111.0, 66.0, 62.0, 38.0, 0.0, 34.0, 24.0, 10.0, 6.0, 7.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.629875421524048e-07, -9.126961231231689e-07, -8.624047040939331e-07, -8.121132850646973e-07, -7.618218660354614e-07, -7.115304470062256e-07, -6.612390279769897e-07, -6.109476089477539e-07, -5.606561899185181e-07, -5.103647708892822e-07, -4.600733518600464e-07, -4.0978193283081055e-07, -3.594905138015747e-07, -3.0919909477233887e-07, -2.5890767574310303e-07, -2.086162567138672e-07, -1.5832483768463135e-07, -1.0803341865539551e-07, -5.774199962615967e-08, -7.450580596923828e-09, 4.284083843231201e-08, 9.313225746154785e-08, 1.434236764907837e-07, 1.9371509552001953e-07, 2.4400651454925537e-07, 2.942979335784912e-07, 3.4458935260772705e-07, 3.948807716369629e-07, 4.4517219066619873e-07, 4.954636096954346e-07, 5.457550287246704e-07, 5.960464477539062e-07, 6.463378667831421e-07, 6.966292858123779e-07, 7.469207048416138e-07, 7.972121238708496e-07, 8.475035429000854e-07, 8.977949619293213e-07, 9.480863809585571e-07, 9.98377799987793e-07, 1.0486692190170288e-06, 1.0989606380462646e-06, 1.1492520570755005e-06, 1.1995434761047363e-06, 1.2498348951339722e-06, 1.300126314163208e-06, 1.3504177331924438e-06, 1.4007091522216797e-06, 1.4510005712509155e-06, 1.5012919902801514e-06, 1.5515834093093872e-06, 1.601874828338623e-06, 1.6521662473678589e-06, 1.7024576663970947e-06, 1.7527490854263306e-06, 1.8030405044555664e-06, 1.8533319234848022e-06, 1.903623342514038e-06, 1.953914761543274e-06, 2.0042061805725098e-06, 2.0544975996017456e-06, 2.1047890186309814e-06, 2.1550804376602173e-06, 2.205371856689453e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [230.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048124.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 220.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.960464477539063e-08, -5.681067705154419e-08, -5.4016709327697754e-08, -5.122274160385132e-08, -4.842877388000488e-08, -4.563480615615845e-08, -4.284083843231201e-08, -4.0046870708465576e-08, -3.725290298461914e-08, -3.4458935260772705e-08, -3.166496753692627e-08, -2.8870999813079834e-08, -2.60770320892334e-08, -2.3283064365386963e-08, -2.0489096641540527e-08, -1.7695128917694092e-08, -1.4901161193847656e-08, -1.210719347000122e-08, -9.313225746154785e-09, -6.51925802230835e-09, -3.725290298461914e-09, -9.313225746154785e-10, 1.862645149230957e-09, 4.6566128730773926e-09, 7.450580596923828e-09, 1.0244548320770264e-08, 1.30385160446167e-08, 1.5832483768463135e-08, 1.862645149230957e-08, 2.1420419216156006e-08, 2.421438694000244e-08, 2.7008354663848877e-08, 2.9802322387695312e-08, 3.259629011154175e-08, 3.5390257835388184e-08, 3.818422555923462e-08, 4.0978193283081055e-08, 4.377216100692749e-08, 4.6566128730773926e-08, 4.936009645462036e-08, 5.21540641784668e-08, 5.494803190231323e-08, 5.774199962615967e-08, 6.05359673500061e-08, 6.332993507385254e-08, 6.612390279769897e-08, 6.891787052154541e-08, 7.171183824539185e-08, 7.450580596923828e-08, 7.729977369308472e-08, 8.009374141693115e-08, 8.288770914077759e-08, 8.568167686462402e-08, 8.847564458847046e-08, 9.12696123123169e-08, 9.406358003616333e-08, 9.685754776000977e-08, 9.96515154838562e-08, 1.0244548320770264e-07, 1.0523945093154907e-07, 1.0803341865539551e-07, 1.1082738637924194e-07, 1.1362135410308838e-07, 1.1641532182693481e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 466.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1047601.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 439.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1021.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 17.0, 30.0, 80.0, 188.0, 369.0, 157.0, 69.0, 35.0, 13.0, 12.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.395856656927208e-06, -1.3105021707815467e-06, -1.2251476846358855e-06, -1.1397931984902243e-06, -1.054438712344563e-06, -9.690842261989019e-07, -8.837297400532407e-07, -7.983752539075795e-07, -7.130207677619183e-07, -6.27666281616257e-07, -5.423117954705958e-07, -4.569573093249346e-07, -3.716028231792734e-07, -2.862483370336122e-07, -2.0089385088795098e-07, -1.1553936474228976e-07, -3.018487859662855e-08, 5.516960754903266e-08, 1.4052409369469387e-07, 2.258785798403551e-07, 3.112330659860163e-07, 3.965875521316775e-07, 4.819420382773387e-07, 5.672965244229999e-07, 6.526510105686611e-07, 7.380054967143224e-07, 8.233599828599836e-07, 9.087144690056448e-07, 9.94068955151306e-07, 1.0794234412969672e-06, 1.1647779274426284e-06, 1.2501324135882896e-06, 1.3354870134207886e-06, 1.4208414995664498e-06, 1.506195985712111e-06, 1.5915504718577722e-06, 1.6769049580034334e-06, 1.7622594441490946e-06, 1.8476139302947558e-06, 1.932968416440417e-06, 2.0183229025860783e-06, 2.1036773887317395e-06, 2.1890318748774007e-06, 2.274386361023062e-06, 2.359740847168723e-06, 2.4450953333143843e-06, 2.5304498194600455e-06, 2.6158043056057068e-06, 2.701158791751368e-06, 2.786513277897029e-06, 2.8718677640426904e-06, 2.9572222501883516e-06, 3.042576736334013e-06, 3.127931222479674e-06, 3.2132857086253352e-06, 3.2986401947709965e-06, 3.3839946809166577e-06, 3.469349167062319e-06, 3.55470365320798e-06, 3.6400581393536413e-06, 3.7254126254993025e-06, 3.8107671116449637e-06, 3.896121597790625e-06, 3.981475856562611e-06, 4.066830570081947e-06]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 14.0, 13.0, 19.0, 24.0, 23.0, 23.0, 40.0, 46.0, 40.0, 45.0, 44.0, 49.0, 52.0, 65.0, 74.0, 46.0, 52.0, 42.0, 56.0, 44.0, 51.0, 25.0, 18.0, 19.0, 19.0, 10.0, 7.0, 10.0, 8.0, 5.0, 7.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.577884063408419e-06, -1.5342516235250514e-06, -1.490619069954846e-06, -1.4469865163846407e-06, -1.403354076501273e-06, -1.3597216366179055e-06, -1.3160890830477001e-06, -1.2724565294774948e-06, -1.2288240895941271e-06, -1.1851916497107595e-06, -1.1415590961405542e-06, -1.0979265425703488e-06, -1.0542941026869812e-06, -1.0106616628036136e-06, -9.670291092334082e-07, -9.233966125066218e-07, -8.797641157798353e-07, -8.361316190530488e-07, -7.924991223262623e-07, -7.488666255994758e-07, -7.052341288726893e-07, -6.616016321459028e-07, -6.179691354191164e-07, -5.743366386923299e-07, -5.307041419655434e-07, -4.870716452387569e-07, -4.434391485119704e-07, -3.9980665178518393e-07, -3.5617415505839745e-07, -3.1254165833161096e-07, -2.689091616048245e-07, -2.25276664878038e-07, -1.8164428183808923e-07, -1.3801178511130274e-07, -9.437928838451626e-08, -5.074679165772977e-08, -7.114294930943288e-09, 3.65182017958432e-08, 8.015069852262968e-08, 1.2378319524941617e-07, 1.6741569197620265e-07, 2.1104818870298914e-07, 2.546806854297756e-07, 2.983131821565621e-07, 3.419456788833486e-07, 3.855781756101351e-07, 4.2921067233692156e-07, 4.7284316906370805e-07, 5.164756657904945e-07, 5.60108162517281e-07, 6.037406592440675e-07, 6.47373155970854e-07, 6.910056526976405e-07, 7.34638149424427e-07, 7.782706461512134e-07, 8.219031428779999e-07, 8.655356396047864e-07, 9.091681363315729e-07, 9.528006330583594e-07, 9.96433072941727e-07, 1.0400656265119324e-06, 1.0836981800821377e-06, 1.1273306199655053e-06, 1.170963059848873e-06, 1.2145956134190783e-06]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 6.0, 21.0, 18.0, 25.0, 23.0, 44.0, 42.0, 64.0, 68.0, 59.0, 54.0, 110.0, 79.0, 71.0, 171.0, 1048913.0, 64.0, 133.0, 78.0, 61.0, 101.0, 50.0, 52.0, 40.0, 35.0, 34.0, 21.0, 29.0, 21.0, 20.0, 7.0, 11.0, 13.0, 11.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.600088464532746e-06, -2.517423126846552e-06, -2.4347580165340332e-06, -2.352092678847839e-06, -2.2694275685353205e-06, -2.1867622308491264e-06, -2.1040968931629322e-06, -2.021431555476738e-06, -1.9387664451642195e-06, -1.856101221164863e-06, -1.7734359971655067e-06, -1.6907706594793126e-06, -1.6081054354799562e-06, -1.5254402114805998e-06, -1.4427748737944057e-06, -1.3601096497950493e-06, -1.277444425795693e-06, -1.1947792017963366e-06, -1.1121139777969802e-06, -1.029448640110786e-06, -9.467834161114297e-07, -8.641181921120733e-07, -7.814529112692981e-07, -6.987876304265228e-07, -6.161224064271664e-07, -5.3345718242781e-07, -4.507919015850348e-07, -3.68126649163969e-07, -2.8546139674290316e-07, -2.0279614432183735e-07, -1.2013089190077153e-07, -3.7465611057996284e-08, 4.519938556768466e-08, 1.2786463798875047e-07, 2.105298904098163e-07, 2.931951428308821e-07, 3.758603952519479e-07, 4.5852564767301374e-07, 5.411909000940796e-07, 6.238561809368548e-07, 7.065214049362112e-07, 7.891866289355676e-07, 8.718519097783428e-07, 9.54517190621118e-07, 1.0371824146204744e-06, 1.1198476386198308e-06, 1.202512976306025e-06, 1.2851782003053813e-06, 1.3678434243047377e-06, 1.450508648304094e-06, 1.5331738723034505e-06, 1.6158392099896446e-06, 1.698504433989001e-06, 1.7811696579883574e-06, 1.8638349956745515e-06, 1.94650010598707e-06, 2.0291654436732642e-06, 2.1118307813594583e-06, 2.194495891671977e-06, 2.277161229358171e-06, 2.3598263396706898e-06, 2.442491677356884e-06, 2.525157015043078e-06, 2.607822352729272e-06, 2.6904874630417908e-06]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 22.0, 91.0, 1767.0, 51468000.0, 1257.0, 132.0, 35.0, 15.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-187.375, -183.72265625, -180.0703125, -176.41796875, -172.765625, -169.11328125, -165.4609375, -161.80859375, -158.15625, -154.50390625, -150.8515625, -147.19921875, -143.546875, -139.89453125, -136.2421875, -132.58984375, -128.9375, -125.28515625, -121.6328125, -117.98046875, -114.328125, -110.67578125, -107.0234375, -103.37109375, -99.71875, -96.06640625, -92.4140625, -88.76171875, -85.109375, -81.45703125, -77.8046875, -74.15234375, -70.5, -66.84765625, -63.1953125, -59.54296875, -55.890625, -52.23828125, -48.5859375, -44.93359375, -41.28125, -37.62890625, -33.9765625, -30.32421875, -26.671875, -23.01953125, -19.3671875, -15.71484375, -12.0625, -8.41015625, -4.7578125, -1.10546875, 2.546875, 6.19921875, 9.8515625, 13.50390625, 17.15625, 20.80859375, 24.4609375, 28.11328125, 31.765625, 35.41796875, 39.0703125, 42.72265625, 46.375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 2.0, 7.0, 1.0, 4.0, 9.0, 6.0, 5.0, 19.0, 8.0, 16.0, 9.0, 23.0, 24.0, 34.0, 31.0, 45.0, 42.0, 52.0, 66.0, 81.0, 103.0, 133.0, 191.0, 352.0, 1018.0, 5593526.0, 693157.0, 1117.0, 373.0, 170.0, 151.0, 91.0, 80.0, 72.0, 71.0, 64.0, 48.0, 42.0, 37.0, 32.0, 21.0, 21.0, 11.0, 18.0, 12.0, 10.0, 7.0, 6.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2041015625, -0.19706344604492188, -0.19002532958984375, -0.18298721313476562, -0.1759490966796875, -0.16891098022460938, -0.16187286376953125, -0.15483474731445312, -0.147796630859375, -0.14075851440429688, -0.13372039794921875, -0.12668228149414062, -0.1196441650390625, -0.11260604858398438, -0.10556793212890625, -0.09852981567382812, -0.09149169921875, -0.08445358276367188, -0.07741546630859375, -0.07037734985351562, -0.0633392333984375, -0.056301116943359375, -0.04926300048828125, -0.042224884033203125, -0.035186767578125, -0.028148651123046875, -0.02111053466796875, -0.014072418212890625, -0.0070343017578125, 3.814697265625e-06, 0.00704193115234375, 0.014080047607421875, 0.0211181640625, 0.028156280517578125, 0.03519439697265625, 0.042232513427734375, 0.0492706298828125, 0.056308746337890625, 0.06334686279296875, 0.07038497924804688, 0.077423095703125, 0.08446121215820312, 0.09149932861328125, 0.09853744506835938, 0.1055755615234375, 0.11261367797851562, 0.11965179443359375, 0.12668991088867188, 0.13372802734375, 0.14076614379882812, 0.14780426025390625, 0.15484237670898438, 0.1618804931640625, 0.16891860961914062, 0.17595672607421875, 0.18299484252929688, 0.190032958984375, 0.19707107543945312, 0.20410919189453125, 0.21114730834960938, 0.2181854248046875, 0.22522354125976562, 0.23226165771484375, 0.23929977416992188, 0.246337890625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 6.0, 6.0, 16.0, 15.0, 8.0, 17.0, 29.0, 17.0, 30.0, 26.0, 24.0, 35.0, 35.0, 30.0, 44.0, 47.0, 37.0, 56.0, 1038.0, 79.0, 46.0, 47.0, 39.0, 23.0, 27.0, 31.0, 24.0, 21.0, 20.0, 23.0, 21.0, 19.0, 9.0, 11.0, 12.0, 5.0, 10.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.716796875, -9.40234375, -9.087890625, -8.7734375, -8.458984375, -8.14453125, -7.830078125, -7.515625, -7.201171875, -6.88671875, -6.572265625, -6.2578125, -5.943359375, -5.62890625, -5.314453125, -5.0, -4.685546875, -4.37109375, -4.056640625, -3.7421875, -3.427734375, -3.11328125, -2.798828125, -2.484375, -2.169921875, -1.85546875, -1.541015625, -1.2265625, -0.912109375, -0.59765625, -0.283203125, 0.03125, 0.345703125, 0.66015625, 0.974609375, 1.2890625, 1.603515625, 1.91796875, 2.232421875, 2.546875, 2.861328125, 3.17578125, 3.490234375, 3.8046875, 4.119140625, 4.43359375, 4.748046875, 5.0625, 5.376953125, 5.69140625, 6.005859375, 6.3203125, 6.634765625, 6.94921875, 7.263671875, 7.578125, 7.892578125, 8.20703125, 8.521484375, 8.8359375, 9.150390625, 9.46484375, 9.779296875, 10.09375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 10.0, 10.0, 12.0, 12.0, 25.0, 38.0, 61.0, 83.0, 123.0, 253.0, 467.0, 1337.0, 6246347.0, 40467.0, 1128.0, 436.0, 211.0, 130.0, 67.0, 56.0, 39.0, 35.0, 25.0, 10.0, 6.0, 3.0, 2.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30615234375, -0.2955780029296875, -0.285003662109375, -0.2744293212890625, -0.26385498046875, -0.2532806396484375, -0.242706298828125, -0.2321319580078125, -0.2215576171875, -0.2109832763671875, -0.200408935546875, -0.1898345947265625, -0.17926025390625, -0.1686859130859375, -0.158111572265625, -0.1475372314453125, -0.136962890625, -0.1263885498046875, -0.115814208984375, -0.1052398681640625, -0.09466552734375, -0.0840911865234375, -0.073516845703125, -0.0629425048828125, -0.0523681640625, -0.0417938232421875, -0.031219482421875, -0.0206451416015625, -0.01007080078125, 0.0005035400390625, 0.011077880859375, 0.0216522216796875, 0.0322265625, 0.0428009033203125, 0.053375244140625, 0.0639495849609375, 0.07452392578125, 0.0850982666015625, 0.095672607421875, 0.1062469482421875, 0.1168212890625, 0.1273956298828125, 0.137969970703125, 0.1485443115234375, 0.15911865234375, 0.1696929931640625, 0.180267333984375, 0.1908416748046875, 0.201416015625, 0.2119903564453125, 0.222564697265625, 0.2331390380859375, 0.24371337890625, 0.2542877197265625, 0.264862060546875, 0.2754364013671875, 0.2860107421875, 0.2965850830078125, 0.307159423828125, 0.3177337646484375, 0.32830810546875, 0.3388824462890625, 0.349456787109375, 0.3600311279296875, 0.37060546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 134.0, 1886.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1708984375, -0.16702747344970703, -0.16315650939941406, -0.1592855453491211, -0.15541458129882812, -0.15154361724853516, -0.1476726531982422, -0.14380168914794922, -0.13993072509765625, -0.13605976104736328, -0.1321887969970703, -0.12831783294677734, -0.12444686889648438, -0.1205759048461914, -0.11670494079589844, -0.11283397674560547, -0.1089630126953125, -0.10509204864501953, -0.10122108459472656, -0.0973501205444336, -0.09347915649414062, -0.08960819244384766, -0.08573722839355469, -0.08186626434326172, -0.07799530029296875, -0.07412433624267578, -0.07025337219238281, -0.06638240814208984, -0.06251144409179688, -0.058640480041503906, -0.05476951599121094, -0.05089855194091797, -0.047027587890625, -0.04315662384033203, -0.03928565979003906, -0.035414695739746094, -0.031543731689453125, -0.027672767639160156, -0.023801803588867188, -0.01993083953857422, -0.01605987548828125, -0.012188911437988281, -0.008317947387695312, -0.004446983337402344, -0.000576019287109375, 0.0032949447631835938, 0.0071659088134765625, 0.011036872863769531, 0.0149078369140625, 0.01877880096435547, 0.022649765014648438, 0.026520729064941406, 0.030391693115234375, 0.034262657165527344, 0.03813362121582031, 0.04200458526611328, 0.04587554931640625, 0.04974651336669922, 0.05361747741699219, 0.057488441467285156, 0.061359405517578125, 0.0652303695678711, 0.06910133361816406, 0.07297229766845703, 0.07684326171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 8.0, 15.0, 14.0, 19.0, 33.0, 42.0, 44.0, 99.0, 119.0, 197.0, 277.0, 430.0, 669.0, 1181.0, 2178.0, 3948.0, 8453.0, 20877.0, 69718.0, 580997.0, 5378044.0, 162737.0, 35953.0, 12578.0, 5804.0, 2880.0, 1601.0, 937.0, 546.0, 342.0, 232.0, 144.0, 98.0, 60.0, 43.0, 38.0, 24.0, 13.0, 11.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.01080322265625, -0.010487794876098633, -0.010172367095947266, -0.009856939315795898, -0.009541511535644531, -0.009226083755493164, -0.008910655975341797, -0.00859522819519043, -0.008279800415039062, -0.007964372634887695, -0.007648944854736328, -0.007333517074584961, -0.007018089294433594, -0.0067026615142822266, -0.006387233734130859, -0.006071805953979492, -0.005756378173828125, -0.005440950393676758, -0.005125522613525391, -0.0048100948333740234, -0.004494667053222656, -0.004179239273071289, -0.003863811492919922, -0.0035483837127685547, -0.0032329559326171875, -0.0029175281524658203, -0.002602100372314453, -0.002286672592163086, -0.0019712448120117188, -0.0016558170318603516, -0.0013403892517089844, -0.0010249614715576172, -0.00070953369140625, -0.0003941059112548828, -7.867813110351562e-05, 0.00023674964904785156, 0.0005521774291992188, 0.0008676052093505859, 0.0011830329895019531, 0.0014984607696533203, 0.0018138885498046875, 0.0021293163299560547, 0.002444744110107422, 0.002760171890258789, 0.0030755996704101562, 0.0033910274505615234, 0.0037064552307128906, 0.004021883010864258, 0.004337310791015625, 0.004652738571166992, 0.004968166351318359, 0.0052835941314697266, 0.005599021911621094, 0.005914449691772461, 0.006229877471923828, 0.006545305252075195, 0.0068607330322265625, 0.00717616081237793, 0.007491588592529297, 0.007807016372680664, 0.008122444152832031, 0.008437871932983398, 0.008753299713134766, 0.009068727493286133, 0.0093841552734375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 1.0, 4.0, 5.0, 6.0, 15.0, 10.0, 14.0, 13.0, 27.0, 35.0, 50.0, 66.0, 133.0, 228.0, 701.0, 259.0, 143.0, 106.0, 70.0, 38.0, 28.0, 18.0, 13.0, 12.0, 3.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0209503173828125, -0.020341873168945312, -0.019733428955078125, -0.019124984741210938, -0.01851654052734375, -0.017908096313476562, -0.017299652099609375, -0.016691207885742188, -0.016082763671875, -0.015474319458007812, -0.014865875244140625, -0.014257431030273438, -0.01364898681640625, -0.013040542602539062, -0.012432098388671875, -0.011823654174804688, -0.0112152099609375, -0.010606765747070312, -0.009998321533203125, -0.009389877319335938, -0.00878143310546875, -0.008172988891601562, -0.007564544677734375, -0.0069561004638671875, -0.00634765625, -0.0057392120361328125, -0.005130767822265625, -0.0045223236083984375, -0.00391387939453125, -0.0033054351806640625, -0.002696990966796875, -0.0020885467529296875, -0.0014801025390625, -0.0008716583251953125, -0.000263214111328125, 0.0003452301025390625, 0.00095367431640625, 0.0015621185302734375, 0.002170562744140625, 0.0027790069580078125, 0.003387451171875, 0.0039958953857421875, 0.004604339599609375, 0.0052127838134765625, 0.00582122802734375, 0.0064296722412109375, 0.007038116455078125, 0.0076465606689453125, 0.0082550048828125, 0.008863449096679688, 0.009471893310546875, 0.010080337524414062, 0.01068878173828125, 0.011297225952148438, 0.011905670166015625, 0.012514114379882812, 0.01312255859375, 0.013731002807617188, 0.014339447021484375, 0.014947891235351562, 0.01555633544921875, 0.016164779663085938, 0.016773223876953125, 0.017381668090820312, 0.0179901123046875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 14.0, 42.0, 293.0, 338.0, 147.0, 73.0, 47.0, 24.0, 15.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.1489819437265396, -0.1460566520690918, -0.14313136041164398, -0.14020606875419617, -0.13728079199790955, -0.13435550034046173, -0.13143020868301392, -0.1285049170255661, -0.1255796253681183, -0.12265433371067047, -0.11972904205322266, -0.11680375784635544, -0.11387846618890762, -0.11095317453145981, -0.10802789032459259, -0.10510259866714478, -0.10217730700969696, -0.09925201535224915, -0.09632672369480133, -0.09340143948793411, -0.0904761478304863, -0.08755085617303848, -0.08462557196617126, -0.08170028030872345, -0.07877498865127563, -0.07584969699382782, -0.07292440533638, -0.06999912112951279, -0.06707382947206497, -0.06414853781461716, -0.06122324988245964, -0.058297961950302124, -0.05537266284227371, -0.0524473711848259, -0.04952208325266838, -0.046596795320510864, -0.04367150366306305, -0.040746212005615234, -0.03782092407345772, -0.0348956361413002, -0.031970344483852386, -0.02904505468904972, -0.026119764894247055, -0.02319447509944439, -0.020269185304641724, -0.017343895509839058, -0.014418605715036392, -0.011493315920233727, -0.00856802612543106, -0.005642736330628395, -0.0027174465358257294, 0.00020784325897693634, 0.003133133053779602, 0.006058422848582268, 0.008983712643384933, 0.0119090024381876, 0.014834292232990265, 0.01775958202779293, 0.020684871822595596, 0.023610161617398262, 0.026535451412200928, 0.029460741207003593, 0.03238603100180626, 0.035311318933963776, 0.03823661059141159]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 3.0, 5.0, 7.0, 6.0, 8.0, 10.0, 8.0, 16.0, 13.0, 18.0, 18.0, 25.0, 18.0, 33.0, 38.0, 33.0, 28.0, 35.0, 52.0, 34.0, 33.0, 39.0, 45.0, 38.0, 38.0, 32.0, 39.0, 35.0, 39.0, 31.0, 25.0, 31.0, 29.0, 22.0, 16.0, 13.0, 13.0, 14.0, 9.0, 9.0, 10.0, 4.0, 6.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.029070556163787842, -0.028235023841261864, -0.027399491518735886, -0.026563959196209908, -0.02572842687368393, -0.02489289455115795, -0.024057362228631973, -0.023221829906105995, -0.022386297583580017, -0.02155076526105404, -0.02071523293852806, -0.019879700616002083, -0.019044168293476105, -0.018208635970950127, -0.01737310364842415, -0.01653757132589817, -0.015702039003372192, -0.014866506680846214, -0.014030974358320236, -0.013195442035794258, -0.01235990971326828, -0.011524377390742302, -0.010688845068216324, -0.009853312745690346, -0.009017780423164368, -0.00818224810063839, -0.0073467157781124115, -0.006511183455586433, -0.005675651133060455, -0.004840118810534477, -0.004004586488008499, -0.003169054165482521, -0.002333521842956543, -0.0014979895204305649, -0.0006624571979045868, 0.0001730751246213913, 0.0010086074471473694, 0.0018441397696733475, 0.0026796720921993256, 0.0035152044147253036, 0.004350736737251282, 0.00518626905977726, 0.006021801382303238, 0.006857333704829216, 0.007692866027355194, 0.008528398349881172, 0.00936393067240715, 0.010199462994933128, 0.011034995317459106, 0.011870527639985085, 0.012706059962511063, 0.01354159228503704, 0.014377124607563019, 0.015212656930088997, 0.016048189252614975, 0.016883721575140953, 0.01771925389766693, 0.01855478622019291, 0.019390318542718887, 0.020225850865244865, 0.021061383187770844, 0.02189691551029682, 0.0227324478328228, 0.023567980155348778, 0.024403512477874756]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 21.0, 33.0, 70.0, 192.0, 351.0, 748.0, 2120.0, 7310.0, 28907.0, 301804.0, 3800663.0, 36975.0, 8818.0, 3339.0, 1399.0, 663.0, 279.0, 143.0, 86.0, 65.0, 62.0, 50.0, 41.0, 31.0, 23.0, 29.0, 19.0, 7.0, 12.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00043392181396484375, -0.0004111975431442261, -0.0003884732723236084, -0.0003657490015029907, -0.00034302473068237305, -0.00032030045986175537, -0.0002975761890411377, -0.00027485191822052, -0.00025212764739990234, -0.00022940337657928467, -0.000206679105758667, -0.00018395483493804932, -0.00016123056411743164, -0.00013850629329681396, -0.00011578202247619629, -9.305775165557861e-05, -7.033348083496094e-05, -4.760921001434326e-05, -2.4884939193725586e-05, -2.16066837310791e-06, 2.0563602447509766e-05, 4.328787326812744e-05, 6.601214408874512e-05, 8.873641490936279e-05, 0.00011146068572998047, 0.00013418495655059814, 0.00015690922737121582, 0.0001796334981918335, 0.00020235776901245117, 0.00022508203983306885, 0.0002478063106536865, 0.0002705305814743042, 0.0002932548522949219, 0.00031597912311553955, 0.0003387033939361572, 0.0003614276647567749, 0.0003841519355773926, 0.00040687620639801025, 0.00042960047721862793, 0.0004523247480392456, 0.0004750490188598633, 0.000497773289680481, 0.0005204975605010986, 0.0005432218313217163, 0.000565946102142334, 0.0005886703729629517, 0.0006113946437835693, 0.000634118914604187, 0.0006568431854248047, 0.0006795674562454224, 0.00070229172706604, 0.0007250159978866577, 0.0007477402687072754, 0.0007704645395278931, 0.0007931888103485107, 0.0008159130811691284, 0.0008386373519897461, 0.0008613616228103638, 0.0008840858936309814, 0.0009068101644515991, 0.0009295344352722168, 0.0009522587060928345, 0.0009749829769134521, 0.0009977072477340698, 0.0010204315185546875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 7.0, 10.0, 17.0, 24.0, 21.0, 40.0, 83.0, 113.0, 175.0, 164.0, 136.0, 60.0, 53.0, 32.0, 21.0, 17.0, 7.0, 6.0, 1.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47955322265625e-05, -2.3502856492996216e-05, -2.221018075942993e-05, -2.0917505025863647e-05, -1.9624829292297363e-05, -1.833215355873108e-05, -1.7039477825164795e-05, -1.574680209159851e-05, -1.4454126358032227e-05, -1.3161450624465942e-05, -1.1868774890899658e-05, -1.0576099157333374e-05, -9.28342342376709e-06, -7.990747690200806e-06, -6.6980719566345215e-06, -5.405396223068237e-06, -4.112720489501953e-06, -2.820044755935669e-06, -1.5273690223693848e-06, -2.3469328880310059e-07, 1.0579824447631836e-06, 2.3506581783294678e-06, 3.643333911895752e-06, 4.936009645462036e-06, 6.22868537902832e-06, 7.5213611125946045e-06, 8.814036846160889e-06, 1.0106712579727173e-05, 1.1399388313293457e-05, 1.2692064046859741e-05, 1.3984739780426025e-05, 1.527741551399231e-05, 1.6570091247558594e-05, 1.7862766981124878e-05, 1.9155442714691162e-05, 2.0448118448257446e-05, 2.174079418182373e-05, 2.3033469915390015e-05, 2.43261456489563e-05, 2.5618821382522583e-05, 2.6911497116088867e-05, 2.820417284965515e-05, 2.9496848583221436e-05, 3.078952431678772e-05, 3.2082200050354004e-05, 3.337487578392029e-05, 3.466755151748657e-05, 3.5960227251052856e-05, 3.725290298461914e-05, 3.8545578718185425e-05, 3.983825445175171e-05, 4.113093018531799e-05, 4.242360591888428e-05, 4.371628165245056e-05, 4.5008957386016846e-05, 4.630163311958313e-05, 4.7594308853149414e-05, 4.88869845867157e-05, 5.017966032028198e-05, 5.1472336053848267e-05, 5.276501178741455e-05, 5.4057687520980835e-05, 5.535036325454712e-05, 5.66430389881134e-05, 5.793571472167969e-05]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 13.0, 19.0, 44.0, 41.0, 91.0, 197.0, 613.0, 2183.0, 10362.0, 71318.0, 3937228.0, 152648.0, 15252.0, 2891.0, 630.0, 227.0, 121.0, 79.0, 54.0, 41.0, 45.0, 40.0, 25.0, 19.0, 32.0, 20.0, 10.0, 9.0, 7.0, 6.0, 9.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002086162567138672, -0.00019526854157447815, -0.0001819208264350891, -0.00016857311129570007, -0.00015522539615631104, -0.000141877681016922, -0.00012852996587753296, -0.00011518225073814392, -0.00010183453559875488, -8.848682045936584e-05, -7.51391053199768e-05, -6.179139018058777e-05, -4.844367504119873e-05, -3.509595990180969e-05, -2.1748244762420654e-05, -8.400529623031616e-06, 4.947185516357422e-06, 1.829490065574646e-05, 3.16426157951355e-05, 4.4990330934524536e-05, 5.8338046073913574e-05, 7.168576121330261e-05, 8.503347635269165e-05, 9.838119149208069e-05, 0.00011172890663146973, 0.00012507662177085876, 0.0001384243369102478, 0.00015177205204963684, 0.00016511976718902588, 0.00017846748232841492, 0.00019181519746780396, 0.000205162912607193, 0.00021851062774658203, 0.00023185834288597107, 0.0002452060580253601, 0.00025855377316474915, 0.0002719014883041382, 0.0002852492034435272, 0.00029859691858291626, 0.0003119446337223053, 0.00032529234886169434, 0.0003386400640010834, 0.0003519877791404724, 0.00036533549427986145, 0.0003786832094192505, 0.0003920309245586395, 0.00040537863969802856, 0.0004187263548374176, 0.00043207406997680664, 0.0004454217851161957, 0.0004587695002555847, 0.00047211721539497375, 0.0004854649305343628, 0.0004988126456737518, 0.0005121603608131409, 0.0005255080759525299, 0.0005388557910919189, 0.000552203506231308, 0.000565551221370697, 0.0005788989365100861, 0.0005922466516494751, 0.0006055943667888641, 0.0006189420819282532, 0.0006322897970676422, 0.0006456375122070312]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 12.0, 3.0, 7.0, 8.0, 8.0, 19.0, 30.0, 20.0, 29.0, 38.0, 32.0, 32.0, 50.0, 40.0, 57.0, 57.0, 55.0, 92.0, 89.0, 446.0, 2150.0, 330.0, 151.0, 83.0, 81.0, 54.0, 29.0, 21.0, 21.0, 15.0, 9.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00015115737915039062, -0.00014804396778345108, -0.00014493055641651154, -0.000141817145049572, -0.00013870373368263245, -0.0001355903223156929, -0.00013247691094875336, -0.0001293634995818138, -0.00012625008821487427, -0.00012313667684793472, -0.00012002326548099518, -0.00011690985411405563, -0.00011379644274711609, -0.00011068303138017654, -0.000107569620013237, -0.00010445620864629745, -0.00010134279727935791, -9.822938591241837e-05, -9.511597454547882e-05, -9.200256317853928e-05, -8.888915181159973e-05, -8.577574044466019e-05, -8.266232907772064e-05, -7.95489177107811e-05, -7.643550634384155e-05, -7.332209497690201e-05, -7.020868360996246e-05, -6.709527224302292e-05, -6.398186087608337e-05, -6.086844950914383e-05, -5.7755038142204285e-05, -5.464162677526474e-05, -5.1528215408325195e-05, -4.841480404138565e-05, -4.5301392674446106e-05, -4.218798130750656e-05, -3.9074569940567017e-05, -3.596115857362747e-05, -3.284774720668793e-05, -2.9734335839748383e-05, -2.6620924472808838e-05, -2.3507513105869293e-05, -2.039410173892975e-05, -1.7280690371990204e-05, -1.416727900505066e-05, -1.1053867638111115e-05, -7.94045627117157e-06, -4.827044904232025e-06, -1.7136335372924805e-06, 1.3997778296470642e-06, 4.513189196586609e-06, 7.6266005635261536e-06, 1.0740011930465698e-05, 1.3853423297405243e-05, 1.6966834664344788e-05, 2.0080246031284332e-05, 2.3193657398223877e-05, 2.630706876516342e-05, 2.9420480132102966e-05, 3.253389149904251e-05, 3.5647302865982056e-05, 3.87607142329216e-05, 4.1874125599861145e-05, 4.498753696680069e-05, 4.8100948333740234e-05]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 11.0, 92.0, 763.0, 138.0, 13.0], "bins": [-0.03237712010741234, -0.03185210004448891, -0.03132707625627518, -0.030802056193351746, -0.030277034267783165, -0.029752012342214584, -0.029226992279291153, -0.028701970353722572, -0.02817694842815399, -0.02765192650258541, -0.02712690643966198, -0.0266018845140934, -0.02607686258852482, -0.025551840662956238, -0.025026820600032806, -0.024501798674464226, -0.023976776748895645, -0.023451754823327065, -0.022926734760403633, -0.022401712834835052, -0.021876690909266472, -0.02135166898369789, -0.02082664892077446, -0.02030162699520588, -0.019776606932282448, -0.019251585006713867, -0.018726564943790436, -0.018201543018221855, -0.017676521092653275, -0.017151499167084694, -0.016626479104161263, -0.016101457178592682, -0.01557643711566925, -0.015051416121423244, -0.014526394195854664, -0.014001373201608658, -0.013476351276040077, -0.012951330281794071, -0.012426309287548065, -0.011901287361979485, -0.011376265436410904, -0.010851244442164898, -0.010326222516596317, -0.009801201522350311, -0.00927617959678173, -0.008751158602535725, -0.008226137608289719, -0.007701115682721138, -0.007176094222813845, -0.006651072762906551, -0.006126051302999258, -0.005601029843091965, -0.005076008848845959, -0.004550986923277378, -0.004025965929031372, -0.0035009444691240788, -0.0029759230092167854, -0.002450901549309492, -0.0019258802058175206, -0.0014008588623255491, -0.0008758374024182558, -0.0003508159425109625, 0.00017420528456568718, 0.0006992267444729805, 0.0012242482043802738]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 9.0, 7.0, 7.0, 17.0, 30.0, 35.0, 36.0, 49.0, 59.0, 43.0, 54.0, 61.0, 67.0, 56.0, 76.0, 63.0, 43.0, 58.0, 50.0, 39.0, 47.0, 31.0, 17.0, 18.0, 8.0, 11.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0026930570602416992, -0.0026246896013617516, -0.002556322142481804, -0.0024879546836018562, -0.0024195872247219086, -0.002351219765841961, -0.0022828523069620132, -0.0022144848480820656, -0.002146117389202118, -0.0020777499303221703, -0.0020093824714422226, -0.001941015012562275, -0.0018726475536823273, -0.0018042800948023796, -0.001735912635922432, -0.0016675451770424843, -0.0015991777181625366, -0.001530810259282589, -0.0014624428004026413, -0.0013940753415226936, -0.001325707882642746, -0.0012573404237627983, -0.0011889729648828506, -0.001120605506002903, -0.0010522380471229553, -0.0009838705882430077, -0.00091550312936306, -0.0008471356704831123, -0.0007787682116031647, -0.000710400752723217, -0.0006420332938432693, -0.0005736658349633217, -0.000505298376083374, -0.00043693091720342636, -0.0003685634583234787, -0.00030019599944353104, -0.00023182854056358337, -0.0001634610816836357, -9.509362280368805e-05, -2.6726163923740387e-05, 4.1641294956207275e-05, 0.00011000875383615494, 0.0001783762127161026, 0.00024674367159605026, 0.0003151111304759979, 0.0003834785893559456, 0.00045184604823589325, 0.0005202135071158409, 0.0005885809659957886, 0.0006569484248757362, 0.0007253158837556839, 0.0007936833426356316, 0.0008620508015155792, 0.0009304182603955269, 0.0009987857192754745, 0.0010671531781554222, 0.0011355206370353699, 0.0012038880959153175, 0.0012722555547952652, 0.0013406230136752129, 0.0014089904725551605, 0.0014773579314351082, 0.0015457253903150558, 0.0016140928491950035, 0.0016824603080749512]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 9.0, 4.0, 9.0, 10.0, 17.0, 24.0, 45.0, 69.0, 102.0, 163.0, 266.0, 534.0, 1126.0, 3110.0, 10915.0, 99446.0, 880938.0, 40494.0, 6947.0, 2282.0, 935.0, 433.0, 282.0, 125.0, 87.0, 58.0, 35.0, 18.0, 15.0, 17.0, 5.0, 8.0, 11.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0011463165283203125, -0.0011171773076057434, -0.0010880380868911743, -0.0010588988661766052, -0.0010297596454620361, -0.001000620424747467, -0.000971481204032898, -0.0009423419833183289, -0.0009132027626037598, -0.0008840635418891907, -0.0008549243211746216, -0.0008257851004600525, -0.0007966458797454834, -0.0007675066590309143, -0.0007383674383163452, -0.0007092282176017761, -0.000680088996887207, -0.0006509497761726379, -0.0006218105554580688, -0.0005926713347434998, -0.0005635321140289307, -0.0005343928933143616, -0.0005052536725997925, -0.0004761144518852234, -0.0004469752311706543, -0.0004178360104560852, -0.0003886967897415161, -0.000359557569026947, -0.00033041834831237793, -0.00030127912759780884, -0.00027213990688323975, -0.00024300068616867065, -0.00021386146545410156, -0.00018472224473953247, -0.00015558302402496338, -0.0001264438033103943, -9.73045825958252e-05, -6.81653618812561e-05, -3.902614116668701e-05, -9.88692045211792e-06, 1.9252300262451172e-05, 4.8391520977020264e-05, 7.753074169158936e-05, 0.00010666996240615845, 0.00013580918312072754, 0.00016494840383529663, 0.00019408762454986572, 0.00022322684526443481, 0.0002523660659790039, 0.000281505286693573, 0.0003106445074081421, 0.0003397837281227112, 0.0003689229488372803, 0.00039806216955184937, 0.00042720139026641846, 0.00045634061098098755, 0.00048547983169555664, 0.0005146190524101257, 0.0005437582731246948, 0.0005728974938392639, 0.000602036714553833, 0.0006311759352684021, 0.0006603151559829712, 0.0006894543766975403, 0.0007185935974121094]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 13.0, 19.0, 32.0, 34.0, 45.0, 78.0, 110.0, 137.0, 146.0, 123.0, 83.0, 43.0, 41.0, 28.0, 20.0, 18.0, 5.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2351741790771484e-05, -2.124626189470291e-05, -2.014078199863434e-05, -1.9035302102565765e-05, -1.7929822206497192e-05, -1.682434231042862e-05, -1.5718862414360046e-05, -1.4613382518291473e-05, -1.35079026222229e-05, -1.2402422726154327e-05, -1.1296942830085754e-05, -1.0191462934017181e-05, -9.085983037948608e-06, -7.980503141880035e-06, -6.875023245811462e-06, -5.769543349742889e-06, -4.664063453674316e-06, -3.5585835576057434e-06, -2.4531036615371704e-06, -1.3476237654685974e-06, -2.421438694000244e-07, 8.633360266685486e-07, 1.9688159227371216e-06, 3.0742958188056946e-06, 4.179775714874268e-06, 5.2852556109428406e-06, 6.3907355070114136e-06, 7.4962154030799866e-06, 8.60169529914856e-06, 9.707175195217133e-06, 1.0812655091285706e-05, 1.1918134987354279e-05, 1.3023614883422852e-05, 1.4129094779491425e-05, 1.5234574675559998e-05, 1.634005457162857e-05, 1.7445534467697144e-05, 1.8551014363765717e-05, 1.965649425983429e-05, 2.0761974155902863e-05, 2.1867454051971436e-05, 2.297293394804001e-05, 2.407841384410858e-05, 2.5183893740177155e-05, 2.6289373636245728e-05, 2.73948535323143e-05, 2.8500333428382874e-05, 2.9605813324451447e-05, 3.071129322052002e-05, 3.181677311658859e-05, 3.2922253012657166e-05, 3.402773290872574e-05, 3.513321280479431e-05, 3.6238692700862885e-05, 3.734417259693146e-05, 3.844965249300003e-05, 3.9555132389068604e-05, 4.0660612285137177e-05, 4.176609218120575e-05, 4.287157207727432e-05, 4.3977051973342896e-05, 4.508253186941147e-05, 4.618801176548004e-05, 4.7293491661548615e-05, 4.839897155761719e-05]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 10.0, 11.0, 14.0, 21.0, 36.0, 40.0, 74.0, 91.0, 113.0, 190.0, 248.0, 459.0, 658.0, 995.0, 1740.0, 3029.0, 5570.0, 11069.0, 23614.0, 57414.0, 198845.0, 553929.0, 114063.0, 39947.0, 17180.0, 8395.0, 4512.0, 2300.0, 1422.0, 881.0, 550.0, 377.0, 237.0, 145.0, 110.0, 71.0, 61.0, 32.0, 22.0, 20.0, 12.0, 20.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001900196075439453, -0.00018330663442611694, -0.00017659366130828857, -0.0001698806881904602, -0.00016316771507263184, -0.00015645474195480347, -0.0001497417688369751, -0.00014302879571914673, -0.00013631582260131836, -0.00012960284948349, -0.00012288987636566162, -0.00011617690324783325, -0.00010946393013000488, -0.00010275095701217651, -9.603798389434814e-05, -8.932501077651978e-05, -8.26120376586914e-05, -7.589906454086304e-05, -6.918609142303467e-05, -6.24731183052063e-05, -5.576014518737793e-05, -4.904717206954956e-05, -4.233419895172119e-05, -3.562122583389282e-05, -2.8908252716064453e-05, -2.2195279598236084e-05, -1.5482306480407715e-05, -8.769333362579346e-06, -2.0563602447509766e-06, 4.656612873077393e-06, 1.1369585990905762e-05, 1.808255910873413e-05, 2.47955322265625e-05, 3.150850534439087e-05, 3.822147846221924e-05, 4.493445158004761e-05, 5.1647424697875977e-05, 5.8360397815704346e-05, 6.507337093353271e-05, 7.178634405136108e-05, 7.849931716918945e-05, 8.521229028701782e-05, 9.192526340484619e-05, 9.863823652267456e-05, 0.00010535120964050293, 0.0001120641827583313, 0.00011877715587615967, 0.00012549012899398804, 0.0001322031021118164, 0.00013891607522964478, 0.00014562904834747314, 0.00015234202146530151, 0.00015905499458312988, 0.00016576796770095825, 0.00017248094081878662, 0.000179193913936615, 0.00018590688705444336, 0.00019261986017227173, 0.0001993328332901001, 0.00020604580640792847, 0.00021275877952575684, 0.0002194717526435852, 0.00022618472576141357, 0.00023289769887924194, 0.0002396106719970703]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 3.0, 13.0, 3.0, 17.0, 14.0, 26.0, 33.0, 40.0, 36.0, 46.0, 47.0, 50.0, 75.0, 64.0, 59.0, 61.0, 56.0, 58.0, 46.0, 36.0, 44.0, 33.0, 27.0, 24.0, 22.0, 15.0, 8.0, 8.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.834766387939453e-05, -9.435229003429413e-05, -9.035691618919373e-05, -8.636154234409332e-05, -8.236616849899292e-05, -7.837079465389252e-05, -7.437542080879211e-05, -7.038004696369171e-05, -6.638467311859131e-05, -6.23892992734909e-05, -5.83939254283905e-05, -5.43985515832901e-05, -5.04031777381897e-05, -4.6407803893089294e-05, -4.241243004798889e-05, -3.841705620288849e-05, -3.4421682357788086e-05, -3.0426308512687683e-05, -2.643093466758728e-05, -2.2435560822486877e-05, -1.8440186977386475e-05, -1.4444813132286072e-05, -1.0449439287185669e-05, -6.454065442085266e-06, -2.4586915969848633e-06, 1.5366822481155396e-06, 5.532056093215942e-06, 9.527429938316345e-06, 1.3522803783416748e-05, 1.751817762851715e-05, 2.1513551473617554e-05, 2.5508925318717957e-05, 2.950429916381836e-05, 3.349967300891876e-05, 3.7495046854019165e-05, 4.149042069911957e-05, 4.548579454421997e-05, 4.9481168389320374e-05, 5.3476542234420776e-05, 5.747191607952118e-05, 6.146728992462158e-05, 6.546266376972198e-05, 6.945803761482239e-05, 7.345341145992279e-05, 7.74487853050232e-05, 8.14441591501236e-05, 8.5439532995224e-05, 8.94349068403244e-05, 9.34302806854248e-05, 9.742565453052521e-05, 0.00010142102837562561, 0.00010541640222072601, 0.00010941177606582642, 0.00011340714991092682, 0.00011740252375602722, 0.00012139789760112762, 0.00012539327144622803, 0.00012938864529132843, 0.00013338401913642883, 0.00013737939298152924, 0.00014137476682662964, 0.00014537014067173004, 0.00014936551451683044, 0.00015336088836193085, 0.00015735626220703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 15.0, 9.0, 15.0, 27.0, 25.0, 45.0, 41.0, 53.0, 70.0, 97.0, 103.0, 155.0, 194.0, 278.0, 352.0, 522.0, 724.0, 1059.0, 1504.0, 2226.0, 3386.0, 5995.0, 16144.0, 966849.0, 28919.0, 7720.0, 3889.0, 2356.0, 1598.0, 1119.0, 776.0, 583.0, 404.0, 306.0, 210.0, 167.0, 141.0, 88.0, 77.0, 72.0, 53.0, 33.0, 34.0, 22.0, 25.0, 24.0, 10.0, 3.0, 4.0, 8.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0006885528564453125, -0.000666789710521698, -0.0006450265645980835, -0.000623263418674469, -0.0006015002727508545, -0.00057973712682724, -0.0005579739809036255, -0.000536210834980011, -0.0005144476890563965, -0.000492684543132782, -0.0004709213972091675, -0.000449158251285553, -0.0004273951053619385, -0.000405631959438324, -0.00038386881351470947, -0.00036210566759109497, -0.00034034252166748047, -0.00031857937574386597, -0.00029681622982025146, -0.00027505308389663696, -0.00025328993797302246, -0.00023152679204940796, -0.00020976364612579346, -0.00018800050020217896, -0.00016623735427856445, -0.00014447420835494995, -0.00012271106243133545, -0.00010094791650772095, -7.918477058410645e-05, -5.742162466049194e-05, -3.565847873687744e-05, -1.389533281326294e-05, 7.867813110351562e-06, 2.9630959033966064e-05, 5.1394104957580566e-05, 7.315725088119507e-05, 9.492039680480957e-05, 0.00011668354272842407, 0.00013844668865203857, 0.00016020983457565308, 0.00018197298049926758, 0.00020373612642288208, 0.00022549927234649658, 0.0002472624182701111, 0.0002690255641937256, 0.0002907887101173401, 0.0003125518560409546, 0.0003343150019645691, 0.0003560781478881836, 0.0003778412938117981, 0.0003996044397354126, 0.0004213675856590271, 0.0004431307315826416, 0.0004648938775062561, 0.0004866570234298706, 0.0005084201693534851, 0.0005301833152770996, 0.0005519464612007141, 0.0005737096071243286, 0.0005954727530479431, 0.0006172358989715576, 0.0006389990448951721, 0.0006607621908187866, 0.0006825253367424011, 0.0007042884826660156]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 8.0, 12.0, 13.0, 9.0, 16.0, 20.0, 20.0, 19.0, 25.0, 29.0, 39.0, 52.0, 45.0, 90.0, 123.0, 93.0, 59.0, 48.0, 36.0, 25.0, 40.0, 19.0, 22.0, 18.0, 10.0, 14.0, 19.0, 13.0, 10.0, 8.0, 7.0, 5.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09808349609375e-05, -2.029910683631897e-05, -1.961737871170044e-05, -1.893565058708191e-05, -1.825392246246338e-05, -1.757219433784485e-05, -1.689046621322632e-05, -1.6208738088607788e-05, -1.5527009963989258e-05, -1.4845281839370728e-05, -1.4163553714752197e-05, -1.3481825590133667e-05, -1.2800097465515137e-05, -1.2118369340896606e-05, -1.1436641216278076e-05, -1.0754913091659546e-05, -1.0073184967041016e-05, -9.391456842422485e-06, -8.709728717803955e-06, -8.028000593185425e-06, -7.3462724685668945e-06, -6.664544343948364e-06, -5.982816219329834e-06, -5.301088094711304e-06, -4.6193599700927734e-06, -3.937631845474243e-06, -3.255903720855713e-06, -2.5741755962371826e-06, -1.8924474716186523e-06, -1.210719347000122e-06, -5.289912223815918e-07, 1.5273690223693848e-07, 8.344650268554688e-07, 1.516193151473999e-06, 2.1979212760925293e-06, 2.8796494007110596e-06, 3.56137752532959e-06, 4.24310564994812e-06, 4.92483377456665e-06, 5.606561899185181e-06, 6.288290023803711e-06, 6.970018148422241e-06, 7.651746273040771e-06, 8.333474397659302e-06, 9.015202522277832e-06, 9.696930646896362e-06, 1.0378658771514893e-05, 1.1060386896133423e-05, 1.1742115020751953e-05, 1.2423843145370483e-05, 1.3105571269989014e-05, 1.3787299394607544e-05, 1.4469027519226074e-05, 1.5150755643844604e-05, 1.5832483768463135e-05, 1.6514211893081665e-05, 1.7195940017700195e-05, 1.7877668142318726e-05, 1.8559396266937256e-05, 1.9241124391555786e-05, 1.9922852516174316e-05, 2.0604580640792847e-05, 2.1286308765411377e-05, 2.1968036890029907e-05, 2.2649765014648438e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 6.0, 12.0, 14.0, 16.0, 23.0, 36.0, 26.0, 56.0, 81.0, 123.0, 143.0, 193.0, 270.0, 389.0, 555.0, 825.0, 1238.0, 2018.0, 3848.0, 9374.0, 32672.0, 520550.0, 425417.0, 31943.0, 9024.0, 3821.0, 1996.0, 1222.0, 775.0, 528.0, 378.0, 251.0, 197.0, 137.0, 101.0, 78.0, 55.0, 36.0, 38.0, 22.0, 20.0, 10.0, 13.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00012576580047607422, -0.00012195296585559845, -0.00011814013123512268, -0.00011432729661464691, -0.00011051446199417114, -0.00010670162737369537, -0.0001028887927532196, -9.907595813274384e-05, -9.526312351226807e-05, -9.14502888917923e-05, -8.763745427131653e-05, -8.382461965084076e-05, -8.001178503036499e-05, -7.619895040988922e-05, -7.238611578941345e-05, -6.857328116893768e-05, -6.476044654846191e-05, -6.0947611927986145e-05, -5.7134777307510376e-05, -5.332194268703461e-05, -4.950910806655884e-05, -4.569627344608307e-05, -4.18834388256073e-05, -3.807060420513153e-05, -3.425776958465576e-05, -3.0444934964179993e-05, -2.6632100343704224e-05, -2.2819265723228455e-05, -1.9006431102752686e-05, -1.5193596482276917e-05, -1.1380761861801147e-05, -7.567927241325378e-06, -3.7550926208496094e-06, 5.774199962615967e-08, 3.870576620101929e-06, 7.683411240577698e-06, 1.1496245861053467e-05, 1.5309080481529236e-05, 1.9121915102005005e-05, 2.2934749722480774e-05, 2.6747584342956543e-05, 3.056041896343231e-05, 3.437325358390808e-05, 3.818608820438385e-05, 4.199892282485962e-05, 4.581175744533539e-05, 4.962459206581116e-05, 5.3437426686286926e-05, 5.7250261306762695e-05, 6.106309592723846e-05, 6.487593054771423e-05, 6.868876516819e-05, 7.250159978866577e-05, 7.631443440914154e-05, 8.012726902961731e-05, 8.394010365009308e-05, 8.775293827056885e-05, 9.156577289104462e-05, 9.537860751152039e-05, 9.919144213199615e-05, 0.00010300427675247192, 0.00010681711137294769, 0.00011062994599342346, 0.00011444278061389923, 0.000118255615234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 8.0, 9.0, 17.0, 31.0, 40.0, 56.0, 107.0, 151.0, 283.0, 111.0, 59.0, 48.0, 29.0, 13.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.077787399291992e-05, -8.833594620227814e-05, -8.589401841163635e-05, -8.345209062099457e-05, -8.101016283035278e-05, -7.8568235039711e-05, -7.612630724906921e-05, -7.368437945842743e-05, -7.124245166778564e-05, -6.880052387714386e-05, -6.635859608650208e-05, -6.391666829586029e-05, -6.14747405052185e-05, -5.903281271457672e-05, -5.6590884923934937e-05, -5.414895713329315e-05, -5.170702934265137e-05, -4.926510155200958e-05, -4.68231737613678e-05, -4.438124597072601e-05, -4.193931818008423e-05, -3.9497390389442444e-05, -3.705546259880066e-05, -3.4613534808158875e-05, -3.217160701751709e-05, -2.9729679226875305e-05, -2.728775143623352e-05, -2.4845823645591736e-05, -2.240389585494995e-05, -1.9961968064308167e-05, -1.7520040273666382e-05, -1.5078112483024597e-05, -1.2636184692382812e-05, -1.0194256901741028e-05, -7.752329111099243e-06, -5.3104013204574585e-06, -2.868473529815674e-06, -4.2654573917388916e-07, 2.0153820514678955e-06, 4.45730984210968e-06, 6.899237632751465e-06, 9.34116542339325e-06, 1.1783093214035034e-05, 1.4225021004676819e-05, 1.6666948795318604e-05, 1.9108876585960388e-05, 2.1550804376602173e-05, 2.3992732167243958e-05, 2.6434659957885742e-05, 2.8876587748527527e-05, 3.131851553916931e-05, 3.3760443329811096e-05, 3.620237112045288e-05, 3.8644298911094666e-05, 4.108622670173645e-05, 4.3528154492378235e-05, 4.597008228302002e-05, 4.8412010073661804e-05, 5.085393786430359e-05, 5.3295865654945374e-05, 5.573779344558716e-05, 5.817972123622894e-05, 6.062164902687073e-05, 6.306357681751251e-05, 6.55055046081543e-05]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 13.0, 23.0, 25.0, 47.0, 81.0, 126.0, 160.0, 226.0, 169.0, 64.0, 24.0, 13.0, 11.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004188497085124254, -0.004004727583378553, -0.003820958314463496, -0.003637189045548439, -0.003453419543802738, -0.0032696500420570374, -0.00308588077314198, -0.002902111504226923, -0.002718342002481222, -0.0025345725007355213, -0.002350803231820464, -0.002167033962905407, -0.001983264461159706, -0.001799495075829327, -0.001615725690498948, -0.001431956305168569, -0.00124818691983819, -0.001064417534507811, -0.0008806481491774321, -0.000696878763847053, -0.000513109378516674, -0.00032933999318629503, -0.00014557060785591602, 3.8198777474462986e-05, 0.000221968162804842, 0.000405737548135221, 0.0005895069334656, 0.000773276318795979, 0.000957045704126358, 0.001140815089456737, 0.001324584474787116, 0.001508353860117495, 0.0016921237111091614, 0.0018758930964395404, 0.0020596624817699194, 0.0022434317506849766, 0.0024272012524306774, 0.0026109707541763783, 0.0027947400230914354, 0.0029785092920064926, 0.0031622787937521935, 0.0033460482954978943, 0.0035298175644129515, 0.0037135868333280087, 0.0038973563350737095, 0.00408112583681941, 0.004264894872903824, 0.004448664374649525, 0.0046324338763952255, 0.004816203378140926, 0.004999972879886627, 0.005183741915971041, 0.0053675114177167416, 0.005551280919462442, 0.005735049955546856, 0.005918819457292557, 0.006102588959038258, 0.0062863584607839584, 0.006470127962529659, 0.006653896998614073, 0.006837666500359774, 0.0070214360021054745, 0.007205205038189888, 0.007388974539935589, 0.00757274404168129]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 11.0, 20.0, 21.0, 26.0, 20.0, 26.0, 25.0, 23.0, 25.0, 23.0, 23.0, 28.0, 26.0, 31.0, 28.0, 28.0, 27.0, 17.0, 23.0, 23.0, 27.0, 26.0, 23.0, 25.0, 27.0, 30.0, 27.0, 28.0, 27.0, 30.0, 26.0, 28.0, 21.0, 33.0, 13.0, 17.0, 21.0, 20.0, 14.0, 13.0, 11.0, 7.0, 7.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0010091662406921387, -0.0009783729910850525, -0.0009475797414779663, -0.0009167864918708801, -0.0008859932422637939, -0.0008551999926567078, -0.0008244067430496216, -0.0007936134934425354, -0.0007628202438354492, -0.000732026994228363, -0.0007012337446212769, -0.0006704404950141907, -0.0006396472454071045, -0.0006088539958000183, -0.0005780607461929321, -0.000547267496585846, -0.0005164742469787598, -0.0004856809973716736, -0.0004548877477645874, -0.0004240944981575012, -0.00039330124855041504, -0.00036250799894332886, -0.0003317147493362427, -0.0003009214997291565, -0.0002701282501220703, -0.00023933500051498413, -0.00020854175090789795, -0.00017774850130081177, -0.00014695525169372559, -0.0001161620020866394, -8.536875247955322e-05, -5.457550287246704e-05, -2.378225326538086e-05, 7.010996341705322e-06, 3.7804245948791504e-05, 6.859749555587769e-05, 9.939074516296387e-05, 0.00013018399477005005, 0.00016097724437713623, 0.0001917704939842224, 0.0002225637435913086, 0.0002533569931983948, 0.00028415024280548096, 0.00031494349241256714, 0.0003457367420196533, 0.0003765299916267395, 0.0004073232412338257, 0.00043811649084091187, 0.00046890974044799805, 0.0004997029900550842, 0.0005304962396621704, 0.0005612894892692566, 0.0005920827388763428, 0.000622875988483429, 0.0006536692380905151, 0.0006844624876976013, 0.0007152557373046875, 0.0007460489869117737, 0.0007768422365188599, 0.000807635486125946, 0.0008384287357330322, 0.0008692219853401184, 0.0009000152349472046, 0.0009308084845542908, 0.000961601734161377]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 20.0, 34.0, 53.0, 103.0, 193.0, 536.0, 1699.0, 7442.0, 66476.0, 4032928.0, 72129.0, 9047.0, 2162.0, 756.0, 333.0, 149.0, 72.0, 40.0, 32.0, 18.0, 11.0, 10.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008907318115234375, -0.0008543878793716431, -0.0008180439472198486, -0.0007817000150680542, -0.0007453560829162598, -0.0007090121507644653, -0.0006726682186126709, -0.0006363242864608765, -0.000599980354309082, -0.0005636364221572876, -0.0005272924900054932, -0.0004909485578536987, -0.0004546046257019043, -0.00041826069355010986, -0.00038191676139831543, -0.000345572829246521, -0.00030922889709472656, -0.00027288496494293213, -0.0002365410327911377, -0.00020019710063934326, -0.00016385316848754883, -0.0001275092363357544, -9.116530418395996e-05, -5.482137203216553e-05, -1.8477439880371094e-05, 1.786649227142334e-05, 5.4210424423217773e-05, 9.055435657501221e-05, 0.00012689828872680664, 0.00016324222087860107, 0.0001995861530303955, 0.00023593008518218994, 0.0002722740173339844, 0.0003086179494857788, 0.00034496188163757324, 0.0003813058137893677, 0.0004176497459411621, 0.00045399367809295654, 0.000490337610244751, 0.0005266815423965454, 0.0005630254745483398, 0.0005993694067001343, 0.0006357133388519287, 0.0006720572710037231, 0.0007084012031555176, 0.000744745135307312, 0.0007810890674591064, 0.0008174329996109009, 0.0008537769317626953, 0.0008901208639144897, 0.0009264647960662842, 0.0009628087282180786, 0.000999152660369873, 0.0010354965925216675, 0.001071840524673462, 0.0011081844568252563, 0.0011445283889770508, 0.0011808723211288452, 0.0012172162532806396, 0.001253560185432434, 0.0012899041175842285, 0.001326248049736023, 0.0013625919818878174, 0.0013989359140396118, 0.0014352798461914062]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 13.0, 13.0, 16.0, 28.0, 31.0, 53.0, 61.0, 90.0, 99.0, 111.0, 117.0, 92.0, 73.0, 43.0, 33.0, 34.0, 19.0, 19.0, 8.0, 9.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4378299713134766e-05, -2.3392029106616974e-05, -2.2405758500099182e-05, -2.141948789358139e-05, -2.04332172870636e-05, -1.9446946680545807e-05, -1.8460676074028015e-05, -1.7474405467510223e-05, -1.648813486099243e-05, -1.550186425447464e-05, -1.4515593647956848e-05, -1.3529323041439056e-05, -1.2543052434921265e-05, -1.1556781828403473e-05, -1.0570511221885681e-05, -9.58424061536789e-06, -8.597970008850098e-06, -7.611699402332306e-06, -6.625428795814514e-06, -5.639158189296722e-06, -4.652887582778931e-06, -3.666616976261139e-06, -2.680346369743347e-06, -1.6940757632255554e-06, -7.078051567077637e-07, 2.784654498100281e-07, 1.2647360563278198e-06, 2.2510066628456116e-06, 3.2372772693634033e-06, 4.223547875881195e-06, 5.209818482398987e-06, 6.1960890889167786e-06, 7.18235969543457e-06, 8.168630301952362e-06, 9.154900908470154e-06, 1.0141171514987946e-05, 1.1127442121505737e-05, 1.2113712728023529e-05, 1.309998333454132e-05, 1.4086253941059113e-05, 1.5072524547576904e-05, 1.6058795154094696e-05, 1.7045065760612488e-05, 1.803133636713028e-05, 1.901760697364807e-05, 2.0003877580165863e-05, 2.0990148186683655e-05, 2.1976418793201447e-05, 2.2962689399719238e-05, 2.394896000623703e-05, 2.4935230612754822e-05, 2.5921501219272614e-05, 2.6907771825790405e-05, 2.7894042432308197e-05, 2.888031303882599e-05, 2.986658364534378e-05, 3.085285425186157e-05, 3.1839124858379364e-05, 3.2825395464897156e-05, 3.381166607141495e-05, 3.479793667793274e-05, 3.578420728445053e-05, 3.677047789096832e-05, 3.7756748497486115e-05, 3.8743019104003906e-05]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 28.0, 23.0, 49.0, 65.0, 131.0, 201.0, 350.0, 596.0, 1132.0, 1926.0, 3562.0, 7086.0, 14365.0, 33308.0, 93724.0, 773365.0, 3082818.0, 110849.0, 38314.0, 16057.0, 7650.0, 3836.0, 2052.0, 1139.0, 636.0, 383.0, 207.0, 141.0, 87.0, 59.0, 35.0, 25.0, 13.0, 8.0, 13.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002613067626953125, -0.0002534054219722748, -0.00024550408124923706, -0.00023760274052619934, -0.00022970139980316162, -0.0002218000590801239, -0.00021389871835708618, -0.00020599737763404846, -0.00019809603691101074, -0.00019019469618797302, -0.0001822933554649353, -0.00017439201474189758, -0.00016649067401885986, -0.00015858933329582214, -0.00015068799257278442, -0.0001427866518497467, -0.00013488531112670898, -0.00012698397040367126, -0.00011908262968063354, -0.00011118128895759583, -0.0001032799482345581, -9.537860751152039e-05, -8.747726678848267e-05, -7.957592606544495e-05, -7.167458534240723e-05, -6.377324461936951e-05, -5.587190389633179e-05, -4.797056317329407e-05, -4.006922245025635e-05, -3.216788172721863e-05, -2.4266541004180908e-05, -1.636520028114319e-05, -8.463859558105469e-06, -5.62518835067749e-07, 7.338821887969971e-06, 1.524016261100769e-05, 2.314150333404541e-05, 3.104284405708313e-05, 3.894418478012085e-05, 4.684552550315857e-05, 5.474686622619629e-05, 6.264820694923401e-05, 7.054954767227173e-05, 7.845088839530945e-05, 8.635222911834717e-05, 9.425356984138489e-05, 0.00010215491056442261, 0.00011005625128746033, 0.00011795759201049805, 0.00012585893273353577, 0.00013376027345657349, 0.0001416616141796112, 0.00014956295490264893, 0.00015746429562568665, 0.00016536563634872437, 0.00017326697707176208, 0.0001811683177947998, 0.00018906965851783752, 0.00019697099924087524, 0.00020487233996391296, 0.00021277368068695068, 0.0002206750214099884, 0.00022857636213302612, 0.00023647770285606384, 0.00024437904357910156]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 7.0, 4.0, 8.0, 9.0, 13.0, 9.0, 27.0, 33.0, 49.0, 43.0, 81.0, 135.0, 1063.0, 1729.0, 211.0, 125.0, 105.0, 83.0, 61.0, 64.0, 40.0, 40.0, 36.0, 26.0, 17.0, 17.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011074542999267578, -0.00010784156620502472, -0.00010493770241737366, -0.0001020338386297226, -9.912997484207153e-05, -9.622611105442047e-05, -9.332224726676941e-05, -9.041838347911835e-05, -8.751451969146729e-05, -8.461065590381622e-05, -8.170679211616516e-05, -7.88029283285141e-05, -7.589906454086304e-05, -7.299520075321198e-05, -7.009133696556091e-05, -6.718747317790985e-05, -6.428360939025879e-05, -6.137974560260773e-05, -5.8475881814956665e-05, -5.55720180273056e-05, -5.266815423965454e-05, -4.976429045200348e-05, -4.686042666435242e-05, -4.3956562876701355e-05, -4.105269908905029e-05, -3.814883530139923e-05, -3.524497151374817e-05, -3.234110772609711e-05, -2.9437243938446045e-05, -2.6533380150794983e-05, -2.362951636314392e-05, -2.072565257549286e-05, -1.7821788787841797e-05, -1.4917925000190735e-05, -1.2014061212539673e-05, -9.11019742488861e-06, -6.206333637237549e-06, -3.302469849586487e-06, -3.986060619354248e-07, 2.505257725715637e-06, 5.409121513366699e-06, 8.312985301017761e-06, 1.1216849088668823e-05, 1.4120712876319885e-05, 1.7024576663970947e-05, 1.992844045162201e-05, 2.283230423927307e-05, 2.5736168026924133e-05, 2.8640031814575195e-05, 3.154389560222626e-05, 3.444775938987732e-05, 3.735162317752838e-05, 4.025548696517944e-05, 4.3159350752830505e-05, 4.606321454048157e-05, 4.896707832813263e-05, 5.187094211578369e-05, 5.4774805903434753e-05, 5.7678669691085815e-05, 6.058253347873688e-05, 6.348639726638794e-05, 6.6390261054039e-05, 6.929412484169006e-05, 7.219798862934113e-05, 7.510185241699219e-05]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 17.0, 98.0, 624.0, 225.0, 47.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006768617313355207, -0.0005315033486112952, -0.00038614493678323925, -0.00024078652495518327, -9.542814223095775e-05, 4.9930240493267775e-05, 0.0001952886814251542, 0.00034064706414937973, 0.00048600544687360525, 0.0006313638295978308, 0.0007767222123220563, 0.0009220806532539427, 0.0010674390941858292, 0.0012127973604947329, 0.0013581558596342802, 0.0015035142423585057, 0.0016488726250827312, 0.0017942310078069568, 0.0019395893905311823, 0.0020849478896707296, 0.0022303061559796333, 0.0023756646551191807, 0.002521023154258728, 0.0026663814205676317, 0.0028117396868765354, 0.0029570981860160828, 0.0031024564523249865, 0.003247814951464534, 0.0033931732177734375, 0.003538531716912985, 0.003683890216052532, 0.003829248482361436, 0.00397460674867034, 0.004119965247809887, 0.004265323746949434, 0.004410681780427694, 0.004556040279567242, 0.004701398778706789, 0.004846757277846336, 0.004992115311324596, 0.005137473810464144, 0.005282832309603691, 0.0054281908087432384, 0.0055735488422214985, 0.005718907341361046, 0.005864265840500593, 0.0060096243396401405, 0.006154982373118401, 0.006300341337919235, 0.006445699837058783, 0.00659105833619833, 0.00673641636967659, 0.006881774868816137, 0.007027133367955685, 0.007172491867095232, 0.007317850366234779, 0.007463208399713039, 0.007608566898852587, 0.007753925397992134, 0.007899283431470394, 0.008044642396271229, 0.008190000429749489, 0.008335358463227749, 0.008480717428028584, 0.008626075461506844]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 19.0, 15.0, 34.0, 30.0, 22.0, 33.0, 38.0, 40.0, 46.0, 61.0, 55.0, 53.0, 55.0, 60.0, 43.0, 53.0, 49.0, 37.0, 39.0, 31.0, 45.0, 30.0, 20.0, 20.0, 11.0, 7.0, 6.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006406307220458984, -0.0006230268627405167, -0.0006054230034351349, -0.0005878191441297531, -0.0005702152848243713, -0.0005526114255189896, -0.0005350075662136078, -0.000517403706908226, -0.0004997998476028442, -0.00048219598829746246, -0.0004645921289920807, -0.0004469882696866989, -0.00042938441038131714, -0.00041178055107593536, -0.0003941766917705536, -0.0003765728324651718, -0.00035896897315979004, -0.00034136511385440826, -0.0003237612545490265, -0.0003061573952436447, -0.00028855353593826294, -0.00027094967663288116, -0.0002533458173274994, -0.00023574195802211761, -0.00021813809871673584, -0.00020053423941135406, -0.0001829303801059723, -0.00016532652080059052, -0.00014772266149520874, -0.00013011880218982697, -0.00011251494288444519, -9.491108357906342e-05, -7.730722427368164e-05, -5.9703364968299866e-05, -4.209950566291809e-05, -2.4495646357536316e-05, -6.891787052154541e-06, 1.0712072253227234e-05, 2.831593155860901e-05, 4.5919790863990784e-05, 6.352365016937256e-05, 8.112750947475433e-05, 9.873136878013611e-05, 0.00011633522808551788, 0.00013393908739089966, 0.00015154294669628143, 0.0001691468060016632, 0.00018675066530704498, 0.00020435452461242676, 0.00022195838391780853, 0.0002395622432231903, 0.0002571661025285721, 0.00027476996183395386, 0.00029237382113933563, 0.0003099776804447174, 0.0003275815397500992, 0.00034518539905548096, 0.00036278925836086273, 0.0003803931176662445, 0.0003979969769716263, 0.00041560083627700806, 0.00043320469558238983, 0.0004508085548877716, 0.0004684124141931534, 0.00048601627349853516]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 6.0, 11.0, 15.0, 13.0, 26.0, 14.0, 37.0, 50.0, 64.0, 76.0, 120.0, 178.0, 268.0, 499.0, 903.0, 1839.0, 3975.0, 10128.0, 30349.0, 128164.0, 696630.0, 127476.0, 29555.0, 9983.0, 4062.0, 1854.0, 911.0, 522.0, 291.0, 172.0, 105.0, 73.0, 52.0, 29.0, 27.0, 16.0, 17.0, 6.0, 14.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000469207763671875, -0.0004547685384750366, -0.00044032931327819824, -0.00042589008808135986, -0.0004114508628845215, -0.0003970116376876831, -0.0003825724124908447, -0.00036813318729400635, -0.00035369396209716797, -0.0003392547369003296, -0.0003248155117034912, -0.00031037628650665283, -0.00029593706130981445, -0.0002814978361129761, -0.0002670586109161377, -0.0002526193857192993, -0.00023818016052246094, -0.00022374093532562256, -0.00020930171012878418, -0.0001948624849319458, -0.00018042325973510742, -0.00016598403453826904, -0.00015154480934143066, -0.00013710558414459229, -0.0001226663589477539, -0.00010822713375091553, -9.378790855407715e-05, -7.934868335723877e-05, -6.490945816040039e-05, -5.047023296356201e-05, -3.603100776672363e-05, -2.1591782569885254e-05, -7.152557373046875e-06, 7.286667823791504e-06, 2.1725893020629883e-05, 3.616511821746826e-05, 5.060434341430664e-05, 6.504356861114502e-05, 7.94827938079834e-05, 9.392201900482178e-05, 0.00010836124420166016, 0.00012280046939849854, 0.00013723969459533691, 0.0001516789197921753, 0.00016611814498901367, 0.00018055737018585205, 0.00019499659538269043, 0.0002094358205795288, 0.0002238750457763672, 0.00023831427097320557, 0.00025275349617004395, 0.0002671927213668823, 0.0002816319465637207, 0.0002960711717605591, 0.00031051039695739746, 0.00032494962215423584, 0.0003393888473510742, 0.0003538280725479126, 0.000368267297744751, 0.00038270652294158936, 0.00039714574813842773, 0.0004115849733352661, 0.0004260241985321045, 0.00044046342372894287, 0.00045490264892578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 7.0, 9.0, 13.0, 20.0, 27.0, 29.0, 46.0, 77.0, 108.0, 114.0, 136.0, 98.0, 80.0, 52.0, 44.0, 43.0, 26.0, 20.0, 8.0, 10.0, 5.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1362677216529846e-05, -2.0254403352737427e-05, -1.9146129488945007e-05, -1.8037855625152588e-05, -1.692958176136017e-05, -1.582130789756775e-05, -1.471303403377533e-05, -1.360476016998291e-05, -1.249648630619049e-05, -1.1388212442398071e-05, -1.0279938578605652e-05, -9.171664714813232e-06, -8.063390851020813e-06, -6.9551169872283936e-06, -5.846843123435974e-06, -4.738569259643555e-06, -3.6302953958511353e-06, -2.522021532058716e-06, -1.4137476682662964e-06, -3.0547380447387695e-07, 8.028000593185425e-07, 1.911073923110962e-06, 3.0193477869033813e-06, 4.127621650695801e-06, 5.23589551448822e-06, 6.34416937828064e-06, 7.452443242073059e-06, 8.560717105865479e-06, 9.668990969657898e-06, 1.0777264833450317e-05, 1.1885538697242737e-05, 1.2993812561035156e-05, 1.4102086424827576e-05, 1.5210360288619995e-05, 1.6318634152412415e-05, 1.7426908016204834e-05, 1.8535181879997253e-05, 1.9643455743789673e-05, 2.0751729607582092e-05, 2.1860003471374512e-05, 2.296827733516693e-05, 2.407655119895935e-05, 2.518482506275177e-05, 2.629309892654419e-05, 2.740137279033661e-05, 2.850964665412903e-05, 2.9617920517921448e-05, 3.072619438171387e-05, 3.183446824550629e-05, 3.2942742109298706e-05, 3.4051015973091125e-05, 3.5159289836883545e-05, 3.6267563700675964e-05, 3.7375837564468384e-05, 3.84841114282608e-05, 3.959238529205322e-05, 4.070065915584564e-05, 4.180893301963806e-05, 4.291720688343048e-05, 4.40254807472229e-05, 4.513375461101532e-05, 4.624202847480774e-05, 4.735030233860016e-05, 4.845857620239258e-05]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 8.0, 15.0, 10.0, 21.0, 15.0, 33.0, 76.0, 85.0, 128.0, 183.0, 304.0, 472.0, 818.0, 1382.0, 2355.0, 4269.0, 8196.0, 17162.0, 41400.0, 127098.0, 557742.0, 188944.0, 54501.0, 21560.0, 9949.0, 5077.0, 2762.0, 1512.0, 874.0, 571.0, 352.0, 234.0, 137.0, 93.0, 71.0, 36.0, 36.0, 21.0, 20.0, 11.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002205371856689453, -0.0002125576138496399, -0.00020457804203033447, -0.00019659847021102905, -0.00018861889839172363, -0.0001806393265724182, -0.0001726597547531128, -0.00016468018293380737, -0.00015670061111450195, -0.00014872103929519653, -0.0001407414674758911, -0.0001327618956565857, -0.00012478232383728027, -0.00011680275201797485, -0.00010882318019866943, -0.00010084360837936401, -9.28640365600586e-05, -8.488446474075317e-05, -7.690489292144775e-05, -6.892532110214233e-05, -6.0945749282836914e-05, -5.2966177463531494e-05, -4.4986605644226074e-05, -3.7007033824920654e-05, -2.9027462005615234e-05, -2.1047890186309814e-05, -1.3068318367004395e-05, -5.088746547698975e-06, 2.8908252716064453e-06, 1.0870397090911865e-05, 1.8849968910217285e-05, 2.6829540729522705e-05, 3.4809112548828125e-05, 4.2788684368133545e-05, 5.0768256187438965e-05, 5.8747828006744385e-05, 6.67273998260498e-05, 7.470697164535522e-05, 8.268654346466064e-05, 9.066611528396606e-05, 9.864568710327148e-05, 0.0001066252589225769, 0.00011460483074188232, 0.00012258440256118774, 0.00013056397438049316, 0.00013854354619979858, 0.000146523118019104, 0.00015450268983840942, 0.00016248226165771484, 0.00017046183347702026, 0.00017844140529632568, 0.0001864209771156311, 0.00019440054893493652, 0.00020238012075424194, 0.00021035969257354736, 0.00021833926439285278, 0.0002263188362121582, 0.00023429840803146362, 0.00024227797985076904, 0.00025025755167007446, 0.0002582371234893799, 0.0002662166953086853, 0.0002741962671279907, 0.00028217583894729614, 0.00029015541076660156]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 9.0, 6.0, 9.0, 13.0, 21.0, 18.0, 19.0, 19.0, 19.0, 21.0, 27.0, 39.0, 46.0, 43.0, 39.0, 43.0, 52.0, 41.0, 41.0, 33.0, 35.0, 49.0, 46.0, 37.0, 26.0, 29.0, 27.0, 31.0, 21.0, 22.0, 22.0, 9.0, 15.0, 8.0, 7.0, 9.0, 6.0, 7.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.894899368286133e-05, -5.679391324520111e-05, -5.4638832807540894e-05, -5.2483752369880676e-05, -5.032867193222046e-05, -4.817359149456024e-05, -4.6018511056900024e-05, -4.386343061923981e-05, -4.170835018157959e-05, -3.955326974391937e-05, -3.7398189306259155e-05, -3.524310886859894e-05, -3.308802843093872e-05, -3.0932947993278503e-05, -2.8777867555618286e-05, -2.662278711795807e-05, -2.446770668029785e-05, -2.2312626242637634e-05, -2.0157545804977417e-05, -1.80024653673172e-05, -1.5847384929656982e-05, -1.3692304491996765e-05, -1.1537224054336548e-05, -9.38214361667633e-06, -7.227063179016113e-06, -5.071982741355896e-06, -2.9169023036956787e-06, -7.618218660354614e-07, 1.3932585716247559e-06, 3.548339009284973e-06, 5.7034194469451904e-06, 7.858499884605408e-06, 1.0013580322265625e-05, 1.2168660759925842e-05, 1.432374119758606e-05, 1.6478821635246277e-05, 1.8633902072906494e-05, 2.078898251056671e-05, 2.294406294822693e-05, 2.5099143385887146e-05, 2.7254223823547363e-05, 2.940930426120758e-05, 3.15643846988678e-05, 3.3719465136528015e-05, 3.587454557418823e-05, 3.802962601184845e-05, 4.018470644950867e-05, 4.2339786887168884e-05, 4.44948673248291e-05, 4.664994776248932e-05, 4.8805028200149536e-05, 5.0960108637809753e-05, 5.311518907546997e-05, 5.527026951313019e-05, 5.7425349950790405e-05, 5.958043038845062e-05, 6.173551082611084e-05, 6.389059126377106e-05, 6.604567170143127e-05, 6.820075213909149e-05, 7.035583257675171e-05, 7.251091301441193e-05, 7.466599345207214e-05, 7.682107388973236e-05, 7.897615432739258e-05]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 20.0, 15.0, 19.0, 36.0, 44.0, 67.0, 120.0, 152.0, 209.0, 336.0, 524.0, 880.0, 1673.0, 3122.0, 7714.0, 22798.0, 139321.0, 785309.0, 60472.0, 14325.0, 5482.0, 2444.0, 1305.0, 728.0, 438.0, 313.0, 194.0, 134.0, 105.0, 59.0, 48.0, 40.0, 21.0, 15.0, 17.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036907196044921875, -0.00035728514194488525, -0.00034549832344055176, -0.00033371150493621826, -0.00032192468643188477, -0.00031013786792755127, -0.0002983510494232178, -0.0002865642309188843, -0.0002747774124145508, -0.0002629905939102173, -0.0002512037754058838, -0.0002394169569015503, -0.0002276301383972168, -0.0002158433198928833, -0.0002040565013885498, -0.0001922696828842163, -0.0001804828643798828, -0.00016869604587554932, -0.00015690922737121582, -0.00014512240886688232, -0.00013333559036254883, -0.00012154877185821533, -0.00010976195335388184, -9.797513484954834e-05, -8.618831634521484e-05, -7.440149784088135e-05, -6.261467933654785e-05, -5.0827860832214355e-05, -3.904104232788086e-05, -2.7254223823547363e-05, -1.5467405319213867e-05, -3.680586814880371e-06, 8.106231689453125e-06, 1.989305019378662e-05, 3.167986869812012e-05, 4.346668720245361e-05, 5.525350570678711e-05, 6.70403242111206e-05, 7.88271427154541e-05, 9.06139612197876e-05, 0.0001024007797241211, 0.00011418759822845459, 0.00012597441673278809, 0.00013776123523712158, 0.00014954805374145508, 0.00016133487224578857, 0.00017312169075012207, 0.00018490850925445557, 0.00019669532775878906, 0.00020848214626312256, 0.00022026896476745605, 0.00023205578327178955, 0.00024384260177612305, 0.00025562942028045654, 0.00026741623878479004, 0.00027920305728912354, 0.00029098987579345703, 0.00030277669429779053, 0.000314563512802124, 0.0003263503313064575, 0.000338137149810791, 0.0003499239683151245, 0.000361710786819458, 0.0003734976053237915, 0.000385284423828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 1.0, 5.0, 4.0, 7.0, 10.0, 23.0, 16.0, 19.0, 23.0, 29.0, 30.0, 61.0, 54.0, 125.0, 186.0, 101.0, 75.0, 39.0, 39.0, 26.0, 21.0, 21.0, 17.0, 9.0, 14.0, 6.0, 9.0, 9.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30805778503418e-05, -3.203004598617554e-05, -3.097951412200928e-05, -2.9928982257843018e-05, -2.8878450393676758e-05, -2.7827918529510498e-05, -2.6777386665344238e-05, -2.572685480117798e-05, -2.467632293701172e-05, -2.362579107284546e-05, -2.25752592086792e-05, -2.152472734451294e-05, -2.047419548034668e-05, -1.942366361618042e-05, -1.837313175201416e-05, -1.73225998878479e-05, -1.627206802368164e-05, -1.5221536159515381e-05, -1.4171004295349121e-05, -1.3120472431182861e-05, -1.2069940567016602e-05, -1.1019408702850342e-05, -9.968876838684082e-06, -8.918344974517822e-06, -7.867813110351562e-06, -6.817281246185303e-06, -5.766749382019043e-06, -4.716217517852783e-06, -3.6656856536865234e-06, -2.6151537895202637e-06, -1.564621925354004e-06, -5.140900611877441e-07, 5.364418029785156e-07, 1.5869736671447754e-06, 2.637505531311035e-06, 3.688037395477295e-06, 4.738569259643555e-06, 5.7891011238098145e-06, 6.839632987976074e-06, 7.890164852142334e-06, 8.940696716308594e-06, 9.991228580474854e-06, 1.1041760444641113e-05, 1.2092292308807373e-05, 1.3142824172973633e-05, 1.4193356037139893e-05, 1.5243887901306152e-05, 1.6294419765472412e-05, 1.7344951629638672e-05, 1.839548349380493e-05, 1.944601535797119e-05, 2.049654722213745e-05, 2.154707908630371e-05, 2.259761095046997e-05, 2.364814281463623e-05, 2.469867467880249e-05, 2.574920654296875e-05, 2.679973840713501e-05, 2.785027027130127e-05, 2.890080213546753e-05, 2.995133399963379e-05, 3.100186586380005e-05, 3.205239772796631e-05, 3.310292959213257e-05, 3.415346145629883e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 9.0, 9.0, 6.0, 18.0, 35.0, 34.0, 46.0, 46.0, 75.0, 115.0, 199.0, 256.0, 367.0, 583.0, 904.0, 1558.0, 2555.0, 4600.0, 8753.0, 18630.0, 47036.0, 187293.0, 627171.0, 89761.0, 30240.0, 12865.0, 6374.0, 3501.0, 2048.0, 1209.0, 761.0, 492.0, 311.0, 206.0, 146.0, 89.0, 75.0, 46.0, 28.0, 33.0, 18.0, 13.0, 8.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0001024007797241211, -9.922776371240616e-05, -9.605474770069122e-05, -9.288173168897629e-05, -8.970871567726135e-05, -8.653569966554642e-05, -8.336268365383148e-05, -8.018966764211655e-05, -7.701665163040161e-05, -7.384363561868668e-05, -7.067061960697174e-05, -6.74976035952568e-05, -6.432458758354187e-05, -6.115157157182693e-05, -5.7978555560112e-05, -5.4805539548397064e-05, -5.163252353668213e-05, -4.8459507524967194e-05, -4.528649151325226e-05, -4.211347550153732e-05, -3.894045948982239e-05, -3.576744347810745e-05, -3.259442746639252e-05, -2.9421411454677582e-05, -2.6248395442962646e-05, -2.307537943124771e-05, -1.9902363419532776e-05, -1.672934740781784e-05, -1.3556331396102905e-05, -1.038331538438797e-05, -7.210299372673035e-06, -4.037283360958099e-06, -8.642673492431641e-07, 2.3087486624717712e-06, 5.4817646741867065e-06, 8.654780685901642e-06, 1.1827796697616577e-05, 1.5000812709331512e-05, 1.8173828721046448e-05, 2.1346844732761383e-05, 2.451986074447632e-05, 2.7692876756191254e-05, 3.086589276790619e-05, 3.4038908779621124e-05, 3.721192479133606e-05, 4.0384940803050995e-05, 4.355795681476593e-05, 4.6730972826480865e-05, 4.99039888381958e-05, 5.3077004849910736e-05, 5.625002086162567e-05, 5.942303687334061e-05, 6.259605288505554e-05, 6.576906889677048e-05, 6.894208490848541e-05, 7.211510092020035e-05, 7.528811693191528e-05, 7.846113294363022e-05, 8.163414895534515e-05, 8.480716496706009e-05, 8.798018097877502e-05, 9.115319699048996e-05, 9.43262130022049e-05, 9.749922901391983e-05, 0.00010067224502563477]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 1.0, 7.0, 7.0, 4.0, 6.0, 6.0, 8.0, 14.0, 19.0, 10.0, 14.0, 19.0, 18.0, 23.0, 39.0, 38.0, 38.0, 40.0, 73.0, 78.0, 102.0, 76.0, 53.0, 37.0, 33.0, 41.0, 22.0, 27.0, 19.0, 17.0, 15.0, 14.0, 13.0, 12.0, 4.0, 9.0, 8.0, 11.0, 3.0, 7.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.9206275939941406e-05, -2.8304755687713623e-05, -2.740323543548584e-05, -2.6501715183258057e-05, -2.5600194931030273e-05, -2.469867467880249e-05, -2.3797154426574707e-05, -2.2895634174346924e-05, -2.199411392211914e-05, -2.1092593669891357e-05, -2.0191073417663574e-05, -1.928955316543579e-05, -1.8388032913208008e-05, -1.7486512660980225e-05, -1.658499240875244e-05, -1.5683472156524658e-05, -1.4781951904296875e-05, -1.3880431652069092e-05, -1.2978911399841309e-05, -1.2077391147613525e-05, -1.1175870895385742e-05, -1.0274350643157959e-05, -9.372830390930176e-06, -8.471310138702393e-06, -7.569789886474609e-06, -6.668269634246826e-06, -5.766749382019043e-06, -4.86522912979126e-06, -3.9637088775634766e-06, -3.0621886253356934e-06, -2.16066837310791e-06, -1.259148120880127e-06, -3.5762786865234375e-07, 5.438923835754395e-07, 1.4454126358032227e-06, 2.346932888031006e-06, 3.248453140258789e-06, 4.149973392486572e-06, 5.0514936447143555e-06, 5.953013896942139e-06, 6.854534149169922e-06, 7.756054401397705e-06, 8.657574653625488e-06, 9.559094905853271e-06, 1.0460615158081055e-05, 1.1362135410308838e-05, 1.2263655662536621e-05, 1.3165175914764404e-05, 1.4066696166992188e-05, 1.496821641921997e-05, 1.5869736671447754e-05, 1.6771256923675537e-05, 1.767277717590332e-05, 1.8574297428131104e-05, 1.9475817680358887e-05, 2.037733793258667e-05, 2.1278858184814453e-05, 2.2180378437042236e-05, 2.308189868927002e-05, 2.3983418941497803e-05, 2.4884939193725586e-05, 2.578645944595337e-05, 2.6687979698181152e-05, 2.7589499950408936e-05, 2.849102020263672e-05]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 6.0, 32.0, 83.0, 311.0, 465.0, 89.0, 19.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014379165368154645, -0.0012634414015337825, -0.0010889661498367786, -0.0009144910145550966, -0.0007400158792734146, -0.0005655407439917326, -0.00039106549229472876, -0.00021659035701304674, -4.211522173136473e-05, 0.00013235994265414774, 0.0003068351070396602, 0.00048131030052900314, 0.0006557854358106852, 0.0008302605710923672, 0.001004735822789371, 0.001179210958071053, 0.001353686093352735, 0.001528161228634417, 0.001702636480331421, 0.001877111615613103, 0.002051586750894785, 0.002226061886176467, 0.002400537021458149, 0.0025750123895704746, 0.002749487292021513, 0.002923962427303195, 0.003098437562584877, 0.0032729129306972027, 0.003447387833148241, 0.0036218632012605667, 0.0037963383365422487, 0.003970813471823931, 0.004145288839936256, 0.004319764208048582, 0.0044942391104996204, 0.004668714478611946, 0.0048431893810629845, 0.00501766474917531, 0.005192140117287636, 0.005366615019738674, 0.0055410899221897125, 0.005715565290302038, 0.0058900401927530766, 0.006064515560865402, 0.006238990463316441, 0.006413465831428766, 0.006587941199541092, 0.00676241610199213, 0.006936891470104456, 0.007111366838216782, 0.00728584174066782, 0.007460317108780146, 0.007634792011231184, 0.00780926737934351, 0.007983742281794548, 0.008158218115568161, 0.0083326930180192, 0.008507167920470238, 0.00868164375424385, 0.008856118656694889, 0.009030593559145927, 0.009205068461596966, 0.009379544295370579, 0.009554019197821617, 0.009728494100272655]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 17.0, 20.0, 18.0, 46.0, 35.0, 55.0, 61.0, 71.0, 84.0, 78.0, 76.0, 70.0, 73.0, 62.0, 56.0, 54.0, 32.0, 30.0, 28.0, 13.0, 12.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0016422271728515625, -0.001606806181371212, -0.0015713851898908615, -0.001535964198410511, -0.0015005432069301605, -0.00146512221544981, -0.0014297012239694595, -0.001394280232489109, -0.0013588592410087585, -0.001323438249528408, -0.0012880172580480576, -0.001252596266567707, -0.0012171752750873566, -0.001181754283607006, -0.0011463332921266556, -0.001110912300646305, -0.0010754913091659546, -0.001040070317685604, -0.0010046493262052536, -0.0009692283347249031, -0.0009338073432445526, -0.0008983863517642021, -0.0008629653602838516, -0.0008275443688035011, -0.0007921233773231506, -0.0007567023858428001, -0.0007212813943624496, -0.0006858604028820992, -0.0006504394114017487, -0.0006150184199213982, -0.0005795974284410477, -0.0005441764369606972, -0.0005087554454803467, -0.0004733344539999962, -0.0004379134625196457, -0.0004024924710392952, -0.0003670714795589447, -0.0003316504880785942, -0.0002962294965982437, -0.0002608085051178932, -0.00022538751363754272, -0.00018996652215719223, -0.00015454553067684174, -0.00011912453919649124, -8.370354771614075e-05, -4.828255623579025e-05, -1.2861564755439758e-05, 2.2559426724910736e-05, 5.798041820526123e-05, 9.340140968561172e-05, 0.00012882240116596222, 0.00016424339264631271, 0.0001996643841266632, 0.0002350853756070137, 0.0002705063670873642, 0.0003059273585677147, 0.0003413483500480652, 0.0003767693415284157, 0.0004121903330087662, 0.00044761132448911667, 0.00048303231596946716, 0.0005184533074498177, 0.0005538742989301682, 0.0005892952904105186, 0.0006247162818908691]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 14.0, 20.0, 44.0, 90.0, 185.0, 332.0, 649.0, 1484.0, 3502.0, 9681.0, 31949.0, 175841.0, 3785128.0, 143010.0, 27851.0, 8401.0, 3162.0, 1270.0, 619.0, 321.0, 173.0, 130.0, 91.0, 71.0, 59.0, 47.0, 33.0, 33.0, 24.0, 18.0, 11.0, 10.0, 7.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037169456481933594, -0.0003543831408023834, -0.0003370717167854309, -0.0003197602927684784, -0.0003024488687515259, -0.00028513744473457336, -0.00026782602071762085, -0.00025051459670066833, -0.00023320317268371582, -0.0002158917486667633, -0.0001985803246498108, -0.00018126890063285828, -0.00016395747661590576, -0.00014664605259895325, -0.00012933462858200073, -0.00011202320456504822, -9.47117805480957e-05, -7.740035653114319e-05, -6.0088932514190674e-05, -4.277750849723816e-05, -2.5466084480285645e-05, -8.15466046333313e-06, 9.156763553619385e-06, 2.64681875705719e-05, 4.3779611587524414e-05, 6.109103560447693e-05, 7.840245962142944e-05, 9.571388363838196e-05, 0.00011302530765533447, 0.000130336731672287, 0.0001476481556892395, 0.00016495957970619202, 0.00018227100372314453, 0.00019958242774009705, 0.00021689385175704956, 0.00023420527577400208, 0.0002515166997909546, 0.0002688281238079071, 0.0002861395478248596, 0.00030345097184181213, 0.00032076239585876465, 0.00033807381987571716, 0.0003553852438926697, 0.0003726966679096222, 0.0003900080919265747, 0.0004073195159435272, 0.00042463093996047974, 0.00044194236397743225, 0.00045925378799438477, 0.0004765652120113373, 0.0004938766360282898, 0.0005111880600452423, 0.0005284994840621948, 0.0005458109080791473, 0.0005631223320960999, 0.0005804337561130524, 0.0005977451801300049, 0.0006150566041469574, 0.0006323680281639099, 0.0006496794521808624, 0.0006669908761978149, 0.0006843023002147675, 0.00070161372423172, 0.0007189251482486725, 0.000736236572265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 10.0, 9.0, 12.0, 14.0, 21.0, 39.0, 49.0, 88.0, 132.0, 116.0, 139.0, 127.0, 74.0, 56.0, 35.0, 29.0, 17.0, 8.0, 8.0, 5.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.538040280342102e-05, -2.411752939224243e-05, -2.2854655981063843e-05, -2.1591782569885254e-05, -2.0328909158706665e-05, -1.9066035747528076e-05, -1.7803162336349487e-05, -1.65402889251709e-05, -1.527741551399231e-05, -1.401454210281372e-05, -1.2751668691635132e-05, -1.1488795280456543e-05, -1.0225921869277954e-05, -8.963048458099365e-06, -7.700175046920776e-06, -6.4373016357421875e-06, -5.174428224563599e-06, -3.91155481338501e-06, -2.648681402206421e-06, -1.385807991027832e-06, -1.2293457984924316e-07, 1.1399388313293457e-06, 2.4028122425079346e-06, 3.6656856536865234e-06, 4.928559064865112e-06, 6.191432476043701e-06, 7.45430588722229e-06, 8.717179298400879e-06, 9.980052709579468e-06, 1.1242926120758057e-05, 1.2505799531936646e-05, 1.3768672943115234e-05, 1.5031546354293823e-05, 1.6294419765472412e-05, 1.7557293176651e-05, 1.882016658782959e-05, 2.008303999900818e-05, 2.1345913410186768e-05, 2.2608786821365356e-05, 2.3871660232543945e-05, 2.5134533643722534e-05, 2.6397407054901123e-05, 2.7660280466079712e-05, 2.89231538772583e-05, 3.018602728843689e-05, 3.144890069961548e-05, 3.271177411079407e-05, 3.3974647521972656e-05, 3.5237520933151245e-05, 3.6500394344329834e-05, 3.776326775550842e-05, 3.902614116668701e-05, 4.02890145778656e-05, 4.155188798904419e-05, 4.281476140022278e-05, 4.407763481140137e-05, 4.5340508222579956e-05, 4.6603381633758545e-05, 4.7866255044937134e-05, 4.912912845611572e-05, 5.039200186729431e-05, 5.16548752784729e-05, 5.291774868965149e-05, 5.418062210083008e-05]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 14.0, 14.0, 29.0, 37.0, 57.0, 84.0, 137.0, 257.0, 486.0, 839.0, 1870.0, 3944.0, 9792.0, 28646.0, 111797.0, 3254919.0, 666726.0, 78477.0, 21712.0, 7960.0, 3273.0, 1444.0, 770.0, 391.0, 230.0, 137.0, 78.0, 43.0, 37.0, 25.0, 8.0, 7.0, 10.0, 8.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003521442413330078, -0.0003407411277294159, -0.000329338014125824, -0.00031793490052223206, -0.00030653178691864014, -0.0002951286733150482, -0.0002837255597114563, -0.0002723224461078644, -0.00026091933250427246, -0.00024951621890068054, -0.00023811310529708862, -0.0002267099916934967, -0.00021530687808990479, -0.00020390376448631287, -0.00019250065088272095, -0.00018109753727912903, -0.0001696944236755371, -0.0001582913100719452, -0.00014688819646835327, -0.00013548508286476135, -0.00012408196926116943, -0.00011267885565757751, -0.0001012757420539856, -8.987262845039368e-05, -7.846951484680176e-05, -6.706640124320984e-05, -5.566328763961792e-05, -4.4260174036026e-05, -3.285706043243408e-05, -2.1453946828842163e-05, -1.0050833225250244e-05, 1.3522803783416748e-06, 1.2755393981933594e-05, 2.4158507585525513e-05, 3.556162118911743e-05, 4.696473479270935e-05, 5.836784839630127e-05, 6.977096199989319e-05, 8.117407560348511e-05, 9.257718920707703e-05, 0.00010398030281066895, 0.00011538341641426086, 0.00012678653001785278, 0.0001381896436214447, 0.00014959275722503662, 0.00016099587082862854, 0.00017239898443222046, 0.00018380209803581238, 0.0001952052116394043, 0.00020660832524299622, 0.00021801143884658813, 0.00022941455245018005, 0.00024081766605377197, 0.0002522207796573639, 0.0002636238932609558, 0.00027502700686454773, 0.00028643012046813965, 0.00029783323407173157, 0.0003092363476753235, 0.0003206394612789154, 0.0003320425748825073, 0.00034344568848609924, 0.00035484880208969116, 0.0003662519156932831, 0.000377655029296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 10.0, 10.0, 5.0, 13.0, 21.0, 17.0, 35.0, 39.0, 55.0, 82.0, 116.0, 191.0, 463.0, 1891.0, 395.0, 153.0, 126.0, 115.0, 92.0, 60.0, 50.0, 41.0, 29.0, 15.0, 15.0, 12.0, 9.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00013303756713867188, -0.00012975279241800308, -0.0001264680176973343, -0.0001231832429766655, -0.0001198984682559967, -0.00011661369353532791, -0.00011332891881465912, -0.00011004414409399033, -0.00010675936937332153, -0.00010347459465265274, -0.00010018981993198395, -9.690504521131516e-05, -9.362027049064636e-05, -9.033549576997757e-05, -8.705072104930878e-05, -8.376594632863998e-05, -8.048117160797119e-05, -7.71963968873024e-05, -7.39116221666336e-05, -7.062684744596481e-05, -6.734207272529602e-05, -6.405729800462723e-05, -6.0772523283958435e-05, -5.748774856328964e-05, -5.420297384262085e-05, -5.091819912195206e-05, -4.7633424401283264e-05, -4.434864968061447e-05, -4.106387495994568e-05, -3.7779100239276886e-05, -3.449432551860809e-05, -3.12095507979393e-05, -2.7924776077270508e-05, -2.4640001356601715e-05, -2.1355226635932922e-05, -1.807045191526413e-05, -1.4785677194595337e-05, -1.1500902473926544e-05, -8.216127753257751e-06, -4.931353032588959e-06, -1.646578311920166e-06, 1.6381964087486267e-06, 4.9229711294174194e-06, 8.207745850086212e-06, 1.1492520570755005e-05, 1.4777295291423798e-05, 1.806207001209259e-05, 2.1346844732761383e-05, 2.4631619453430176e-05, 2.791639417409897e-05, 3.120116889476776e-05, 3.4485943615436554e-05, 3.777071833610535e-05, 4.105549305677414e-05, 4.434026777744293e-05, 4.7625042498111725e-05, 5.090981721878052e-05, 5.419459193944931e-05, 5.74793666601181e-05, 6.0764141380786896e-05, 6.404891610145569e-05, 6.733369082212448e-05, 7.061846554279327e-05, 7.390324026346207e-05, 7.718801498413086e-05]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 12.0, 43.0, 213.0, 493.0, 161.0, 60.0, 16.0, 13.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000394349277485162, -0.00030173323466442525, -0.00020911717729177326, -0.00011650111991912127, -2.38850770983845e-05, 6.873096572235227e-05, 0.0001613470376469195, 0.0002539630513638258, 0.000346579123288393, 0.0004391951661091298, 0.0005318112089298666, 0.0006244272808544338, 0.0007170432945713401, 0.0008096593664959073, 0.0009022754384204745, 0.00099489139392972, 0.0010875074658542871, 0.0011801235377788544, 0.0012727396097034216, 0.0013653556816279888, 0.0014579716371372342, 0.0015505877090618014, 0.0016432037809863687, 0.001735819736495614, 0.001828435924835503, 0.0019210519967600703, 0.0020136679522693157, 0.002106284024193883, 0.00219890009611845, 0.0022915161680430174, 0.0023841322399675846, 0.002476748311892152, 0.0025693641509860754, 0.0026619802229106426, 0.00275459629483521, 0.002847212366759777, 0.0029398284386843443, 0.0030324445106089115, 0.003125060349702835, 0.0032176764216274023, 0.0033102924935519695, 0.0034029085654765368, 0.003495524637401104, 0.003588140709325671, 0.0036807567812502384, 0.003773372620344162, 0.003865988925099373, 0.003958604764193296, 0.004051221068948507, 0.004143836908042431, 0.004236453212797642, 0.004329069051891565, 0.004421685356646776, 0.0045143011957407, 0.004606917500495911, 0.004699533339589834, 0.004792149178683758, 0.004884765017777681, 0.004977381322532892, 0.005069997161626816, 0.005162613466382027, 0.00525522930547595, 0.005347845610231161, 0.005440461449325085, 0.0055330777540802956]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 10.0, 12.0, 10.0, 19.0, 22.0, 26.0, 31.0, 51.0, 54.0, 53.0, 48.0, 58.0, 56.0, 75.0, 71.0, 54.0, 44.0, 58.0, 45.0, 39.0, 36.0, 40.0, 23.0, 20.0, 15.0, 6.0, 11.0, 7.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000633537769317627, -0.0006163548678159714, -0.0005991719663143158, -0.0005819890648126602, -0.0005648061633110046, -0.0005476232618093491, -0.0005304403603076935, -0.0005132574588060379, -0.0004960745573043823, -0.00047889165580272675, -0.00046170875430107117, -0.0004445258527994156, -0.00042734295129776, -0.00041016004979610443, -0.00039297714829444885, -0.0003757942467927933, -0.0003586113452911377, -0.0003414284437894821, -0.00032424554228782654, -0.00030706264078617096, -0.0002898797392845154, -0.0002726968377828598, -0.0002555139362812042, -0.00023833103477954865, -0.00022114813327789307, -0.0002039652317762375, -0.0001867823302745819, -0.00016959942877292633, -0.00015241652727127075, -0.00013523362576961517, -0.0001180507242679596, -0.00010086782276630402, -8.368492126464844e-05, -6.650201976299286e-05, -4.931911826133728e-05, -3.21362167596817e-05, -1.4953315258026123e-05, 2.2295862436294556e-06, 1.9412487745285034e-05, 3.659538924694061e-05, 5.377829074859619e-05, 7.096119225025177e-05, 8.814409375190735e-05, 0.00010532699525356293, 0.0001225098967552185, 0.00013969279825687408, 0.00015687569975852966, 0.00017405860126018524, 0.00019124150276184082, 0.0002084244042634964, 0.00022560730576515198, 0.00024279020726680756, 0.00025997310876846313, 0.0002771560102701187, 0.0002943389117717743, 0.00031152181327342987, 0.00032870471477508545, 0.00034588761627674103, 0.0003630705177783966, 0.0003802534192800522, 0.00039743632078170776, 0.00041461922228336334, 0.0004318021237850189, 0.0004489850252866745, 0.0004661679267883301]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 16.0, 3.0, 20.0, 27.0, 29.0, 48.0, 58.0, 118.0, 179.0, 271.0, 444.0, 752.0, 1271.0, 2190.0, 4481.0, 9735.0, 25490.0, 75943.0, 423206.0, 387218.0, 73946.0, 23934.0, 9675.0, 4194.0, 2208.0, 1208.0, 704.0, 415.0, 259.0, 174.0, 108.0, 71.0, 54.0, 41.0, 17.0, 15.0, 12.0, 10.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002319812774658203, -0.0002253502607345581, -0.0002187192440032959, -0.0002120882272720337, -0.00020545721054077148, -0.00019882619380950928, -0.00019219517707824707, -0.00018556416034698486, -0.00017893314361572266, -0.00017230212688446045, -0.00016567111015319824, -0.00015904009342193604, -0.00015240907669067383, -0.00014577805995941162, -0.00013914704322814941, -0.0001325160264968872, -0.000125885009765625, -0.00011925399303436279, -0.00011262297630310059, -0.00010599195957183838, -9.936094284057617e-05, -9.272992610931396e-05, -8.609890937805176e-05, -7.946789264678955e-05, -7.283687591552734e-05, -6.620585918426514e-05, -5.957484245300293e-05, -5.294382572174072e-05, -4.6312808990478516e-05, -3.968179225921631e-05, -3.30507755279541e-05, -2.6419758796691895e-05, -1.9788742065429688e-05, -1.315772533416748e-05, -6.5267086029052734e-06, 1.043081283569336e-07, 6.735324859619141e-06, 1.3366341590881348e-05, 1.9997358322143555e-05, 2.6628375053405762e-05, 3.325939178466797e-05, 3.9890408515930176e-05, 4.652142524719238e-05, 5.315244197845459e-05, 5.97834587097168e-05, 6.6414475440979e-05, 7.304549217224121e-05, 7.967650890350342e-05, 8.630752563476562e-05, 9.293854236602783e-05, 9.956955909729004e-05, 0.00010620057582855225, 0.00011283159255981445, 0.00011946260929107666, 0.00012609362602233887, 0.00013272464275360107, 0.00013935565948486328, 0.0001459866762161255, 0.0001526176929473877, 0.0001592487096786499, 0.0001658797264099121, 0.00017251074314117432, 0.00017914175987243652, 0.00018577277660369873, 0.00019240379333496094]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 6.0, 11.0, 10.0, 8.0, 21.0, 18.0, 44.0, 37.0, 55.0, 62.0, 76.0, 111.0, 82.0, 100.0, 76.0, 64.0, 56.0, 45.0, 30.0, 20.0, 19.0, 15.0, 14.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396106719970703e-05, -2.3093074560165405e-05, -2.222508192062378e-05, -2.1357089281082153e-05, -2.0489096641540527e-05, -1.96211040019989e-05, -1.8753111362457275e-05, -1.788511872291565e-05, -1.7017126083374023e-05, -1.6149133443832397e-05, -1.528114080429077e-05, -1.4413148164749146e-05, -1.354515552520752e-05, -1.2677162885665894e-05, -1.1809170246124268e-05, -1.0941177606582642e-05, -1.0073184967041016e-05, -9.20519232749939e-06, -8.337199687957764e-06, -7.469207048416138e-06, -6.601214408874512e-06, -5.733221769332886e-06, -4.86522912979126e-06, -3.997236490249634e-06, -3.129243850708008e-06, -2.261251211166382e-06, -1.3932585716247559e-06, -5.252659320831299e-07, 3.427267074584961e-07, 1.210719347000122e-06, 2.078711986541748e-06, 2.946704626083374e-06, 3.814697265625e-06, 4.682689905166626e-06, 5.550682544708252e-06, 6.418675184249878e-06, 7.286667823791504e-06, 8.15466046333313e-06, 9.022653102874756e-06, 9.890645742416382e-06, 1.0758638381958008e-05, 1.1626631021499634e-05, 1.249462366104126e-05, 1.3362616300582886e-05, 1.4230608940124512e-05, 1.5098601579666138e-05, 1.5966594219207764e-05, 1.683458685874939e-05, 1.7702579498291016e-05, 1.857057213783264e-05, 1.9438564777374268e-05, 2.0306557416915894e-05, 2.117455005645752e-05, 2.2042542695999146e-05, 2.291053533554077e-05, 2.3778527975082397e-05, 2.4646520614624023e-05, 2.551451325416565e-05, 2.6382505893707275e-05, 2.72504985332489e-05, 2.8118491172790527e-05, 2.8986483812332153e-05, 2.985447645187378e-05, 3.0722469091415405e-05, 3.159046173095703e-05]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 11.0, 9.0, 20.0, 22.0, 26.0, 44.0, 64.0, 95.0, 166.0, 255.0, 457.0, 691.0, 1223.0, 2189.0, 4231.0, 8102.0, 17121.0, 36240.0, 91453.0, 300483.0, 399399.0, 106355.0, 41619.0, 19021.0, 8876.0, 4590.0, 2510.0, 1268.0, 774.0, 462.0, 272.0, 181.0, 108.0, 69.0, 51.0, 27.0, 18.0, 21.0, 8.0, 13.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00014793872833251953, -0.00014359690248966217, -0.0001392550766468048, -0.00013491325080394745, -0.0001305714249610901, -0.00012622959911823273, -0.00012188777327537537, -0.000117545947432518, -0.00011320412158966064, -0.00010886229574680328, -0.00010452046990394592, -0.00010017864406108856, -9.58368182182312e-05, -9.149499237537384e-05, -8.715316653251648e-05, -8.281134068965912e-05, -7.846951484680176e-05, -7.41276890039444e-05, -6.978586316108704e-05, -6.544403731822968e-05, -6.110221147537231e-05, -5.6760385632514954e-05, -5.241855978965759e-05, -4.807673394680023e-05, -4.373490810394287e-05, -3.939308226108551e-05, -3.505125641822815e-05, -3.070943057537079e-05, -2.6367604732513428e-05, -2.2025778889656067e-05, -1.7683953046798706e-05, -1.3342127203941345e-05, -9.000301361083984e-06, -4.6584755182266235e-06, -3.166496753692627e-07, 4.025176167488098e-06, 8.367002010345459e-06, 1.270882785320282e-05, 1.705065369606018e-05, 2.139247953891754e-05, 2.5734305381774902e-05, 3.0076131224632263e-05, 3.4417957067489624e-05, 3.8759782910346985e-05, 4.3101608753204346e-05, 4.7443434596061707e-05, 5.178526043891907e-05, 5.612708628177643e-05, 6.046891212463379e-05, 6.481073796749115e-05, 6.915256381034851e-05, 7.349438965320587e-05, 7.783621549606323e-05, 8.21780413389206e-05, 8.651986718177795e-05, 9.086169302463531e-05, 9.520351886749268e-05, 9.954534471035004e-05, 0.0001038871705532074, 0.00010822899639606476, 0.00011257082223892212, 0.00011691264808177948, 0.00012125447392463684, 0.0001255962997674942, 0.00012993812561035156]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 15.0, 16.0, 25.0, 19.0, 23.0, 30.0, 27.0, 44.0, 47.0, 45.0, 59.0, 36.0, 59.0, 49.0, 51.0, 52.0, 50.0, 65.0, 37.0, 36.0, 36.0, 38.0, 20.0, 21.0, 19.0, 26.0, 12.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-05, -4.3502077460289e-05, -4.170462489128113e-05, -3.9907172322273254e-05, -3.810971975326538e-05, -3.631226718425751e-05, -3.4514814615249634e-05, -3.271736204624176e-05, -3.091990947723389e-05, -2.9122456908226013e-05, -2.732500433921814e-05, -2.5527551770210266e-05, -2.3730099201202393e-05, -2.193264663219452e-05, -2.0135194063186646e-05, -1.8337741494178772e-05, -1.65402889251709e-05, -1.4742836356163025e-05, -1.2945383787155151e-05, -1.1147931218147278e-05, -9.350478649139404e-06, -7.553026080131531e-06, -5.755573511123657e-06, -3.958120942115784e-06, -2.16066837310791e-06, -3.632158041000366e-07, 1.434236764907837e-06, 3.2316893339157104e-06, 5.029141902923584e-06, 6.8265944719314575e-06, 8.624047040939331e-06, 1.0421499609947205e-05, 1.2218952178955078e-05, 1.4016404747962952e-05, 1.5813857316970825e-05, 1.76113098859787e-05, 1.9408762454986572e-05, 2.1206215023994446e-05, 2.300366759300232e-05, 2.4801120162010193e-05, 2.6598572731018066e-05, 2.839602530002594e-05, 3.0193477869033813e-05, 3.199093043804169e-05, 3.378838300704956e-05, 3.5585835576057434e-05, 3.738328814506531e-05, 3.918074071407318e-05, 4.0978193283081055e-05, 4.277564585208893e-05, 4.45730984210968e-05, 4.6370550990104675e-05, 4.816800355911255e-05, 4.996545612812042e-05, 5.1762908697128296e-05, 5.356036126613617e-05, 5.535781383514404e-05, 5.7155266404151917e-05, 5.895271897315979e-05, 6.0750171542167664e-05, 6.254762411117554e-05, 6.434507668018341e-05, 6.614252924919128e-05, 6.793998181819916e-05, 6.973743438720703e-05]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 9.0, 4.0, 18.0, 19.0, 31.0, 19.0, 34.0, 35.0, 73.0, 93.0, 177.0, 233.0, 345.0, 539.0, 823.0, 1403.0, 2030.0, 3880.0, 7588.0, 17100.0, 47491.0, 255634.0, 589159.0, 76357.0, 22392.0, 10636.0, 5063.0, 2817.0, 1638.0, 1028.0, 616.0, 415.0, 258.0, 182.0, 122.0, 84.0, 56.0, 37.0, 37.0, 22.0, 13.0, 12.0, 11.0, 6.0, 6.0, 1.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.4139881134033203e-05, -2.3312866687774658e-05, -2.2485852241516113e-05, -2.165883779525757e-05, -2.0831823348999023e-05, -2.000480890274048e-05, -1.9177794456481934e-05, -1.835078001022339e-05, -1.7523765563964844e-05, -1.66967511177063e-05, -1.5869736671447754e-05, -1.5042722225189209e-05, -1.4215707778930664e-05, -1.3388693332672119e-05, -1.2561678886413574e-05, -1.173466444015503e-05, -1.0907649993896484e-05, -1.008063554763794e-05, -9.253621101379395e-06, -8.42660665512085e-06, -7.599592208862305e-06, -6.77257776260376e-06, -5.945563316345215e-06, -5.11854887008667e-06, -4.291534423828125e-06, -3.46451997756958e-06, -2.637505531311035e-06, -1.8104910850524902e-06, -9.834766387939453e-07, -1.564621925354004e-07, 6.705522537231445e-07, 1.4975666999816895e-06, 2.3245811462402344e-06, 3.1515955924987793e-06, 3.978610038757324e-06, 4.805624485015869e-06, 5.632638931274414e-06, 6.459653377532959e-06, 7.286667823791504e-06, 8.113682270050049e-06, 8.940696716308594e-06, 9.767711162567139e-06, 1.0594725608825684e-05, 1.1421740055084229e-05, 1.2248754501342773e-05, 1.3075768947601318e-05, 1.3902783393859863e-05, 1.4729797840118408e-05, 1.5556812286376953e-05, 1.6383826732635498e-05, 1.7210841178894043e-05, 1.8037855625152588e-05, 1.8864870071411133e-05, 1.9691884517669678e-05, 2.0518898963928223e-05, 2.1345913410186768e-05, 2.2172927856445312e-05, 2.2999942302703857e-05, 2.3826956748962402e-05, 2.4653971195220947e-05, 2.5480985641479492e-05, 2.6308000087738037e-05, 2.7135014533996582e-05, 2.7962028980255127e-05, 2.8789043426513672e-05]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 4.0, 5.0, 8.0, 12.0, 5.0, 8.0, 22.0, 22.0, 33.0, 43.0, 64.0, 96.0, 159.0, 162.0, 105.0, 74.0, 45.0, 22.0, 25.0, 16.0, 14.0, 4.0, 4.0, 12.0, 5.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.329183578491211e-05, -1.295190304517746e-05, -1.261197030544281e-05, -1.227203756570816e-05, -1.193210482597351e-05, -1.1592172086238861e-05, -1.1252239346504211e-05, -1.0912306606769562e-05, -1.0572373867034912e-05, -1.0232441127300262e-05, -9.892508387565613e-06, -9.552575647830963e-06, -9.212642908096313e-06, -8.872710168361664e-06, -8.532777428627014e-06, -8.192844688892365e-06, -7.852911949157715e-06, -7.512979209423065e-06, -7.1730464696884155e-06, -6.833113729953766e-06, -6.493180990219116e-06, -6.1532482504844666e-06, -5.813315510749817e-06, -5.473382771015167e-06, -5.133450031280518e-06, -4.793517291545868e-06, -4.453584551811218e-06, -4.113651812076569e-06, -3.773719072341919e-06, -3.4337863326072693e-06, -3.0938535928726196e-06, -2.75392085313797e-06, -2.4139881134033203e-06, -2.0740553736686707e-06, -1.734122633934021e-06, -1.3941898941993713e-06, -1.0542571544647217e-06, -7.14324414730072e-07, -3.7439167499542236e-07, -3.4458935260772705e-08, 3.0547380447387695e-07, 6.454065442085266e-07, 9.853392839431763e-07, 1.325272023677826e-06, 1.6652047634124756e-06, 2.0051375031471252e-06, 2.345070242881775e-06, 2.6850029826164246e-06, 3.0249357223510742e-06, 3.364868462085724e-06, 3.7048012018203735e-06, 4.044733941555023e-06, 4.384666681289673e-06, 4.7245994210243225e-06, 5.064532160758972e-06, 5.404464900493622e-06, 5.7443976402282715e-06, 6.084330379962921e-06, 6.424263119697571e-06, 6.7641958594322205e-06, 7.10412859916687e-06, 7.44406133890152e-06, 7.78399407863617e-06, 8.123926818370819e-06, 8.463859558105469e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 8.0, 6.0, 8.0, 12.0, 16.0, 29.0, 31.0, 38.0, 47.0, 70.0, 102.0, 137.0, 190.0, 284.0, 403.0, 641.0, 984.0, 1730.0, 3482.0, 9256.0, 32621.0, 653962.0, 303665.0, 25378.0, 7655.0, 3244.0, 1684.0, 970.0, 588.0, 375.0, 268.0, 178.0, 130.0, 86.0, 80.0, 52.0, 47.0, 20.0, 23.0, 12.0, 10.0, 12.0, 4.0, 3.0, 9.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.409385681152344e-05, -3.295484930276871e-05, -3.181584179401398e-05, -3.067683428525925e-05, -2.9537826776504517e-05, -2.8398819267749786e-05, -2.7259811758995056e-05, -2.6120804250240326e-05, -2.4981796741485596e-05, -2.3842789232730865e-05, -2.2703781723976135e-05, -2.1564774215221405e-05, -2.0425766706466675e-05, -1.9286759197711945e-05, -1.8147751688957214e-05, -1.7008744180202484e-05, -1.5869736671447754e-05, -1.4730729162693024e-05, -1.3591721653938293e-05, -1.2452714145183563e-05, -1.1313706636428833e-05, -1.0174699127674103e-05, -9.035691618919373e-06, -7.896684110164642e-06, -6.757676601409912e-06, -5.618669092655182e-06, -4.479661583900452e-06, -3.3406540751457214e-06, -2.201646566390991e-06, -1.062639057636261e-06, 7.636845111846924e-08, 1.2153759598731995e-06, 2.3543834686279297e-06, 3.49339097738266e-06, 4.63239848613739e-06, 5.77140599489212e-06, 6.910413503646851e-06, 8.04942101240158e-06, 9.188428521156311e-06, 1.0327436029911041e-05, 1.1466443538665771e-05, 1.2605451047420502e-05, 1.3744458556175232e-05, 1.4883466064929962e-05, 1.6022473573684692e-05, 1.7161481082439423e-05, 1.8300488591194153e-05, 1.9439496099948883e-05, 2.0578503608703613e-05, 2.1717511117458344e-05, 2.2856518626213074e-05, 2.3995526134967804e-05, 2.5134533643722534e-05, 2.6273541152477264e-05, 2.7412548661231995e-05, 2.8551556169986725e-05, 2.9690563678741455e-05, 3.0829571187496185e-05, 3.1968578696250916e-05, 3.3107586205005646e-05, 3.4246593713760376e-05, 3.5385601222515106e-05, 3.6524608731269836e-05, 3.766361624002457e-05, 3.88026237487793e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 11.0, 13.0, 26.0, 31.0, 54.0, 121.0, 231.0, 244.0, 108.0, 70.0, 27.0, 11.0, 12.0, 4.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.823902130126953e-05, -1.774728298187256e-05, -1.7255544662475586e-05, -1.6763806343078613e-05, -1.627206802368164e-05, -1.5780329704284668e-05, -1.5288591384887695e-05, -1.4796853065490723e-05, -1.430511474609375e-05, -1.3813376426696777e-05, -1.3321638107299805e-05, -1.2829899787902832e-05, -1.233816146850586e-05, -1.1846423149108887e-05, -1.1354684829711914e-05, -1.0862946510314941e-05, -1.0371208190917969e-05, -9.879469871520996e-06, -9.387731552124023e-06, -8.89599323272705e-06, -8.404254913330078e-06, -7.912516593933105e-06, -7.420778274536133e-06, -6.92903995513916e-06, -6.4373016357421875e-06, -5.945563316345215e-06, -5.453824996948242e-06, -4.9620866775512695e-06, -4.470348358154297e-06, -3.978610038757324e-06, -3.4868717193603516e-06, -2.995133399963379e-06, -2.5033950805664062e-06, -2.0116567611694336e-06, -1.519918441772461e-06, -1.0281801223754883e-06, -5.364418029785156e-07, -4.470348358154297e-08, 4.470348358154297e-07, 9.387731552124023e-07, 1.430511474609375e-06, 1.9222497940063477e-06, 2.4139881134033203e-06, 2.905726432800293e-06, 3.3974647521972656e-06, 3.889203071594238e-06, 4.380941390991211e-06, 4.872679710388184e-06, 5.364418029785156e-06, 5.856156349182129e-06, 6.3478946685791016e-06, 6.839632987976074e-06, 7.331371307373047e-06, 7.82310962677002e-06, 8.314847946166992e-06, 8.806586265563965e-06, 9.298324584960938e-06, 9.79006290435791e-06, 1.0281801223754883e-05, 1.0773539543151855e-05, 1.1265277862548828e-05, 1.17570161819458e-05, 1.2248754501342773e-05, 1.2740492820739746e-05, 1.3232231140136719e-05]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 13.0, 38.0, 131.0, 490.0, 201.0, 87.0, 25.0, 20.0, 6.0, 2.0, 1.0, 1.0], "bins": [-0.002239497611299157, -0.0021992502734065056, -0.0021590027026832104, -0.002118755364790559, -0.0020785080268979073, -0.002038260456174612, -0.0019980131182819605, -0.001957765780389309, -0.0019175182096660137, -0.0018772707553580403, -0.0018370234174653888, -0.0017967759631574154, -0.001756528508849442, -0.0017162810545414686, -0.001676033716648817, -0.0016357862623408437, -0.0015955389244481921, -0.0015552914701402187, -0.0015150441322475672, -0.0014747966779395938, -0.0014345492236316204, -0.0013943018857389688, -0.0013540544314309955, -0.001313806977123022, -0.0012735596392303705, -0.0012333121849223971, -0.0011930648470297456, -0.0011528173927217722, -0.0011125699384137988, -0.0010723224841058254, -0.0010320751462131739, -0.0009918276919052005, -0.0009515803540125489, -0.0009113329579122365, -0.0008710855036042631, -0.0008308381075039506, -0.0007905906531959772, -0.0007503432570956647, -0.0007100958609953523, -0.0006698484066873789, -0.0006296009523794055, -0.000589353556279093, -0.0005491061019711196, -0.0005088587058708072, -0.00046861128066666424, -0.0004283638554625213, -0.00038811645936220884, -0.0003478690341580659, -0.00030762163805775344, -0.0002673742128536105, -0.00022712680220138282, -0.00018687939154915512, -0.0001466319663450122, -0.00010638454114086926, -6.613713048864156e-05, -2.588971983641386e-05, 1.4357705367729068e-05, 5.460512329591438e-05, 9.48525412240997e-05, 0.0001350999518763274, 0.00017534737708047032, 0.00021559480228461325, 0.0002558422274887562, 0.00029608962358906865, 0.0003363370487932116]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 10.0, 12.0, 8.0, 11.0, 23.0, 23.0, 27.0, 29.0, 38.0, 53.0, 42.0, 60.0, 44.0, 57.0, 69.0, 50.0, 46.0, 54.0, 52.0, 42.0, 43.0, 37.0, 39.0, 29.0, 18.0, 24.0, 17.0, 16.0, 14.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021082162857055664, -0.00020285975188016891, -0.0001948978751897812, -0.00018693599849939346, -0.00017897412180900574, -0.000171012245118618, -0.00016305036842823029, -0.00015508849173784256, -0.00014712661504745483, -0.0001391647383570671, -0.00013120286166667938, -0.00012324098497629166, -0.00011527910828590393, -0.0001073172315955162, -9.935535490512848e-05, -9.139347821474075e-05, -8.343160152435303e-05, -7.54697248339653e-05, -6.750784814357758e-05, -5.954597145318985e-05, -5.1584094762802124e-05, -4.36222180724144e-05, -3.566034138202667e-05, -2.7698464691638947e-05, -1.973658800125122e-05, -1.1774711310863495e-05, -3.812834620475769e-06, 4.149042069911957e-06, 1.2110918760299683e-05, 2.007279545068741e-05, 2.8034672141075134e-05, 3.599654883146286e-05, 4.3958425521850586e-05, 5.192030221223831e-05, 5.988217890262604e-05, 6.784405559301376e-05, 7.580593228340149e-05, 8.376780897378922e-05, 9.172968566417694e-05, 9.969156235456467e-05, 0.00010765343904495239, 0.00011561531573534012, 0.00012357719242572784, 0.00013153906911611557, 0.0001395009458065033, 0.00014746282249689102, 0.00015542469918727875, 0.00016338657587766647, 0.0001713484525680542, 0.00017931032925844193, 0.00018727220594882965, 0.00019523408263921738, 0.0002031959593296051, 0.00021115783601999283, 0.00021911971271038055, 0.00022708158940076828, 0.000235043466091156, 0.00024300534278154373, 0.00025096721947193146, 0.0002589290961623192, 0.0002668909728527069, 0.00027485284954309464, 0.00028281472623348236, 0.0002907766029238701, 0.0002987384796142578]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 12.0, 24.0, 27.0, 60.0, 94.0, 163.0, 255.0, 476.0, 719.0, 1205.0, 1991.0, 3450.0, 6265.0, 12265.0, 26135.0, 62543.0, 198301.0, 3500875.0, 252326.0, 68951.0, 28593.0, 13257.0, 6601.0, 3438.0, 2070.0, 1252.0, 790.0, 524.0, 352.0, 310.0, 187.0, 166.0, 124.0, 94.0, 76.0, 75.0, 56.0, 45.0, 26.0, 28.0, 21.0, 14.0, 9.0, 10.0, 10.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00012540817260742188, -0.00012008845806121826, -0.00011476874351501465, -0.00010944902896881104, -0.00010412931442260742, -9.880959987640381e-05, -9.34898853302002e-05, -8.817017078399658e-05, -8.285045623779297e-05, -7.753074169158936e-05, -7.221102714538574e-05, -6.689131259918213e-05, -6.157159805297852e-05, -5.62518835067749e-05, -5.093216896057129e-05, -4.5612454414367676e-05, -4.029273986816406e-05, -3.497302532196045e-05, -2.9653310775756836e-05, -2.4333596229553223e-05, -1.901388168334961e-05, -1.3694167137145996e-05, -8.374452590942383e-06, -3.0547380447387695e-06, 2.2649765014648438e-06, 7.584691047668457e-06, 1.290440559387207e-05, 1.8224120140075684e-05, 2.3543834686279297e-05, 2.886354923248291e-05, 3.4183263778686523e-05, 3.950297832489014e-05, 4.482269287109375e-05, 5.014240741729736e-05, 5.5462121963500977e-05, 6.078183650970459e-05, 6.61015510559082e-05, 7.142126560211182e-05, 7.674098014831543e-05, 8.206069469451904e-05, 8.738040924072266e-05, 9.270012378692627e-05, 9.801983833312988e-05, 0.0001033395528793335, 0.00010865926742553711, 0.00011397898197174072, 0.00011929869651794434, 0.00012461841106414795, 0.00012993812561035156, 0.00013525784015655518, 0.0001405775547027588, 0.0001458972692489624, 0.00015121698379516602, 0.00015653669834136963, 0.00016185641288757324, 0.00016717612743377686, 0.00017249584197998047, 0.00017781555652618408, 0.0001831352710723877, 0.0001884549856185913, 0.00019377470016479492, 0.00019909441471099854, 0.00020441412925720215, 0.00020973384380340576, 0.00021505355834960938]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 7.0, 8.0, 16.0, 19.0, 20.0, 25.0, 53.0, 44.0, 74.0, 77.0, 99.0, 87.0, 92.0, 87.0, 67.0, 48.0, 43.0, 29.0, 29.0, 19.0, 13.0, 12.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1576881408691406e-05, -2.0663253962993622e-05, -1.9749626517295837e-05, -1.8835999071598053e-05, -1.792237162590027e-05, -1.7008744180202484e-05, -1.60951167345047e-05, -1.5181489288806915e-05, -1.4267861843109131e-05, -1.3354234397411346e-05, -1.2440606951713562e-05, -1.1526979506015778e-05, -1.0613352060317993e-05, -9.699724614620209e-06, -8.786097168922424e-06, -7.87246972322464e-06, -6.9588422775268555e-06, -6.045214831829071e-06, -5.131587386131287e-06, -4.217959940433502e-06, -3.3043324947357178e-06, -2.3907050490379333e-06, -1.477077603340149e-06, -5.634501576423645e-07, 3.501772880554199e-07, 1.2638047337532043e-06, 2.1774321794509888e-06, 3.091059625148773e-06, 4.004687070846558e-06, 4.918314516544342e-06, 5.8319419622421265e-06, 6.745569407939911e-06, 7.659196853637695e-06, 8.57282429933548e-06, 9.486451745033264e-06, 1.0400079190731049e-05, 1.1313706636428833e-05, 1.2227334082126617e-05, 1.3140961527824402e-05, 1.4054588973522186e-05, 1.496821641921997e-05, 1.5881843864917755e-05, 1.679547131061554e-05, 1.7709098756313324e-05, 1.862272620201111e-05, 1.9536353647708893e-05, 2.0449981093406677e-05, 2.136360853910446e-05, 2.2277235984802246e-05, 2.319086343050003e-05, 2.4104490876197815e-05, 2.50181183218956e-05, 2.5931745767593384e-05, 2.6845373213291168e-05, 2.7759000658988953e-05, 2.8672628104686737e-05, 2.958625555038452e-05, 3.0499882996082306e-05, 3.141351044178009e-05, 3.2327137887477875e-05, 3.324076533317566e-05, 3.4154392778873444e-05, 3.506802022457123e-05, 3.598164767026901e-05, 3.68952751159668e-05]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 20.0, 16.0, 16.0, 41.0, 73.0, 104.0, 227.0, 405.0, 794.0, 1825.0, 4422.0, 12097.0, 36583.0, 141018.0, 3043087.0, 811536.0, 98032.0, 27766.0, 9615.0, 3563.0, 1507.0, 699.0, 370.0, 170.0, 101.0, 65.0, 41.0, 21.0, 15.0, 17.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019478797912597656, -0.0001882687211036682, -0.00018174946308135986, -0.00017523020505905151, -0.00016871094703674316, -0.00016219168901443481, -0.00015567243099212646, -0.00014915317296981812, -0.00014263391494750977, -0.00013611465692520142, -0.00012959539890289307, -0.00012307614088058472, -0.00011655688285827637, -0.00011003762483596802, -0.00010351836681365967, -9.699910879135132e-05, -9.047985076904297e-05, -8.396059274673462e-05, -7.744133472442627e-05, -7.092207670211792e-05, -6.440281867980957e-05, -5.788356065750122e-05, -5.136430263519287e-05, -4.484504461288452e-05, -3.832578659057617e-05, -3.180652856826782e-05, -2.5287270545959473e-05, -1.8768012523651123e-05, -1.2248754501342773e-05, -5.729496479034424e-06, 7.897615432739258e-07, 7.309019565582275e-06, 1.3828277587890625e-05, 2.0347535610198975e-05, 2.6866793632507324e-05, 3.3386051654815674e-05, 3.9905309677124023e-05, 4.642456769943237e-05, 5.294382572174072e-05, 5.946308374404907e-05, 6.598234176635742e-05, 7.250159978866577e-05, 7.902085781097412e-05, 8.554011583328247e-05, 9.205937385559082e-05, 9.857863187789917e-05, 0.00010509788990020752, 0.00011161714792251587, 0.00011813640594482422, 0.00012465566396713257, 0.00013117492198944092, 0.00013769418001174927, 0.00014421343803405762, 0.00015073269605636597, 0.00015725195407867432, 0.00016377121210098267, 0.00017029047012329102, 0.00017680972814559937, 0.00018332898616790771, 0.00018984824419021606, 0.00019636750221252441, 0.00020288676023483276, 0.0002094060182571411, 0.00021592527627944946, 0.0002224445343017578]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 4.0, 15.0, 5.0, 21.0, 25.0, 31.0, 32.0, 46.0, 54.0, 79.0, 99.0, 111.0, 182.0, 296.0, 837.0, 1118.0, 347.0, 183.0, 118.0, 98.0, 59.0, 65.0, 41.0, 40.0, 27.0, 34.0, 33.0, 18.0, 17.0, 14.0, 8.0, 5.0, 9.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.543231964111328e-05, -5.314033478498459e-05, -5.0848349928855896e-05, -4.85563650727272e-05, -4.626438021659851e-05, -4.397239536046982e-05, -4.1680410504341125e-05, -3.938842564821243e-05, -3.709644079208374e-05, -3.480445593595505e-05, -3.2512471079826355e-05, -3.0220486223697662e-05, -2.792850136756897e-05, -2.5636516511440277e-05, -2.3344531655311584e-05, -2.1052546799182892e-05, -1.87605619430542e-05, -1.6468577086925507e-05, -1.4176592230796814e-05, -1.1884607374668121e-05, -9.592622518539429e-06, -7.300637662410736e-06, -5.0086528062820435e-06, -2.716667950153351e-06, -4.246830940246582e-07, 1.8673017621040344e-06, 4.159286618232727e-06, 6.45127147436142e-06, 8.743256330490112e-06, 1.1035241186618805e-05, 1.3327226042747498e-05, 1.561921089887619e-05, 1.7911195755004883e-05, 2.0203180611133575e-05, 2.2495165467262268e-05, 2.478715032339096e-05, 2.7079135179519653e-05, 2.9371120035648346e-05, 3.166310489177704e-05, 3.395508974790573e-05, 3.6247074604034424e-05, 3.8539059460163116e-05, 4.083104431629181e-05, 4.31230291724205e-05, 4.5415014028549194e-05, 4.770699888467789e-05, 4.999898374080658e-05, 5.229096859693527e-05, 5.4582953453063965e-05, 5.687493830919266e-05, 5.916692316532135e-05, 6.145890802145004e-05, 6.375089287757874e-05, 6.604287773370743e-05, 6.833486258983612e-05, 7.062684744596481e-05, 7.29188323020935e-05, 7.52108171582222e-05, 7.750280201435089e-05, 7.979478687047958e-05, 8.208677172660828e-05, 8.437875658273697e-05, 8.667074143886566e-05, 8.896272629499435e-05, 9.125471115112305e-05]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 15.0, 20.0, 49.0, 90.0, 264.0, 295.0, 118.0, 69.0, 30.0, 30.0, 13.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003115566505584866, -0.0002770348219200969, -0.00024251299328170717, -0.00020799115009140223, -0.00017346932145301253, -0.00013894749281462282, -0.00010442564962431788, -6.990382098592818e-05, -3.538199234753847e-05, -8.601600711699575e-07, 3.3661672205198556e-05, 6.818350811954588e-05, 0.00010270533675793558, 0.0001372271653963253, 0.00017174900858663023, 0.00020627083722501993, 0.00024079266586340964, 0.00027531449450179935, 0.00030983632314018905, 0.00034435815177857876, 0.0003788800095207989, 0.00041340180905535817, 0.00044792366679757833, 0.00048244549543596804, 0.0005169673240743577, 0.0005514891818165779, 0.0005860109813511372, 0.0006205328390933573, 0.0006550546386279166, 0.0006895764963701367, 0.000724098295904696, 0.0007586201536469162, 0.0007931420113891363, 0.0008276638691313565, 0.0008621856686659157, 0.0008967075264081359, 0.0009312293259426951, 0.0009657511836849153, 0.0010002730414271355, 0.0010347948409616947, 0.001069316640496254, 0.0011038384400308132, 0.0011383603559806943, 0.0011728821555152535, 0.0012074039550498128, 0.001241925754584372, 0.0012764476705342531, 0.0013109694700688124, 0.0013454912696033716, 0.0013800130691379309, 0.001414534985087812, 0.0014490567846223712, 0.0014835785841569304, 0.0015181003836914897, 0.0015526222996413708, 0.00158714409917593, 0.001621666015125811, 0.0016561878146603703, 0.0016907097306102514, 0.0017252315301448107, 0.00175975332967937, 0.0017942751292139292, 0.0018287970451638103, 0.0018633188446983695, 0.0018978406442329288]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 5.0, 16.0, 19.0, 19.0, 27.0, 24.0, 28.0, 48.0, 56.0, 57.0, 57.0, 79.0, 69.0, 51.0, 64.0, 49.0, 53.0, 49.0, 55.0, 45.0, 34.0, 27.0, 21.0, 12.0, 9.0, 11.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00034540891647338867, -0.00033328961580991745, -0.00032117031514644623, -0.000309051014482975, -0.0002969317138195038, -0.00028481241315603256, -0.00027269311249256134, -0.0002605738118290901, -0.0002484545111656189, -0.00023633521050214767, -0.00022421590983867645, -0.00021209660917520523, -0.000199977308511734, -0.0001878580078482628, -0.00017573870718479156, -0.00016361940652132034, -0.00015150010585784912, -0.0001393808051943779, -0.00012726150453090668, -0.00011514220386743546, -0.00010302290320396423, -9.090360254049301e-05, -7.878430187702179e-05, -6.666500121355057e-05, -5.4545700550079346e-05, -4.2426399886608124e-05, -3.0307099223136902e-05, -1.818779855966568e-05, -6.068497896194458e-06, 6.050802767276764e-06, 1.8170103430747986e-05, 3.0289404094219208e-05, 4.240870475769043e-05, 5.452800542116165e-05, 6.664730608463287e-05, 7.87666067481041e-05, 9.088590741157532e-05, 0.00010300520807504654, 0.00011512450873851776, 0.00012724380940198898, 0.0001393631100654602, 0.00015148241072893143, 0.00016360171139240265, 0.00017572101205587387, 0.0001878403127193451, 0.00019995961338281631, 0.00021207891404628754, 0.00022419821470975876, 0.00023631751537322998, 0.0002484368160367012, 0.0002605561167001724, 0.00027267541736364365, 0.00028479471802711487, 0.0002969140186905861, 0.0003090333193540573, 0.00032115262001752853, 0.00033327192068099976, 0.000345391221344471, 0.0003575105220079422, 0.0003696298226714134, 0.00038174912333488464, 0.00039386842399835587, 0.0004059877246618271, 0.0004181070253252983, 0.00043022632598876953]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 9.0, 15.0, 19.0, 22.0, 37.0, 53.0, 74.0, 152.0, 226.0, 344.0, 698.0, 1290.0, 2416.0, 4866.0, 11393.0, 32935.0, 133655.0, 673445.0, 132265.0, 33198.0, 11350.0, 4735.0, 2415.0, 1307.0, 664.0, 341.0, 216.0, 136.0, 86.0, 60.0, 39.0, 29.0, 17.0, 9.0, 11.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002906322479248047, -0.0002819560468196869, -0.0002732798457145691, -0.0002646036446094513, -0.0002559274435043335, -0.0002472512423992157, -0.0002385750412940979, -0.0002298988401889801, -0.0002212226390838623, -0.0002125464379787445, -0.0002038702368736267, -0.0001951940357685089, -0.0001865178346633911, -0.00017784163355827332, -0.00016916543245315552, -0.00016048923134803772, -0.00015181303024291992, -0.00014313682913780212, -0.00013446062803268433, -0.00012578442692756653, -0.00011710822582244873, -0.00010843202471733093, -9.975582361221313e-05, -9.107962250709534e-05, -8.240342140197754e-05, -7.372722029685974e-05, -6.505101919174194e-05, -5.6374818086624146e-05, -4.769861698150635e-05, -3.902241587638855e-05, -3.0346214771270752e-05, -2.1670013666152954e-05, -1.2993812561035156e-05, -4.317611455917358e-06, 4.3585896492004395e-06, 1.3034790754318237e-05, 2.1710991859436035e-05, 3.0387192964553833e-05, 3.906339406967163e-05, 4.773959517478943e-05, 5.6415796279907227e-05, 6.509199738502502e-05, 7.376819849014282e-05, 8.244439959526062e-05, 9.112060070037842e-05, 9.979680180549622e-05, 0.00010847300291061401, 0.00011714920401573181, 0.0001258254051208496, 0.0001345016062259674, 0.0001431778073310852, 0.000151854008436203, 0.0001605302095413208, 0.0001692064106464386, 0.0001778826117515564, 0.0001865588128566742, 0.000195235013961792, 0.0002039112150669098, 0.0002125874161720276, 0.00022126361727714539, 0.00022993981838226318, 0.00023861601948738098, 0.0002472922205924988, 0.0002559684216976166, 0.0002646446228027344]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 5.0, 14.0, 7.0, 18.0, 29.0, 44.0, 46.0, 70.0, 72.0, 103.0, 104.0, 120.0, 102.0, 65.0, 45.0, 39.0, 37.0, 18.0, 15.0, 6.0, 4.0, 6.0, 2.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7298927307128906e-05, -2.63117253780365e-05, -2.5324523448944092e-05, -2.4337321519851685e-05, -2.3350119590759277e-05, -2.236291766166687e-05, -2.1375715732574463e-05, -2.0388513803482056e-05, -1.940131187438965e-05, -1.841410994529724e-05, -1.7426908016204834e-05, -1.6439706087112427e-05, -1.545250415802002e-05, -1.4465302228927612e-05, -1.3478100299835205e-05, -1.2490898370742798e-05, -1.150369644165039e-05, -1.0516494512557983e-05, -9.529292583465576e-06, -8.542090654373169e-06, -7.554888725280762e-06, -6.5676867961883545e-06, -5.580484867095947e-06, -4.59328293800354e-06, -3.606081008911133e-06, -2.6188790798187256e-06, -1.6316771507263184e-06, -6.444752216339111e-07, 3.427267074584961e-07, 1.3299286365509033e-06, 2.3171305656433105e-06, 3.3043324947357178e-06, 4.291534423828125e-06, 5.278736352920532e-06, 6.2659382820129395e-06, 7.253140211105347e-06, 8.240342140197754e-06, 9.227544069290161e-06, 1.0214745998382568e-05, 1.1201947927474976e-05, 1.2189149856567383e-05, 1.317635178565979e-05, 1.4163553714752197e-05, 1.5150755643844604e-05, 1.6137957572937012e-05, 1.712515950202942e-05, 1.8112361431121826e-05, 1.9099563360214233e-05, 2.008676528930664e-05, 2.1073967218399048e-05, 2.2061169147491455e-05, 2.3048371076583862e-05, 2.403557300567627e-05, 2.5022774934768677e-05, 2.6009976863861084e-05, 2.699717879295349e-05, 2.79843807220459e-05, 2.8971582651138306e-05, 2.9958784580230713e-05, 3.094598650932312e-05, 3.193318843841553e-05, 3.2920390367507935e-05, 3.390759229660034e-05, 3.489479422569275e-05, 3.5881996154785156e-05]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 6.0, 12.0, 11.0, 12.0, 24.0, 40.0, 33.0, 66.0, 69.0, 107.0, 166.0, 235.0, 351.0, 492.0, 760.0, 1057.0, 1664.0, 2617.0, 4086.0, 6736.0, 10721.0, 18394.0, 31662.0, 59642.0, 115900.0, 343182.0, 236164.0, 95337.0, 49987.0, 27223.0, 15928.0, 9469.0, 5779.0, 3657.0, 2305.0, 1525.0, 994.0, 654.0, 456.0, 304.0, 224.0, 135.0, 109.0, 78.0, 45.0, 36.0, 27.0, 25.0, 17.0, 11.0, 11.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.00010281801223754883, -9.968969970941544e-05, -9.656138718128204e-05, -9.343307465314865e-05, -9.030476212501526e-05, -8.717644959688187e-05, -8.404813706874847e-05, -8.091982454061508e-05, -7.779151201248169e-05, -7.46631994843483e-05, -7.15348869562149e-05, -6.840657442808151e-05, -6.527826189994812e-05, -6.214994937181473e-05, -5.9021636843681335e-05, -5.589332431554794e-05, -5.276501178741455e-05, -4.963669925928116e-05, -4.6508386731147766e-05, -4.3380074203014374e-05, -4.025176167488098e-05, -3.712344914674759e-05, -3.39951366186142e-05, -3.0866824090480804e-05, -2.7738511562347412e-05, -2.461019903421402e-05, -2.1481886506080627e-05, -1.8353573977947235e-05, -1.5225261449813843e-05, -1.209694892168045e-05, -8.968636393547058e-06, -5.840323865413666e-06, -2.7120113372802734e-06, 4.163011908531189e-07, 3.5446137189865112e-06, 6.6729262471199036e-06, 9.801238775253296e-06, 1.2929551303386688e-05, 1.605786383152008e-05, 1.9186176359653473e-05, 2.2314488887786865e-05, 2.5442801415920258e-05, 2.857111394405365e-05, 3.169942647218704e-05, 3.4827739000320435e-05, 3.795605152845383e-05, 4.108436405658722e-05, 4.421267658472061e-05, 4.7340989112854004e-05, 5.0469301640987396e-05, 5.359761416912079e-05, 5.672592669725418e-05, 5.985423922538757e-05, 6.298255175352097e-05, 6.611086428165436e-05, 6.923917680978775e-05, 7.236748933792114e-05, 7.549580186605453e-05, 7.862411439418793e-05, 8.175242692232132e-05, 8.488073945045471e-05, 8.80090519785881e-05, 9.11373645067215e-05, 9.426567703485489e-05, 9.739398956298828e-05]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 5.0, 7.0, 10.0, 11.0, 12.0, 15.0, 10.0, 25.0, 15.0, 20.0, 22.0, 28.0, 25.0, 31.0, 37.0, 37.0, 41.0, 47.0, 44.0, 50.0, 45.0, 40.0, 31.0, 36.0, 31.0, 34.0, 39.0, 30.0, 31.0, 23.0, 26.0, 18.0, 18.0, 10.0, 21.0, 14.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.667043685913086e-05, -4.516914486885071e-05, -4.366785287857056e-05, -4.2166560888290405e-05, -4.0665268898010254e-05, -3.91639769077301e-05, -3.766268491744995e-05, -3.61613929271698e-05, -3.466010093688965e-05, -3.31588089466095e-05, -3.1657516956329346e-05, -3.0156224966049194e-05, -2.8654932975769043e-05, -2.715364098548889e-05, -2.565234899520874e-05, -2.415105700492859e-05, -2.2649765014648438e-05, -2.1148473024368286e-05, -1.9647181034088135e-05, -1.8145889043807983e-05, -1.6644597053527832e-05, -1.514330506324768e-05, -1.364201307296753e-05, -1.2140721082687378e-05, -1.0639429092407227e-05, -9.138137102127075e-06, -7.636845111846924e-06, -6.1355531215667725e-06, -4.634261131286621e-06, -3.1329691410064697e-06, -1.6316771507263184e-06, -1.30385160446167e-07, 1.3709068298339844e-06, 2.8721988201141357e-06, 4.373490810394287e-06, 5.8747828006744385e-06, 7.37607479095459e-06, 8.877366781234741e-06, 1.0378658771514893e-05, 1.1879950761795044e-05, 1.3381242752075195e-05, 1.4882534742355347e-05, 1.6383826732635498e-05, 1.788511872291565e-05, 1.93864107131958e-05, 2.0887702703475952e-05, 2.2388994693756104e-05, 2.3890286684036255e-05, 2.5391578674316406e-05, 2.6892870664596558e-05, 2.839416265487671e-05, 2.989545464515686e-05, 3.139674663543701e-05, 3.289803862571716e-05, 3.4399330615997314e-05, 3.5900622606277466e-05, 3.740191459655762e-05, 3.890320658683777e-05, 4.040449857711792e-05, 4.190579056739807e-05, 4.340708255767822e-05, 4.4908374547958374e-05, 4.6409666538238525e-05, 4.791095852851868e-05, 4.941225051879883e-05]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 9.0, 20.0, 24.0, 30.0, 47.0, 68.0, 100.0, 179.0, 248.0, 454.0, 760.0, 1276.0, 2410.0, 6086.0, 18027.0, 117136.0, 796135.0, 82225.0, 13295.0, 4745.0, 2273.0, 1258.0, 644.0, 381.0, 262.0, 157.0, 108.0, 52.0, 45.0, 35.0, 17.0, 15.0, 12.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1636486053466797e-05, -2.084672451019287e-05, -2.0056962966918945e-05, -1.926720142364502e-05, -1.8477439880371094e-05, -1.7687678337097168e-05, -1.6897916793823242e-05, -1.6108155250549316e-05, -1.531839370727539e-05, -1.4528632164001465e-05, -1.3738870620727539e-05, -1.2949109077453613e-05, -1.2159347534179688e-05, -1.1369585990905762e-05, -1.0579824447631836e-05, -9.79006290435791e-06, -9.000301361083984e-06, -8.210539817810059e-06, -7.420778274536133e-06, -6.631016731262207e-06, -5.841255187988281e-06, -5.0514936447143555e-06, -4.26173210144043e-06, -3.471970558166504e-06, -2.682209014892578e-06, -1.8924474716186523e-06, -1.1026859283447266e-06, -3.129243850708008e-07, 4.76837158203125e-07, 1.2665987014770508e-06, 2.0563602447509766e-06, 2.8461217880249023e-06, 3.635883331298828e-06, 4.425644874572754e-06, 5.21540641784668e-06, 6.0051679611206055e-06, 6.794929504394531e-06, 7.584691047668457e-06, 8.374452590942383e-06, 9.164214134216309e-06, 9.953975677490234e-06, 1.074373722076416e-05, 1.1533498764038086e-05, 1.2323260307312012e-05, 1.3113021850585938e-05, 1.3902783393859863e-05, 1.4692544937133789e-05, 1.5482306480407715e-05, 1.627206802368164e-05, 1.7061829566955566e-05, 1.7851591110229492e-05, 1.8641352653503418e-05, 1.9431114196777344e-05, 2.022087574005127e-05, 2.1010637283325195e-05, 2.180039882659912e-05, 2.2590160369873047e-05, 2.3379921913146973e-05, 2.41696834564209e-05, 2.4959444999694824e-05, 2.574920654296875e-05, 2.6538968086242676e-05, 2.73287296295166e-05, 2.8118491172790527e-05, 2.8908252716064453e-05]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 10.0, 4.0, 8.0, 25.0, 34.0, 64.0, 99.0, 236.0, 225.0, 134.0, 56.0, 36.0, 19.0, 11.0, 10.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-05, -1.0439194738864899e-05, -1.0149553418159485e-05, -9.859912097454071e-06, -9.570270776748657e-06, -9.280629456043243e-06, -8.99098813533783e-06, -8.701346814632416e-06, -8.411705493927002e-06, -8.122064173221588e-06, -7.832422852516174e-06, -7.5427815318107605e-06, -7.253140211105347e-06, -6.963498890399933e-06, -6.673857569694519e-06, -6.384216248989105e-06, -6.094574928283691e-06, -5.804933607578278e-06, -5.515292286872864e-06, -5.22565096616745e-06, -4.936009645462036e-06, -4.646368324756622e-06, -4.3567270040512085e-06, -4.067085683345795e-06, -3.777444362640381e-06, -3.487803041934967e-06, -3.1981617212295532e-06, -2.9085204005241394e-06, -2.6188790798187256e-06, -2.3292377591133118e-06, -2.039596438407898e-06, -1.7499551177024841e-06, -1.4603137969970703e-06, -1.1706724762916565e-06, -8.810311555862427e-07, -5.913898348808289e-07, -3.0174851417541504e-07, -1.210719347000122e-08, 2.775341272354126e-07, 5.671754479408264e-07, 8.568167686462402e-07, 1.146458089351654e-06, 1.4360994100570679e-06, 1.7257407307624817e-06, 2.0153820514678955e-06, 2.3050233721733093e-06, 2.594664692878723e-06, 2.884306013584137e-06, 3.1739473342895508e-06, 3.4635886549949646e-06, 3.7532299757003784e-06, 4.042871296405792e-06, 4.332512617111206e-06, 4.62215393781662e-06, 4.911795258522034e-06, 5.2014365792274475e-06, 5.491077899932861e-06, 5.780719220638275e-06, 6.070360541343689e-06, 6.360001862049103e-06, 6.649643182754517e-06, 6.93928450345993e-06, 7.228925824165344e-06, 7.518567144870758e-06, 7.808208465576172e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 13.0, 3.0, 8.0, 14.0, 21.0, 33.0, 36.0, 69.0, 116.0, 127.0, 214.0, 355.0, 573.0, 987.0, 1765.0, 2949.0, 5477.0, 24169.0, 967288.0, 30938.0, 5877.0, 3044.0, 1812.0, 969.0, 617.0, 388.0, 241.0, 133.0, 94.0, 65.0, 33.0, 44.0, 28.0, 22.0, 8.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3048133850097656e-05, -5.131028592586517e-05, -4.957243800163269e-05, -4.783459007740021e-05, -4.6096742153167725e-05, -4.435889422893524e-05, -4.262104630470276e-05, -4.0883198380470276e-05, -3.914535045623779e-05, -3.740750253200531e-05, -3.566965460777283e-05, -3.3931806683540344e-05, -3.219395875930786e-05, -3.045611083507538e-05, -2.8718262910842896e-05, -2.6980414986610413e-05, -2.524256706237793e-05, -2.3504719138145447e-05, -2.1766871213912964e-05, -2.002902328968048e-05, -1.8291175365447998e-05, -1.6553327441215515e-05, -1.4815479516983032e-05, -1.307763159275055e-05, -1.1339783668518066e-05, -9.601935744285583e-06, -7.8640878200531e-06, -6.126239895820618e-06, -4.388391971588135e-06, -2.650544047355652e-06, -9.126961231231689e-07, 8.25151801109314e-07, 2.562999725341797e-06, 4.30084764957428e-06, 6.038695573806763e-06, 7.776543498039246e-06, 9.514391422271729e-06, 1.1252239346504211e-05, 1.2990087270736694e-05, 1.4727935194969177e-05, 1.646578311920166e-05, 1.8203631043434143e-05, 1.9941478967666626e-05, 2.167932689189911e-05, 2.3417174816131592e-05, 2.5155022740364075e-05, 2.6892870664596558e-05, 2.863071858882904e-05, 3.0368566513061523e-05, 3.2106414437294006e-05, 3.384426236152649e-05, 3.558211028575897e-05, 3.7319958209991455e-05, 3.905780613422394e-05, 4.079565405845642e-05, 4.2533501982688904e-05, 4.427134990692139e-05, 4.600919783115387e-05, 4.774704575538635e-05, 4.9484893679618835e-05, 5.122274160385132e-05, 5.29605895280838e-05, 5.4698437452316284e-05, 5.643628537654877e-05, 5.817413330078125e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 22.0, 94.0, 385.0, 353.0, 79.0, 27.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.759695053100586e-05, -2.6851892471313477e-05, -2.6106834411621094e-05, -2.536177635192871e-05, -2.4616718292236328e-05, -2.3871660232543945e-05, -2.3126602172851562e-05, -2.238154411315918e-05, -2.1636486053466797e-05, -2.0891427993774414e-05, -2.014636993408203e-05, -1.940131187438965e-05, -1.8656253814697266e-05, -1.7911195755004883e-05, -1.71661376953125e-05, -1.6421079635620117e-05, -1.5676021575927734e-05, -1.4930963516235352e-05, -1.4185905456542969e-05, -1.3440847396850586e-05, -1.2695789337158203e-05, -1.195073127746582e-05, -1.1205673217773438e-05, -1.0460615158081055e-05, -9.715557098388672e-06, -8.970499038696289e-06, -8.225440979003906e-06, -7.4803829193115234e-06, -6.735324859619141e-06, -5.990266799926758e-06, -5.245208740234375e-06, -4.500150680541992e-06, -3.7550926208496094e-06, -3.0100345611572266e-06, -2.2649765014648438e-06, -1.519918441772461e-06, -7.748603820800781e-07, -2.9802322387695312e-08, 7.152557373046875e-07, 1.4603137969970703e-06, 2.205371856689453e-06, 2.950429916381836e-06, 3.6954879760742188e-06, 4.4405460357666016e-06, 5.185604095458984e-06, 5.930662155151367e-06, 6.67572021484375e-06, 7.420778274536133e-06, 8.165836334228516e-06, 8.910894393920898e-06, 9.655952453613281e-06, 1.0401010513305664e-05, 1.1146068572998047e-05, 1.189112663269043e-05, 1.2636184692382812e-05, 1.3381242752075195e-05, 1.4126300811767578e-05, 1.4871358871459961e-05, 1.5616416931152344e-05, 1.6361474990844727e-05, 1.710653305053711e-05, 1.7851591110229492e-05, 1.8596649169921875e-05, 1.9341707229614258e-05, 2.008676528930664e-05]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 6.0, 12.0, 18.0, 22.0, 37.0, 63.0, 100.0, 228.0, 209.0, 101.0, 76.0, 35.0, 27.0, 27.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009368520113639534, -0.000911522307433188, -0.0008861925452947617, -0.0008608627831563354, -0.00083553307922557, -0.0008102033752948046, -0.0007848736131563783, -0.000759543851017952, -0.0007342141470871866, -0.0007088844431564212, -0.0006835546810179949, -0.0006582249188795686, -0.0006328952149488032, -0.0006075655110180378, -0.0005822357488796115, -0.0005569059867411852, -0.0005315762828104198, -0.0005062465788796544, -0.0004809168167412281, -0.00045558708370663226, -0.0004302573506720364, -0.00040492761763744056, -0.0003795978846028447, -0.00035426815156824887, -0.000328938418533653, -0.0003036086854990572, -0.0002782789524644613, -0.0002529492194298655, -0.00022761948639526963, -0.00020228975336067379, -0.00017696002032607794, -0.0001516302872914821, -0.00012630055425688624, -0.0001009708212222904, -7.564108818769455e-05, -5.03113551530987e-05, -2.4981622118502855e-05, 3.4811091609299183e-07, 2.567784395068884e-05, 5.1007576985284686e-05, 7.633731001988053e-05, 0.00010166704305447638, 0.00012699677608907223, 0.00015232650912366807, 0.00017765624215826392, 0.00020298597519285977, 0.00022831570822745562, 0.00025364544126205146, 0.0002789751742966473, 0.00030430490733124316, 0.000329634640365839, 0.00035496437340043485, 0.0003802941064350307, 0.00040562383946962655, 0.0004309535725042224, 0.00045628330553881824, 0.0004816130385734141, 0.0005069427425041795, 0.0005322725046426058, 0.0005576022667810321, 0.0005829319707117975, 0.0006082616746425629, 0.0006335914367809892, 0.0006589211989194155, 0.0006842509028501809]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 9.0, 9.0, 9.0, 7.0, 11.0, 19.0, 24.0, 16.0, 15.0, 26.0, 31.0, 35.0, 35.0, 30.0, 41.0, 35.0, 34.0, 42.0, 40.0, 43.0, 33.0, 35.0, 43.0, 38.0, 37.0, 29.0, 33.0, 24.0, 33.0, 20.0, 30.0, 19.0, 19.0, 12.0, 13.0, 12.0, 8.0, 6.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00026488304138183594, -0.00025603268295526505, -0.00024718232452869415, -0.00023833196610212326, -0.00022948160767555237, -0.00022063124924898148, -0.00021178089082241058, -0.0002029305323958397, -0.0001940801739692688, -0.0001852298155426979, -0.00017637945711612701, -0.00016752909868955612, -0.00015867874026298523, -0.00014982838183641434, -0.00014097802340984344, -0.00013212766498327255, -0.00012327730655670166, -0.00011442694813013077, -0.00010557658970355988, -9.672623127698898e-05, -8.787587285041809e-05, -7.90255144238472e-05, -7.01751559972763e-05, -6.132479757070541e-05, -5.247443914413452e-05, -4.362408071756363e-05, -3.477372229099274e-05, -2.5923363864421844e-05, -1.7073005437850952e-05, -8.22264701128006e-06, 6.277114152908325e-07, 9.478069841861725e-06, 1.8328428268432617e-05, 2.717878669500351e-05, 3.60291451215744e-05, 4.4879503548145294e-05, 5.3729861974716187e-05, 6.258022040128708e-05, 7.143057882785797e-05, 8.028093725442886e-05, 8.913129568099976e-05, 9.798165410757065e-05, 0.00010683201253414154, 0.00011568237096071243, 0.00012453272938728333, 0.00013338308781385422, 0.0001422334462404251, 0.000151083804666996, 0.0001599341630935669, 0.0001687845215201378, 0.00017763487994670868, 0.00018648523837327957, 0.00019533559679985046, 0.00020418595522642136, 0.00021303631365299225, 0.00022188667207956314, 0.00023073703050613403, 0.00023958738893270493, 0.0002484377473592758, 0.0002572881057858467, 0.0002661384642124176, 0.0002749888226389885, 0.0002838391810655594, 0.0002926895394921303, 0.00030153989791870117]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 11.0, 21.0, 36.0, 64.0, 90.0, 145.0, 226.0, 349.0, 530.0, 874.0, 1428.0, 2384.0, 4256.0, 7799.0, 14461.0, 30553.0, 73785.0, 288260.0, 3501381.0, 160870.0, 52609.0, 24410.0, 12545.0, 6584.0, 3712.0, 2170.0, 1324.0, 895.0, 610.0, 404.0, 342.0, 215.0, 175.0, 132.0, 129.0, 102.0, 64.0, 65.0, 49.0, 44.0, 28.0, 31.0, 26.0, 15.0, 14.0, 19.0, 10.0, 7.0, 12.0, 4.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00011032819747924805, -0.00010540056973695755, -0.00010047294199466705, -9.554531425237656e-05, -9.061768651008606e-05, -8.569005876779556e-05, -8.076243102550507e-05, -7.583480328321457e-05, -7.090717554092407e-05, -6.597954779863358e-05, -6.105192005634308e-05, -5.612429231405258e-05, -5.1196664571762085e-05, -4.626903682947159e-05, -4.134140908718109e-05, -3.6413781344890594e-05, -3.14861536026001e-05, -2.65585258603096e-05, -2.1630898118019104e-05, -1.6703270375728607e-05, -1.177564263343811e-05, -6.8480148911476135e-06, -1.9203871488571167e-06, 3.00724059343338e-06, 7.934868335723877e-06, 1.2862496078014374e-05, 1.779012382030487e-05, 2.2717751562595367e-05, 2.7645379304885864e-05, 3.257300704717636e-05, 3.750063478946686e-05, 4.2428262531757355e-05, 4.735589027404785e-05, 5.228351801633835e-05, 5.7211145758628845e-05, 6.213877350091934e-05, 6.706640124320984e-05, 7.199402898550034e-05, 7.692165672779083e-05, 8.184928447008133e-05, 8.677691221237183e-05, 9.170453995466232e-05, 9.663216769695282e-05, 0.00010155979543924332, 0.00010648742318153381, 0.00011141505092382431, 0.00011634267866611481, 0.0001212703064084053, 0.0001261979341506958, 0.0001311255618929863, 0.0001360531896352768, 0.0001409808173775673, 0.0001459084451198578, 0.00015083607286214828, 0.00015576370060443878, 0.00016069132834672928, 0.00016561895608901978, 0.00017054658383131027, 0.00017547421157360077, 0.00018040183931589127, 0.00018532946705818176, 0.00019025709480047226, 0.00019518472254276276, 0.00020011235028505325, 0.00020503997802734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 9.0, 6.0, 8.0, 17.0, 18.0, 22.0, 32.0, 49.0, 49.0, 79.0, 95.0, 110.0, 111.0, 98.0, 76.0, 44.0, 42.0, 35.0, 21.0, 19.0, 24.0, 12.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1338462829589844e-05, -2.0381063222885132e-05, -1.942366361618042e-05, -1.8466264009475708e-05, -1.7508864402770996e-05, -1.6551464796066284e-05, -1.5594065189361572e-05, -1.463666558265686e-05, -1.3679265975952148e-05, -1.2721866369247437e-05, -1.1764466762542725e-05, -1.0807067155838013e-05, -9.8496675491333e-06, -8.892267942428589e-06, -7.934868335723877e-06, -6.977468729019165e-06, -6.020069122314453e-06, -5.062669515609741e-06, -4.105269908905029e-06, -3.1478703022003174e-06, -2.1904706954956055e-06, -1.2330710887908936e-06, -2.7567148208618164e-07, 6.817281246185303e-07, 1.6391277313232422e-06, 2.596527338027954e-06, 3.553926944732666e-06, 4.511326551437378e-06, 5.46872615814209e-06, 6.426125764846802e-06, 7.383525371551514e-06, 8.340924978256226e-06, 9.298324584960938e-06, 1.025572419166565e-05, 1.1213123798370361e-05, 1.2170523405075073e-05, 1.3127923011779785e-05, 1.4085322618484497e-05, 1.5042722225189209e-05, 1.600012183189392e-05, 1.6957521438598633e-05, 1.7914921045303345e-05, 1.8872320652008057e-05, 1.982972025871277e-05, 2.078711986541748e-05, 2.1744519472122192e-05, 2.2701919078826904e-05, 2.3659318685531616e-05, 2.4616718292236328e-05, 2.557411789894104e-05, 2.6531517505645752e-05, 2.7488917112350464e-05, 2.8446316719055176e-05, 2.9403716325759888e-05, 3.03611159324646e-05, 3.131851553916931e-05, 3.2275915145874023e-05, 3.3233314752578735e-05, 3.419071435928345e-05, 3.514811396598816e-05, 3.610551357269287e-05, 3.706291317939758e-05, 3.8020312786102295e-05, 3.897771239280701e-05, 3.993511199951172e-05]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 10.0, 7.0, 9.0, 25.0, 29.0, 37.0, 52.0, 79.0, 99.0, 130.0, 220.0, 334.0, 516.0, 772.0, 1123.0, 1872.0, 2938.0, 4787.0, 8358.0, 14860.0, 28551.0, 60016.0, 145879.0, 588563.0, 2847298.0, 293525.0, 99016.0, 43887.0, 22105.0, 11874.0, 6518.0, 4013.0, 2406.0, 1428.0, 972.0, 651.0, 411.0, 266.0, 187.0, 150.0, 96.0, 64.0, 43.0, 30.0, 20.0, 29.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 4.0], "bins": [-0.00010639429092407227, -0.0001032920554280281, -0.00010018981993198395, -9.708758443593979e-05, -9.398534893989563e-05, -9.088311344385147e-05, -8.778087794780731e-05, -8.467864245176315e-05, -8.1576406955719e-05, -7.847417145967484e-05, -7.537193596363068e-05, -7.226970046758652e-05, -6.916746497154236e-05, -6.60652294754982e-05, -6.296299397945404e-05, -5.986075848340988e-05, -5.675852298736572e-05, -5.3656287491321564e-05, -5.0554051995277405e-05, -4.7451816499233246e-05, -4.434958100318909e-05, -4.124734550714493e-05, -3.814511001110077e-05, -3.504287451505661e-05, -3.194063901901245e-05, -2.8838403522968292e-05, -2.5736168026924133e-05, -2.2633932530879974e-05, -1.9531697034835815e-05, -1.6429461538791656e-05, -1.3327226042747498e-05, -1.0224990546703339e-05, -7.12275505065918e-06, -4.020519554615021e-06, -9.182840585708618e-07, 2.183951437473297e-06, 5.286186933517456e-06, 8.388422429561615e-06, 1.1490657925605774e-05, 1.4592893421649933e-05, 1.7695128917694092e-05, 2.079736441373825e-05, 2.389959990978241e-05, 2.700183540582657e-05, 3.0104070901870728e-05, 3.3206306397914886e-05, 3.6308541893959045e-05, 3.9410777390003204e-05, 4.251301288604736e-05, 4.561524838209152e-05, 4.871748387813568e-05, 5.181971937417984e-05, 5.4921954870224e-05, 5.802419036626816e-05, 6.112642586231232e-05, 6.422866135835648e-05, 6.733089685440063e-05, 7.04331323504448e-05, 7.353536784648895e-05, 7.663760334253311e-05, 7.973983883857727e-05, 8.284207433462143e-05, 8.594430983066559e-05, 8.904654532670975e-05, 9.21487808227539e-05]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 10.0, 18.0, 13.0, 19.0, 21.0, 46.0, 46.0, 62.0, 84.0, 97.0, 124.0, 149.0, 268.0, 652.0, 999.0, 486.0, 218.0, 144.0, 91.0, 75.0, 59.0, 63.0, 51.0, 48.0, 35.0, 31.0, 29.0, 24.0, 15.0, 10.0, 8.0, 13.0, 11.0, 12.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.318092346191406e-05, -6.134528666734695e-05, -5.9509649872779846e-05, -5.767401307821274e-05, -5.583837628364563e-05, -5.400273948907852e-05, -5.2167102694511414e-05, -5.0331465899944305e-05, -4.84958291053772e-05, -4.666019231081009e-05, -4.482455551624298e-05, -4.298891872167587e-05, -4.1153281927108765e-05, -3.9317645132541656e-05, -3.748200833797455e-05, -3.564637154340744e-05, -3.381073474884033e-05, -3.1975097954273224e-05, -3.0139461159706116e-05, -2.8303824365139008e-05, -2.64681875705719e-05, -2.463255077600479e-05, -2.2796913981437683e-05, -2.0961277186870575e-05, -1.9125640392303467e-05, -1.729000359773636e-05, -1.545436680316925e-05, -1.3618730008602142e-05, -1.1783093214035034e-05, -9.947456419467926e-06, -8.111819624900818e-06, -6.27618283033371e-06, -4.4405460357666016e-06, -2.6049092411994934e-06, -7.692724466323853e-07, 1.066364347934723e-06, 2.902001142501831e-06, 4.737637937068939e-06, 6.573274731636047e-06, 8.408911526203156e-06, 1.0244548320770264e-05, 1.2080185115337372e-05, 1.391582190990448e-05, 1.5751458704471588e-05, 1.7587095499038696e-05, 1.9422732293605804e-05, 2.1258369088172913e-05, 2.309400588274002e-05, 2.492964267730713e-05, 2.6765279471874237e-05, 2.8600916266441345e-05, 3.0436553061008453e-05, 3.227218985557556e-05, 3.410782665014267e-05, 3.594346344470978e-05, 3.7779100239276886e-05, 3.9614737033843994e-05, 4.14503738284111e-05, 4.328601062297821e-05, 4.512164741754532e-05, 4.695728421211243e-05, 4.8792921006679535e-05, 5.062855780124664e-05, 5.246419459581375e-05, 5.429983139038086e-05]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 19.0, 51.0, 242.0, 404.0, 148.0, 72.0, 38.0, 15.0, 11.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042655286961235106, -0.00038011689321137965, -0.00033368091681040823, -0.0002872449404094368, -0.0002408089640084654, -0.000194372987607494, -0.00014793701120652258, -0.00010150103480555117, -5.506505840457976e-05, -8.629082003608346e-06, 3.780689439736307e-05, 8.424287079833448e-05, 0.0001306788471993059, 0.0001771148236002773, 0.00022355080000124872, 0.00026998677640222013, 0.00031642275280319154, 0.00036285872920416296, 0.00040929470560513437, 0.0004557306820061058, 0.0005021666875109076, 0.0005486026639118791, 0.0005950386403128505, 0.0006414746167138219, 0.0006879105931147933, 0.0007343465695157647, 0.0007807825459167361, 0.0008272185223177075, 0.000873654498718679, 0.0009200904751196504, 0.0009665264515206218, 0.0010129624279215932, 0.0010593982879072428, 0.0011058342643082142, 0.0011522702407091856, 0.001198706217110157, 0.0012451421935111284, 0.0012915781699120998, 0.0013380141463130713, 0.0013844501227140427, 0.001430886099115014, 0.0014773220755159855, 0.001523758051916957, 0.0015701940283179283, 0.0016166300047188997, 0.0016630659811198711, 0.0017095019575208426, 0.001755937933921814, 0.0018023739103227854, 0.0018488098867237568, 0.0018952458631247282, 0.0019416818395256996, 0.001988117815926671, 0.0020345537923276424, 0.002080989768728614, 0.0021274257451295853, 0.0021738617215305567, 0.002220297697931528, 0.0022667336743324995, 0.002313169650733471, 0.0023596056271344423, 0.0024060416035354137, 0.002452477579936385, 0.0024989135563373566, 0.002545349532738328]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 8.0, 8.0, 12.0, 12.0, 20.0, 19.0, 24.0, 25.0, 29.0, 33.0, 37.0, 40.0, 55.0, 54.0, 49.0, 45.0, 44.0, 40.0, 46.0, 59.0, 51.0, 38.0, 31.0, 36.0, 24.0, 34.0, 26.0, 21.0, 17.0, 12.0, 11.0, 15.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.00031948089599609375, -0.0003105495125055313, -0.00030161812901496887, -0.00029268674552440643, -0.000283755362033844, -0.00027482397854328156, -0.0002658925950527191, -0.0002569612115621567, -0.00024802982807159424, -0.0002390984445810318, -0.00023016706109046936, -0.00022123567759990692, -0.00021230429410934448, -0.00020337291061878204, -0.0001944415271282196, -0.00018551014363765717, -0.00017657876014709473, -0.0001676473766565323, -0.00015871599316596985, -0.0001497846096754074, -0.00014085322618484497, -0.00013192184269428253, -0.0001229904592037201, -0.00011405907571315765, -0.00010512769222259521, -9.619630873203278e-05, -8.726492524147034e-05, -7.83335417509079e-05, -6.940215826034546e-05, -6.047077476978302e-05, -5.153939127922058e-05, -4.260800778865814e-05, -3.36766242980957e-05, -2.4745240807533264e-05, -1.5813857316970825e-05, -6.882473826408386e-06, 2.0489096641540527e-06, 1.0980293154716492e-05, 1.991167664527893e-05, 2.884306013584137e-05, 3.777444362640381e-05, 4.670582711696625e-05, 5.5637210607528687e-05, 6.456859409809113e-05, 7.349997758865356e-05, 8.2431361079216e-05, 9.136274456977844e-05, 0.00010029412806034088, 0.00010922551155090332, 0.00011815689504146576, 0.0001270882785320282, 0.00013601966202259064, 0.00014495104551315308, 0.00015388242900371552, 0.00016281381249427795, 0.0001717451959848404, 0.00018067657947540283, 0.00018960796296596527, 0.0001985393464565277, 0.00020747072994709015, 0.0002164021134376526, 0.00022533349692821503, 0.00023426488041877747, 0.0002431962639093399, 0.00025212764739990234]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 7.0, 9.0, 9.0, 14.0, 14.0, 23.0, 22.0, 27.0, 38.0, 61.0, 104.0, 168.0, 269.0, 509.0, 938.0, 1945.0, 4300.0, 10511.0, 29924.0, 118764.0, 656863.0, 163801.0, 37730.0, 12649.0, 5088.0, 2215.0, 1078.0, 559.0, 314.0, 184.0, 105.0, 80.0, 40.0, 42.0, 30.0, 20.0, 19.0, 12.0, 13.0, 9.0, 7.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.00027108192443847656, -0.00026301294565200806, -0.00025494396686553955, -0.00024687498807907104, -0.00023880600929260254, -0.00023073703050613403, -0.00022266805171966553, -0.00021459907293319702, -0.00020653009414672852, -0.00019846111536026, -0.0001903921365737915, -0.000182323157787323, -0.0001742541790008545, -0.00016618520021438599, -0.00015811622142791748, -0.00015004724264144897, -0.00014197826385498047, -0.00013390928506851196, -0.00012584030628204346, -0.00011777132749557495, -0.00010970234870910645, -0.00010163336992263794, -9.356439113616943e-05, -8.549541234970093e-05, -7.742643356323242e-05, -6.935745477676392e-05, -6.128847599029541e-05, -5.3219497203826904e-05, -4.51505184173584e-05, -3.708153963088989e-05, -2.9012560844421387e-05, -2.094358205795288e-05, -1.2874603271484375e-05, -4.805624485015869e-06, 3.2633543014526367e-06, 1.1332333087921143e-05, 1.940131187438965e-05, 2.7470290660858154e-05, 3.553926944732666e-05, 4.3608248233795166e-05, 5.167722702026367e-05, 5.974620580673218e-05, 6.781518459320068e-05, 7.588416337966919e-05, 8.39531421661377e-05, 9.20221209526062e-05, 0.00010009109973907471, 0.00010816007852554321, 0.00011622905731201172, 0.00012429803609848022, 0.00013236701488494873, 0.00014043599367141724, 0.00014850497245788574, 0.00015657395124435425, 0.00016464293003082275, 0.00017271190881729126, 0.00018078088760375977, 0.00018884986639022827, 0.00019691884517669678, 0.00020498782396316528, 0.0002130568027496338, 0.0002211257815361023, 0.0002291947603225708, 0.0002372637391090393, 0.0002453327178955078]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 15.0, 13.0, 18.0, 30.0, 51.0, 73.0, 99.0, 101.0, 154.0, 130.0, 94.0, 76.0, 39.0, 38.0, 16.0, 16.0, 7.0, 12.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6404857635498047e-05, -2.5181099772453308e-05, -2.395734190940857e-05, -2.273358404636383e-05, -2.1509826183319092e-05, -2.0286068320274353e-05, -1.9062310457229614e-05, -1.7838552594184875e-05, -1.6614794731140137e-05, -1.5391036868095398e-05, -1.416727900505066e-05, -1.294352114200592e-05, -1.1719763278961182e-05, -1.0496005415916443e-05, -9.272247552871704e-06, -8.048489689826965e-06, -6.8247318267822266e-06, -5.600973963737488e-06, -4.377216100692749e-06, -3.1534582376480103e-06, -1.9297003746032715e-06, -7.059425115585327e-07, 5.178153514862061e-07, 1.7415732145309448e-06, 2.9653310775756836e-06, 4.189088940620422e-06, 5.412846803665161e-06, 6.6366046667099e-06, 7.860362529754639e-06, 9.084120392799377e-06, 1.0307878255844116e-05, 1.1531636118888855e-05, 1.2755393981933594e-05, 1.3979151844978333e-05, 1.5202909708023071e-05, 1.642666757106781e-05, 1.765042543411255e-05, 1.8874183297157288e-05, 2.0097941160202026e-05, 2.1321699023246765e-05, 2.2545456886291504e-05, 2.3769214749336243e-05, 2.499297261238098e-05, 2.621673047542572e-05, 2.744048833847046e-05, 2.8664246201515198e-05, 2.9888004064559937e-05, 3.1111761927604675e-05, 3.2335519790649414e-05, 3.355927765369415e-05, 3.478303551673889e-05, 3.600679337978363e-05, 3.723055124282837e-05, 3.845430910587311e-05, 3.967806696891785e-05, 4.0901824831962585e-05, 4.2125582695007324e-05, 4.334934055805206e-05, 4.45730984210968e-05, 4.579685628414154e-05, 4.702061414718628e-05, 4.824437201023102e-05, 4.946812987327576e-05, 5.0691887736320496e-05, 5.1915645599365234e-05]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 10.0, 9.0, 12.0, 26.0, 39.0, 57.0, 81.0, 96.0, 164.0, 256.0, 395.0, 535.0, 892.0, 1321.0, 2102.0, 3507.0, 5701.0, 9666.0, 16700.0, 31137.0, 58654.0, 121118.0, 361602.0, 235127.0, 92814.0, 46826.0, 25044.0, 13706.0, 8041.0, 4754.0, 2936.0, 1814.0, 1140.0, 781.0, 439.0, 350.0, 230.0, 147.0, 94.0, 80.0, 45.0, 38.0, 22.0, 15.0, 10.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.888410568237305e-05, -9.577721357345581e-05, -9.267032146453857e-05, -8.956342935562134e-05, -8.64565372467041e-05, -8.334964513778687e-05, -8.024275302886963e-05, -7.713586091995239e-05, -7.402896881103516e-05, -7.092207670211792e-05, -6.781518459320068e-05, -6.470829248428345e-05, -6.160140037536621e-05, -5.8494508266448975e-05, -5.538761615753174e-05, -5.22807240486145e-05, -4.9173831939697266e-05, -4.606693983078003e-05, -4.296004772186279e-05, -3.985315561294556e-05, -3.674626350402832e-05, -3.3639371395111084e-05, -3.053247928619385e-05, -2.742558717727661e-05, -2.4318695068359375e-05, -2.121180295944214e-05, -1.8104910850524902e-05, -1.4998018741607666e-05, -1.189112663269043e-05, -8.784234523773193e-06, -5.677342414855957e-06, -2.5704503059387207e-06, 5.364418029785156e-07, 3.643333911895752e-06, 6.750226020812988e-06, 9.857118129730225e-06, 1.2964010238647461e-05, 1.6070902347564697e-05, 1.9177794456481934e-05, 2.228468656539917e-05, 2.5391578674316406e-05, 2.8498470783233643e-05, 3.160536289215088e-05, 3.4712255001068115e-05, 3.781914710998535e-05, 4.092603921890259e-05, 4.4032931327819824e-05, 4.713982343673706e-05, 5.02467155456543e-05, 5.335360765457153e-05, 5.646049976348877e-05, 5.9567391872406006e-05, 6.267428398132324e-05, 6.578117609024048e-05, 6.888806819915771e-05, 7.199496030807495e-05, 7.510185241699219e-05, 7.820874452590942e-05, 8.131563663482666e-05, 8.44225287437439e-05, 8.752942085266113e-05, 9.063631296157837e-05, 9.37432050704956e-05, 9.685009717941284e-05, 9.995698928833008e-05]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 5.0, 9.0, 5.0, 3.0, 6.0, 10.0, 13.0, 12.0, 16.0, 33.0, 20.0, 37.0, 26.0, 30.0, 32.0, 44.0, 41.0, 48.0, 52.0, 56.0, 33.0, 49.0, 42.0, 40.0, 40.0, 41.0, 34.0, 25.0, 34.0, 22.0, 20.0, 36.0, 19.0, 13.0, 6.0, 10.0, 5.0, 10.0, 3.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08427619934082e-05, -4.904251545667648e-05, -4.724226891994476e-05, -4.544202238321304e-05, -4.364177584648132e-05, -4.18415293097496e-05, -4.004128277301788e-05, -3.824103623628616e-05, -3.644078969955444e-05, -3.4640543162822723e-05, -3.2840296626091003e-05, -3.1040050089359283e-05, -2.9239803552627563e-05, -2.7439557015895844e-05, -2.5639310479164124e-05, -2.3839063942432404e-05, -2.2038817405700684e-05, -2.0238570868968964e-05, -1.8438324332237244e-05, -1.6638077795505524e-05, -1.4837831258773804e-05, -1.3037584722042084e-05, -1.1237338185310364e-05, -9.437091648578644e-06, -7.636845111846924e-06, -5.836598575115204e-06, -4.036352038383484e-06, -2.236105501651764e-06, -4.3585896492004395e-07, 1.364387571811676e-06, 3.164634108543396e-06, 4.964880645275116e-06, 6.765127182006836e-06, 8.565373718738556e-06, 1.0365620255470276e-05, 1.2165866792201996e-05, 1.3966113328933716e-05, 1.5766359865665436e-05, 1.7566606402397156e-05, 1.9366852939128876e-05, 2.1167099475860596e-05, 2.2967346012592316e-05, 2.4767592549324036e-05, 2.6567839086055756e-05, 2.8368085622787476e-05, 3.0168332159519196e-05, 3.1968578696250916e-05, 3.3768825232982635e-05, 3.5569071769714355e-05, 3.7369318306446075e-05, 3.9169564843177795e-05, 4.0969811379909515e-05, 4.2770057916641235e-05, 4.4570304453372955e-05, 4.6370550990104675e-05, 4.8170797526836395e-05, 4.9971044063568115e-05, 5.1771290600299835e-05, 5.3571537137031555e-05, 5.5371783673763275e-05, 5.7172030210494995e-05, 5.8972276747226715e-05, 6.0772523283958435e-05, 6.257276982069016e-05, 6.437301635742188e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 1.0, 4.0, 8.0, 13.0, 20.0, 32.0, 60.0, 111.0, 98.0, 178.0, 290.0, 459.0, 642.0, 1031.0, 1831.0, 3276.0, 6077.0, 9105.0, 25270.0, 83728.0, 480254.0, 331609.0, 63200.0, 20880.0, 9108.0, 4637.0, 2170.0, 1670.0, 1045.0, 638.0, 390.0, 237.0, 152.0, 106.0, 60.0, 53.0, 30.0, 26.0, 14.0, 12.0, 8.0, 7.0, 10.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.000301361083984e-06, -8.70879739522934e-06, -8.417293429374695e-06, -8.12578946352005e-06, -7.834285497665405e-06, -7.5427815318107605e-06, -7.251277565956116e-06, -6.959773600101471e-06, -6.668269634246826e-06, -6.376765668392181e-06, -6.085261702537537e-06, -5.793757736682892e-06, -5.502253770828247e-06, -5.210749804973602e-06, -4.9192458391189575e-06, -4.627741873264313e-06, -4.336237907409668e-06, -4.044733941555023e-06, -3.7532299757003784e-06, -3.4617260098457336e-06, -3.170222043991089e-06, -2.878718078136444e-06, -2.5872141122817993e-06, -2.2957101464271545e-06, -2.0042061805725098e-06, -1.712702214717865e-06, -1.4211982488632202e-06, -1.1296942830085754e-06, -8.381903171539307e-07, -5.466863512992859e-07, -2.551823854446411e-07, 3.632158041000366e-08, 3.2782554626464844e-07, 6.193295121192932e-07, 9.10833477973938e-07, 1.2023374438285828e-06, 1.4938414096832275e-06, 1.7853453755378723e-06, 2.076849341392517e-06, 2.368353307247162e-06, 2.6598572731018066e-06, 2.9513612389564514e-06, 3.242865204811096e-06, 3.534369170665741e-06, 3.825873136520386e-06, 4.1173771023750305e-06, 4.408881068229675e-06, 4.70038503408432e-06, 4.991888999938965e-06, 5.28339296579361e-06, 5.574896931648254e-06, 5.866400897502899e-06, 6.157904863357544e-06, 6.449408829212189e-06, 6.7409127950668335e-06, 7.032416760921478e-06, 7.323920726776123e-06, 7.615424692630768e-06, 7.906928658485413e-06, 8.198432624340057e-06, 8.489936590194702e-06, 8.781440556049347e-06, 9.072944521903992e-06, 9.364448487758636e-06, 9.655952453613281e-06]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 5.0, 14.0, 16.0, 28.0, 27.0, 73.0, 47.0, 127.0, 101.0, 156.0, 124.0, 63.0, 71.0, 29.0, 22.0, 16.0, 27.0, 4.0, 9.0, 1.0, 4.0, 2.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.499219357967377e-06, -4.349276423454285e-06, -4.199333488941193e-06, -4.049390554428101e-06, -3.8994476199150085e-06, -3.7495046854019165e-06, -3.5995617508888245e-06, -3.4496188163757324e-06, -3.2996758818626404e-06, -3.1497329473495483e-06, -2.9997900128364563e-06, -2.8498470783233643e-06, -2.6999041438102722e-06, -2.54996120929718e-06, -2.400018274784088e-06, -2.250075340270996e-06, -2.100132405757904e-06, -1.950189471244812e-06, -1.80024653673172e-06, -1.650303602218628e-06, -1.5003606677055359e-06, -1.3504177331924438e-06, -1.2004747986793518e-06, -1.0505318641662598e-06, -9.005889296531677e-07, -7.506459951400757e-07, -6.007030606269836e-07, -4.507601261138916e-07, -3.0081719160079956e-07, -1.5087425708770752e-07, -9.313225746154785e-10, 1.4901161193847656e-07, 2.989545464515686e-07, 4.4889748096466064e-07, 5.988404154777527e-07, 7.487833499908447e-07, 8.987262845039368e-07, 1.0486692190170288e-06, 1.1986121535301208e-06, 1.3485550880432129e-06, 1.498498022556305e-06, 1.648440957069397e-06, 1.798383891582489e-06, 1.948326826095581e-06, 2.098269760608673e-06, 2.248212695121765e-06, 2.398155629634857e-06, 2.5480985641479492e-06, 2.6980414986610413e-06, 2.8479844331741333e-06, 2.9979273676872253e-06, 3.1478703022003174e-06, 3.2978132367134094e-06, 3.4477561712265015e-06, 3.5976991057395935e-06, 3.7476420402526855e-06, 3.897584974765778e-06, 4.04752790927887e-06, 4.197470843791962e-06, 4.347413778305054e-06, 4.497356712818146e-06, 4.647299647331238e-06, 4.79724258184433e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 9.0, 11.0, 13.0, 23.0, 22.0, 33.0, 34.0, 84.0, 85.0, 141.0, 222.0, 268.0, 511.0, 863.0, 1253.0, 2719.0, 4680.0, 12860.0, 35025.0, 350891.0, 569445.0, 42568.0, 14731.0, 5308.0, 2929.0, 1383.0, 923.0, 514.0, 297.0, 215.0, 130.0, 112.0, 77.0, 38.0, 34.0, 22.0, 21.0, 13.0, 10.0, 12.0, 2.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4483928680419922e-05, -1.4032237231731415e-05, -1.3580545783042908e-05, -1.31288543343544e-05, -1.2677162885665894e-05, -1.2225471436977386e-05, -1.177377998828888e-05, -1.1322088539600372e-05, -1.0870397090911865e-05, -1.0418705642223358e-05, -9.967014193534851e-06, -9.515322744846344e-06, -9.063631296157837e-06, -8.61193984746933e-06, -8.160248398780823e-06, -7.708556950092316e-06, -7.256865501403809e-06, -6.8051740527153015e-06, -6.3534826040267944e-06, -5.901791155338287e-06, -5.45009970664978e-06, -4.998408257961273e-06, -4.546716809272766e-06, -4.095025360584259e-06, -3.643333911895752e-06, -3.191642463207245e-06, -2.739951014518738e-06, -2.2882595658302307e-06, -1.8365681171417236e-06, -1.3848766684532166e-06, -9.331852197647095e-07, -4.814937710762024e-07, -2.9802322387695312e-08, 4.2188912630081177e-07, 8.735805749893188e-07, 1.325272023677826e-06, 1.776963472366333e-06, 2.22865492105484e-06, 2.680346369743347e-06, 3.1320378184318542e-06, 3.5837292671203613e-06, 4.035420715808868e-06, 4.4871121644973755e-06, 4.9388036131858826e-06, 5.39049506187439e-06, 5.842186510562897e-06, 6.293877959251404e-06, 6.745569407939911e-06, 7.197260856628418e-06, 7.648952305316925e-06, 8.100643754005432e-06, 8.55233520269394e-06, 9.004026651382446e-06, 9.455718100070953e-06, 9.90740954875946e-06, 1.0359100997447968e-05, 1.0810792446136475e-05, 1.1262483894824982e-05, 1.1714175343513489e-05, 1.2165866792201996e-05, 1.2617558240890503e-05, 1.306924968957901e-05, 1.3520941138267517e-05, 1.3972632586956024e-05, 1.4424324035644531e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 6.0, 5.0, 5.0, 8.0, 9.0, 19.0, 27.0, 32.0, 73.0, 146.0, 209.0, 185.0, 117.0, 59.0, 34.0, 24.0, 15.0, 11.0, 3.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.179115295410156e-06, -8.890405297279358e-06, -8.60169529914856e-06, -8.312985301017761e-06, -8.024275302886963e-06, -7.735565304756165e-06, -7.446855306625366e-06, -7.158145308494568e-06, -6.8694353103637695e-06, -6.580725312232971e-06, -6.292015314102173e-06, -6.0033053159713745e-06, -5.714595317840576e-06, -5.425885319709778e-06, -5.1371753215789795e-06, -4.848465323448181e-06, -4.559755325317383e-06, -4.2710453271865845e-06, -3.982335329055786e-06, -3.693625330924988e-06, -3.4049153327941895e-06, -3.116205334663391e-06, -2.8274953365325928e-06, -2.5387853384017944e-06, -2.250075340270996e-06, -1.9613653421401978e-06, -1.6726553440093994e-06, -1.383945345878601e-06, -1.0952353477478027e-06, -8.065253496170044e-07, -5.178153514862061e-07, -2.2910535335540771e-07, 5.960464477539063e-08, 3.4831464290618896e-07, 6.370246410369873e-07, 9.257346391677856e-07, 1.214444637298584e-06, 1.5031546354293823e-06, 1.7918646335601807e-06, 2.080574631690979e-06, 2.3692846298217773e-06, 2.6579946279525757e-06, 2.946704626083374e-06, 3.2354146242141724e-06, 3.5241246223449707e-06, 3.812834620475769e-06, 4.101544618606567e-06, 4.390254616737366e-06, 4.678964614868164e-06, 4.967674612998962e-06, 5.256384611129761e-06, 5.545094609260559e-06, 5.833804607391357e-06, 6.122514605522156e-06, 6.411224603652954e-06, 6.6999346017837524e-06, 6.988644599914551e-06, 7.277354598045349e-06, 7.5660645961761475e-06, 7.854774594306946e-06, 8.143484592437744e-06, 8.432194590568542e-06, 8.72090458869934e-06, 9.00961458683014e-06, 9.298324584960938e-06]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 5.0, 7.0, 9.0, 12.0, 27.0, 41.0, 88.0, 152.0, 311.0, 140.0, 81.0, 43.0, 39.0, 16.0, 11.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009723770199343562, -0.0009518836159259081, -0.0009313902701251209, -0.0009108968661166728, -0.0008904034621082246, -0.0008699101163074374, -0.0008494167122989893, -0.0008289233082905412, -0.000808429904282093, -0.0007879365002736449, -0.0007674431544728577, -0.0007469497504644096, -0.0007264563464559615, -0.0007059630006551743, -0.0006854695966467261, -0.000664976192638278, -0.0006444828468374908, -0.0006239894428290427, -0.0006034960970282555, -0.0005830026930198073, -0.0005625092890113592, -0.0005420158850029111, -0.0005215225392021239, -0.0005010291351936758, -0.0004805357602890581, -0.0004600423853844404, -0.0004395489813759923, -0.00041905560647137463, -0.00039856223156675696, -0.00037806882755830884, -0.00035757545265369117, -0.0003370820777490735, -0.00031658861553296447, -0.0002960952406283468, -0.0002756018366198987, -0.000255108461715281, -0.00023461507225874811, -0.00021412168280221522, -0.00019362830789759755, -0.00017313491844106466, -0.00015264152898453176, -0.00013214813952799886, -0.00011165475734742358, -9.11613751668483e-05, -7.06679857103154e-05, -5.017459625378251e-05, -2.9681221349164844e-05, -9.187831892631948e-06, 1.1305557563900948e-05, 3.1798943382455036e-05, 5.2292329201009125e-05, 7.27857113815844e-05, 9.32791008381173e-05, 0.0001137724902946502, 0.00013426586519926786, 0.00015475925465580076, 0.00017525264411233366, 0.00019574603356886655, 0.00021623942302539945, 0.00023673279793001711, 0.0002572261728346348, 0.0002777195768430829, 0.00029821295174770057, 0.00031870632665231824, 0.00033919973066076636]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 7.0, 7.0, 17.0, 12.0, 14.0, 12.0, 26.0, 23.0, 28.0, 27.0, 24.0, 27.0, 41.0, 32.0, 44.0, 45.0, 41.0, 31.0, 49.0, 53.0, 35.0, 47.0, 42.0, 30.0, 45.0, 29.0, 24.0, 29.0, 19.0, 18.0, 8.0, 21.0, 18.0, 15.0, 11.0, 6.0, 6.0, 3.0, 10.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00021183490753173828, -0.00020554568618535995, -0.00019925646483898163, -0.0001929672434926033, -0.00018667802214622498, -0.00018038880079984665, -0.00017409957945346832, -0.00016781035810709, -0.00016152113676071167, -0.00015523191541433334, -0.00014894269406795502, -0.0001426534727215767, -0.00013636425137519836, -0.00013007503002882004, -0.0001237858086824417, -0.00011749658733606339, -0.00011120736598968506, -0.00010491814464330673, -9.86289232969284e-05, -9.233970195055008e-05, -8.605048060417175e-05, -7.976125925779343e-05, -7.34720379114151e-05, -6.718281656503677e-05, -6.089359521865845e-05, -5.460437387228012e-05, -4.8315152525901794e-05, -4.202593117952347e-05, -3.573670983314514e-05, -2.9447488486766815e-05, -2.315826714038849e-05, -1.6869045794010162e-05, -1.0579824447631836e-05, -4.2906031012535095e-06, 1.998618245124817e-06, 8.287839591503143e-06, 1.457706093788147e-05, 2.0866282284259796e-05, 2.7155503630638123e-05, 3.344472497701645e-05, 3.9733946323394775e-05, 4.60231676697731e-05, 5.231238901615143e-05, 5.8601610362529755e-05, 6.489083170890808e-05, 7.118005305528641e-05, 7.746927440166473e-05, 8.375849574804306e-05, 9.004771709442139e-05, 9.633693844079971e-05, 0.00010262615978717804, 0.00010891538113355637, 0.00011520460247993469, 0.00012149382382631302, 0.00012778304517269135, 0.00013407226651906967, 0.000140361487865448, 0.00014665070921182632, 0.00015293993055820465, 0.00015922915190458298, 0.0001655183732509613, 0.00017180759459733963, 0.00017809681594371796, 0.00018438603729009628, 0.0001906752586364746]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 17.0, 44.0, 75.0, 214.0, 402.0, 832.0, 1822.0, 3908.0, 8562.0, 20869.0, 60488.0, 274251.0, 3577467.0, 164970.0, 45821.0, 17791.0, 8058.0, 3945.0, 1906.0, 984.0, 587.0, 368.0, 216.0, 157.0, 107.0, 84.0, 57.0, 58.0, 24.0, 38.0, 32.0, 16.0, 23.0, 15.0, 15.0, 16.0, 6.0, 8.0, 9.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011146068572998047, -0.0001053977757692337, -9.933486580848694e-05, -9.327195584774017e-05, -8.720904588699341e-05, -8.114613592624664e-05, -7.508322596549988e-05, -6.902031600475311e-05, -6.295740604400635e-05, -5.689449608325958e-05, -5.083158612251282e-05, -4.476867616176605e-05, -3.870576620101929e-05, -3.264285624027252e-05, -2.6579946279525757e-05, -2.0517036318778992e-05, -1.4454126358032227e-05, -8.391216397285461e-06, -2.3283064365386963e-06, 3.734603524208069e-06, 9.797513484954834e-06, 1.58604234457016e-05, 2.1923333406448364e-05, 2.798624336719513e-05, 3.4049153327941895e-05, 4.011206328868866e-05, 4.6174973249435425e-05, 5.223788321018219e-05, 5.8300793170928955e-05, 6.436370313167572e-05, 7.042661309242249e-05, 7.648952305316925e-05, 8.255243301391602e-05, 8.861534297466278e-05, 9.467825293540955e-05, 0.00010074116289615631, 0.00010680407285690308, 0.00011286698281764984, 0.0001189298927783966, 0.00012499280273914337, 0.00013105571269989014, 0.0001371186226606369, 0.00014318153262138367, 0.00014924444258213043, 0.0001553073525428772, 0.00016137026250362396, 0.00016743317246437073, 0.0001734960824251175, 0.00017955899238586426, 0.00018562190234661102, 0.0001916848123073578, 0.00019774772226810455, 0.00020381063222885132, 0.00020987354218959808, 0.00021593645215034485, 0.00022199936211109161, 0.00022806227207183838, 0.00023412518203258514, 0.0002401880919933319, 0.0002462510019540787, 0.00025231391191482544, 0.0002583768218755722, 0.00026443973183631897, 0.00027050264179706573, 0.0002765655517578125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 8.0, 13.0, 10.0, 32.0, 19.0, 50.0, 55.0, 95.0, 96.0, 123.0, 112.0, 76.0, 82.0, 55.0, 43.0, 33.0, 23.0, 14.0, 12.0, 18.0, 6.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8358230590820312e-05, -1.7342157661914825e-05, -1.632608473300934e-05, -1.531001180410385e-05, -1.4293938875198364e-05, -1.3277865946292877e-05, -1.226179301738739e-05, -1.1245720088481903e-05, -1.0229647159576416e-05, -9.213574230670929e-06, -8.197501301765442e-06, -7.181428372859955e-06, -6.165355443954468e-06, -5.149282515048981e-06, -4.133209586143494e-06, -3.1171366572380066e-06, -2.1010637283325195e-06, -1.0849907994270325e-06, -6.891787052154541e-08, 9.471550583839417e-07, 1.9632279872894287e-06, 2.9793009161949158e-06, 3.995373845100403e-06, 5.01144677400589e-06, 6.027519702911377e-06, 7.043592631816864e-06, 8.059665560722351e-06, 9.075738489627838e-06, 1.0091811418533325e-05, 1.1107884347438812e-05, 1.21239572763443e-05, 1.3140030205249786e-05, 1.4156103134155273e-05, 1.517217606306076e-05, 1.6188248991966248e-05, 1.7204321920871735e-05, 1.822039484977722e-05, 1.923646777868271e-05, 2.0252540707588196e-05, 2.1268613636493683e-05, 2.228468656539917e-05, 2.3300759494304657e-05, 2.4316832423210144e-05, 2.533290535211563e-05, 2.6348978281021118e-05, 2.7365051209926605e-05, 2.8381124138832092e-05, 2.939719706773758e-05, 3.0413269996643066e-05, 3.1429342925548553e-05, 3.244541585445404e-05, 3.346148878335953e-05, 3.4477561712265015e-05, 3.54936346411705e-05, 3.650970757007599e-05, 3.7525780498981476e-05, 3.854185342788696e-05, 3.955792635679245e-05, 4.057399928569794e-05, 4.1590072214603424e-05, 4.260614514350891e-05, 4.36222180724144e-05, 4.4638291001319885e-05, 4.565436393022537e-05, 4.667043685913086e-05]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 23.0, 16.0, 25.0, 46.0, 64.0, 101.0, 146.0, 256.0, 316.0, 489.0, 756.0, 1253.0, 1891.0, 3039.0, 5103.0, 8311.0, 14762.0, 26815.0, 51566.0, 106798.0, 290773.0, 2620738.0, 716781.0, 181027.0, 76462.0, 37965.0, 19859.0, 11354.0, 6541.0, 4090.0, 2370.0, 1638.0, 1041.0, 593.0, 398.0, 280.0, 184.0, 127.0, 91.0, 51.0, 39.0, 31.0, 19.0, 14.0, 9.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.934736251831055e-05, -8.662138134241104e-05, -8.389540016651154e-05, -8.116941899061203e-05, -7.844343781471252e-05, -7.571745663881302e-05, -7.299147546291351e-05, -7.026549428701401e-05, -6.75395131111145e-05, -6.4813531935215e-05, -6.208755075931549e-05, -5.9361569583415985e-05, -5.663558840751648e-05, -5.3909607231616974e-05, -5.118362605571747e-05, -4.845764487981796e-05, -4.573166370391846e-05, -4.300568252801895e-05, -4.0279701352119446e-05, -3.755372017621994e-05, -3.4827739000320435e-05, -3.210175782442093e-05, -2.9375776648521423e-05, -2.6649795472621918e-05, -2.3923814296722412e-05, -2.1197833120822906e-05, -1.84718519449234e-05, -1.5745870769023895e-05, -1.301988959312439e-05, -1.0293908417224884e-05, -7.567927241325378e-06, -4.841946065425873e-06, -2.115964889526367e-06, 6.100162863731384e-07, 3.335997462272644e-06, 6.06197863817215e-06, 8.787959814071655e-06, 1.1513940989971161e-05, 1.4239922165870667e-05, 1.6965903341770172e-05, 1.9691884517669678e-05, 2.2417865693569183e-05, 2.514384686946869e-05, 2.7869828045368195e-05, 3.05958092212677e-05, 3.3321790397167206e-05, 3.604777157306671e-05, 3.877375274896622e-05, 4.149973392486572e-05, 4.422571510076523e-05, 4.6951696276664734e-05, 4.967767745256424e-05, 5.2403658628463745e-05, 5.512963980436325e-05, 5.7855620980262756e-05, 6.058160215616226e-05, 6.330758333206177e-05, 6.603356450796127e-05, 6.875954568386078e-05, 7.148552685976028e-05, 7.421150803565979e-05, 7.69374892115593e-05, 7.96634703874588e-05, 8.238945156335831e-05, 8.511543273925781e-05]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 8.0, 13.0, 18.0, 26.0, 14.0, 36.0, 34.0, 49.0, 38.0, 71.0, 79.0, 86.0, 107.0, 143.0, 253.0, 520.0, 1004.0, 583.0, 218.0, 131.0, 105.0, 94.0, 64.0, 70.0, 48.0, 46.0, 38.0, 23.0, 24.0, 22.0, 20.0, 16.0, 7.0, 5.0, 11.0, 13.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-6.777048110961914e-05, -6.586499512195587e-05, -6.39595091342926e-05, -6.205402314662933e-05, -6.0148537158966064e-05, -5.8243051171302795e-05, -5.6337565183639526e-05, -5.443207919597626e-05, -5.252659320831299e-05, -5.062110722064972e-05, -4.871562123298645e-05, -4.681013524532318e-05, -4.490464925765991e-05, -4.299916326999664e-05, -4.1093677282333374e-05, -3.9188191294670105e-05, -3.7282705307006836e-05, -3.537721931934357e-05, -3.34717333316803e-05, -3.156624734401703e-05, -2.966076135635376e-05, -2.775527536869049e-05, -2.584978938102722e-05, -2.3944303393363953e-05, -2.2038817405700684e-05, -2.0133331418037415e-05, -1.8227845430374146e-05, -1.6322359442710876e-05, -1.4416873455047607e-05, -1.2511387467384338e-05, -1.060590147972107e-05, -8.7004154920578e-06, -6.794929504394531e-06, -4.889443516731262e-06, -2.983957529067993e-06, -1.0784715414047241e-06, 8.270144462585449e-07, 2.732500433921814e-06, 4.637986421585083e-06, 6.543472409248352e-06, 8.448958396911621e-06, 1.035444438457489e-05, 1.225993037223816e-05, 1.4165416359901428e-05, 1.6070902347564697e-05, 1.7976388335227966e-05, 1.9881874322891235e-05, 2.1787360310554504e-05, 2.3692846298217773e-05, 2.5598332285881042e-05, 2.750381827354431e-05, 2.940930426120758e-05, 3.131479024887085e-05, 3.322027623653412e-05, 3.512576222419739e-05, 3.703124821186066e-05, 3.8936734199523926e-05, 4.0842220187187195e-05, 4.2747706174850464e-05, 4.465319216251373e-05, 4.6558678150177e-05, 4.846416413784027e-05, 5.036965012550354e-05, 5.227513611316681e-05, 5.418062210083008e-05]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 11.0, 15.0, 37.0, 71.0, 147.0, 290.0, 171.0, 112.0, 60.0, 42.0, 22.0, 15.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004101599333807826, -0.0003774420765694231, -0.00034472421975806355, -0.0003120063338428736, -0.00027928847703151405, -0.0002465706202201545, -0.00021385274885687977, -0.00018113487749360502, -0.0001484170206822455, -0.00011569915659492835, -8.298129250761122e-05, -5.0263428420294076e-05, -1.7545564332976937e-05, 1.5172292478382587e-05, 4.789016384165734e-05, 8.06080352049321e-05, 0.00011332589201629162, 0.00014604374882765114, 0.0001787616201909259, 0.00021147949155420065, 0.0002441973483655602, 0.0002769152051769197, 0.0003096330910921097, 0.0003423509479034692, 0.00037506880471482873, 0.00040778666152618825, 0.0004405045183375478, 0.00047322240425273776, 0.0005059402901679277, 0.0005386581178754568, 0.0005713760037906468, 0.0006040938897058368, 0.0006368117174133658, 0.0006695296033285558, 0.0007022474310360849, 0.0007349653169512749, 0.0007676831446588039, 0.0008004010305739939, 0.0008331189164891839, 0.000865836744196713, 0.000898554630111903, 0.0009312725160270929, 0.000963990343734622, 0.000996708171442151, 0.001029426115565002, 0.001062143943272531, 0.00109486177098006, 0.001127579715102911, 0.00116029754281044, 0.0011930153705179691, 0.00122573331464082, 0.001258451142348349, 0.0012911689700558782, 0.001323886914178729, 0.0013566047418862581, 0.0013893225695937872, 0.0014220403973013163, 0.0014547582250088453, 0.0014874761691316962, 0.0015201939968392253, 0.0015529118245467544, 0.0015856297686696053, 0.0016183475963771343, 0.0016510654240846634, 0.0016837833682075143]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 10.0, 12.0, 17.0, 15.0, 27.0, 26.0, 29.0, 27.0, 27.0, 29.0, 46.0, 43.0, 42.0, 47.0, 50.0, 36.0, 41.0, 53.0, 36.0, 40.0, 37.0, 47.0, 38.0, 43.0, 34.0, 27.0, 21.0, 17.0, 22.0, 7.0, 8.0, 15.0, 6.0, 4.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003261566162109375, -0.00031673070043325424, -0.000307304784655571, -0.0002978788688778877, -0.00028845295310020447, -0.0002790270373225212, -0.00026960112154483795, -0.0002601752057671547, -0.00025074928998947144, -0.00024132337421178818, -0.00023189745843410492, -0.00022247154265642166, -0.0002130456268787384, -0.00020361971110105515, -0.0001941937953233719, -0.00018476787954568863, -0.00017534196376800537, -0.0001659160479903221, -0.00015649013221263885, -0.0001470642164349556, -0.00013763830065727234, -0.00012821238487958908, -0.00011878646910190582, -0.00010936055332422256, -9.99346375465393e-05, -9.050872176885605e-05, -8.108280599117279e-05, -7.165689021348953e-05, -6.223097443580627e-05, -5.2805058658123016e-05, -4.337914288043976e-05, -3.39532271027565e-05, -2.4527311325073242e-05, -1.5101395547389984e-05, -5.675479769706726e-06, 3.750436007976532e-06, 1.317635178565979e-05, 2.2602267563343048e-05, 3.2028183341026306e-05, 4.1454099118709564e-05, 5.088001489639282e-05, 6.030593067407608e-05, 6.973184645175934e-05, 7.91577622294426e-05, 8.858367800712585e-05, 9.800959378480911e-05, 0.00010743550956249237, 0.00011686142534017563, 0.0001262873411178589, 0.00013571325689554214, 0.0001451391726732254, 0.00015456508845090866, 0.00016399100422859192, 0.00017341692000627518, 0.00018284283578395844, 0.0001922687515616417, 0.00020169466733932495, 0.0002111205831170082, 0.00022054649889469147, 0.00022997241467237473, 0.00023939833045005798, 0.00024882424622774124, 0.0002582501620054245, 0.00026767607778310776, 0.000277101993560791]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 15.0, 19.0, 24.0, 29.0, 53.0, 85.0, 127.0, 209.0, 361.0, 549.0, 882.0, 1659.0, 3032.0, 5673.0, 12159.0, 29348.0, 85278.0, 501707.0, 293551.0, 67664.0, 24513.0, 10242.0, 5115.0, 2555.0, 1458.0, 839.0, 549.0, 292.0, 204.0, 110.0, 74.0, 39.0, 29.0, 23.0, 25.0, 15.0, 9.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020742416381835938, -0.000200711190700531, -0.00019399821758270264, -0.00018728524446487427, -0.0001805722713470459, -0.00017385929822921753, -0.00016714632511138916, -0.0001604333519935608, -0.00015372037887573242, -0.00014700740575790405, -0.00014029443264007568, -0.00013358145952224731, -0.00012686848640441895, -0.00012015551328659058, -0.00011344254016876221, -0.00010672956705093384, -0.00010001659393310547, -9.33036208152771e-05, -8.659064769744873e-05, -7.987767457962036e-05, -7.316470146179199e-05, -6.645172834396362e-05, -5.9738755226135254e-05, -5.3025782108306885e-05, -4.6312808990478516e-05, -3.9599835872650146e-05, -3.288686275482178e-05, -2.6173889636993408e-05, -1.946091651916504e-05, -1.274794340133667e-05, -6.034970283508301e-06, 6.780028343200684e-07, 7.3909759521484375e-06, 1.4103949069976807e-05, 2.0816922187805176e-05, 2.7529895305633545e-05, 3.4242868423461914e-05, 4.095584154129028e-05, 4.766881465911865e-05, 5.438178777694702e-05, 6.109476089477539e-05, 6.780773401260376e-05, 7.452070713043213e-05, 8.12336802482605e-05, 8.794665336608887e-05, 9.465962648391724e-05, 0.0001013725996017456, 0.00010808557271957397, 0.00011479854583740234, 0.00012151151895523071, 0.00012822449207305908, 0.00013493746519088745, 0.00014165043830871582, 0.0001483634114265442, 0.00015507638454437256, 0.00016178935766220093, 0.0001685023307800293, 0.00017521530389785767, 0.00018192827701568604, 0.0001886412501335144, 0.00019535422325134277, 0.00020206719636917114, 0.0002087801694869995, 0.00021549314260482788, 0.00022220611572265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 9.0, 13.0, 21.0, 16.0, 22.0, 50.0, 46.0, 65.0, 80.0, 102.0, 96.0, 96.0, 82.0, 65.0, 54.0, 30.0, 37.0, 23.0, 22.0, 12.0, 9.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 7.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.996755599975586e-05, -1.9088387489318848e-05, -1.8209218978881836e-05, -1.7330050468444824e-05, -1.6450881958007812e-05, -1.55717134475708e-05, -1.4692544937133789e-05, -1.3813376426696777e-05, -1.2934207916259766e-05, -1.2055039405822754e-05, -1.1175870895385742e-05, -1.029670238494873e-05, -9.417533874511719e-06, -8.538365364074707e-06, -7.659196853637695e-06, -6.780028343200684e-06, -5.900859832763672e-06, -5.02169132232666e-06, -4.1425228118896484e-06, -3.2633543014526367e-06, -2.384185791015625e-06, -1.5050172805786133e-06, -6.258487701416016e-07, 2.5331974029541016e-07, 1.1324882507324219e-06, 2.0116567611694336e-06, 2.8908252716064453e-06, 3.769993782043457e-06, 4.649162292480469e-06, 5.5283308029174805e-06, 6.407499313354492e-06, 7.286667823791504e-06, 8.165836334228516e-06, 9.045004844665527e-06, 9.924173355102539e-06, 1.080334186553955e-05, 1.1682510375976562e-05, 1.2561678886413574e-05, 1.3440847396850586e-05, 1.4320015907287598e-05, 1.519918441772461e-05, 1.607835292816162e-05, 1.6957521438598633e-05, 1.7836689949035645e-05, 1.8715858459472656e-05, 1.9595026969909668e-05, 2.047419548034668e-05, 2.135336399078369e-05, 2.2232532501220703e-05, 2.3111701011657715e-05, 2.3990869522094727e-05, 2.4870038032531738e-05, 2.574920654296875e-05, 2.6628375053405762e-05, 2.7507543563842773e-05, 2.8386712074279785e-05, 2.9265880584716797e-05, 3.014504909515381e-05, 3.102421760559082e-05, 3.190338611602783e-05, 3.2782554626464844e-05, 3.3661723136901855e-05, 3.454089164733887e-05, 3.542006015777588e-05, 3.629922866821289e-05]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 6.0, 7.0, 9.0, 19.0, 30.0, 36.0, 62.0, 78.0, 115.0, 167.0, 249.0, 359.0, 461.0, 723.0, 1174.0, 1745.0, 2350.0, 3908.0, 6114.0, 9380.0, 15359.0, 25431.0, 43297.0, 78191.0, 156969.0, 362127.0, 153790.0, 76671.0, 42796.0, 25071.0, 15162.0, 9365.0, 5951.0, 3840.0, 2381.0, 1632.0, 1167.0, 759.0, 471.0, 334.0, 263.0, 178.0, 117.0, 72.0, 53.0, 35.0, 36.0, 22.0, 11.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-7.94529914855957e-05, -7.700733840465546e-05, -7.456168532371521e-05, -7.211603224277496e-05, -6.967037916183472e-05, -6.722472608089447e-05, -6.477907299995422e-05, -6.233341991901398e-05, -5.988776683807373e-05, -5.7442113757133484e-05, -5.499646067619324e-05, -5.255080759525299e-05, -5.0105154514312744e-05, -4.76595014333725e-05, -4.521384835243225e-05, -4.2768195271492004e-05, -4.032254219055176e-05, -3.787688910961151e-05, -3.5431236028671265e-05, -3.298558294773102e-05, -3.053992986679077e-05, -2.8094276785850525e-05, -2.564862370491028e-05, -2.3202970623970032e-05, -2.0757317543029785e-05, -1.831166446208954e-05, -1.5866011381149292e-05, -1.3420358300209045e-05, -1.0974705219268799e-05, -8.529052138328552e-06, -6.083399057388306e-06, -3.637745976448059e-06, -1.1920928955078125e-06, 1.253560185432434e-06, 3.6992132663726807e-06, 6.144866347312927e-06, 8.590519428253174e-06, 1.103617250919342e-05, 1.3481825590133667e-05, 1.5927478671073914e-05, 1.837313175201416e-05, 2.0818784832954407e-05, 2.3264437913894653e-05, 2.57100909948349e-05, 2.8155744075775146e-05, 3.060139715671539e-05, 3.304705023765564e-05, 3.5492703318595886e-05, 3.793835639953613e-05, 4.038400948047638e-05, 4.2829662561416626e-05, 4.527531564235687e-05, 4.772096872329712e-05, 5.0166621804237366e-05, 5.261227488517761e-05, 5.505792796611786e-05, 5.7503581047058105e-05, 5.994923412799835e-05, 6.23948872089386e-05, 6.484054028987885e-05, 6.728619337081909e-05, 6.973184645175934e-05, 7.217749953269958e-05, 7.462315261363983e-05, 7.706880569458008e-05]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 13.0, 4.0, 6.0, 10.0, 15.0, 24.0, 21.0, 21.0, 34.0, 25.0, 34.0, 45.0, 35.0, 40.0, 39.0, 45.0, 43.0, 38.0, 56.0, 39.0, 48.0, 46.0, 36.0, 35.0, 44.0, 30.0, 31.0, 16.0, 24.0, 20.0, 13.0, 13.0, 9.0, 9.0, 8.0, 8.0, 9.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.459785461425781e-05, -5.286373198032379e-05, -5.112960934638977e-05, -4.939548671245575e-05, -4.766136407852173e-05, -4.592724144458771e-05, -4.4193118810653687e-05, -4.2458996176719666e-05, -4.0724873542785645e-05, -3.8990750908851624e-05, -3.72566282749176e-05, -3.552250564098358e-05, -3.378838300704956e-05, -3.205426037311554e-05, -3.032013773918152e-05, -2.8586015105247498e-05, -2.6851892471313477e-05, -2.5117769837379456e-05, -2.3383647203445435e-05, -2.1649524569511414e-05, -1.9915401935577393e-05, -1.818127930164337e-05, -1.644715666770935e-05, -1.471303403377533e-05, -1.2978911399841309e-05, -1.1244788765907288e-05, -9.510666131973267e-06, -7.776543498039246e-06, -6.042420864105225e-06, -4.308298230171204e-06, -2.5741755962371826e-06, -8.400529623031616e-07, 8.940696716308594e-07, 2.6281923055648804e-06, 4.362314939498901e-06, 6.096437573432922e-06, 7.830560207366943e-06, 9.564682841300964e-06, 1.1298805475234985e-05, 1.3032928109169006e-05, 1.4767050743103027e-05, 1.650117337703705e-05, 1.823529601097107e-05, 1.996941864490509e-05, 2.170354127883911e-05, 2.3437663912773132e-05, 2.5171786546707153e-05, 2.6905909180641174e-05, 2.8640031814575195e-05, 3.0374154448509216e-05, 3.210827708244324e-05, 3.384239971637726e-05, 3.557652235031128e-05, 3.73106449842453e-05, 3.904476761817932e-05, 4.077889025211334e-05, 4.251301288604736e-05, 4.4247135519981384e-05, 4.5981258153915405e-05, 4.7715380787849426e-05, 4.944950342178345e-05, 5.118362605571747e-05, 5.291774868965149e-05, 5.465187132358551e-05, 5.638599395751953e-05]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 3.0, 9.0, 7.0, 14.0, 12.0, 29.0, 38.0, 45.0, 69.0, 97.0, 150.0, 235.0, 331.0, 654.0, 926.0, 1566.0, 3705.0, 6781.0, 21052.0, 60761.0, 349914.0, 505557.0, 60964.0, 20909.0, 6802.0, 3340.0, 1918.0, 933.0, 671.0, 354.0, 223.0, 143.0, 110.0, 57.0, 53.0, 32.0, 35.0, 20.0, 10.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2195669114589691e-05, -1.181475818157196e-05, -1.143384724855423e-05, -1.1052936315536499e-05, -1.0672025382518768e-05, -1.0291114449501038e-05, -9.910203516483307e-06, -9.529292583465576e-06, -9.148381650447845e-06, -8.767470717430115e-06, -8.386559784412384e-06, -8.005648851394653e-06, -7.624737918376923e-06, -7.243826985359192e-06, -6.862916052341461e-06, -6.4820051193237305e-06, -6.101094186306e-06, -5.720183253288269e-06, -5.339272320270538e-06, -4.958361387252808e-06, -4.577450454235077e-06, -4.196539521217346e-06, -3.8156285881996155e-06, -3.4347176551818848e-06, -3.053806722164154e-06, -2.6728957891464233e-06, -2.2919848561286926e-06, -1.911073923110962e-06, -1.5301629900932312e-06, -1.1492520570755005e-06, -7.683411240577698e-07, -3.8743019104003906e-07, -6.51925802230835e-09, 3.7439167499542236e-07, 7.553026080131531e-07, 1.1362135410308838e-06, 1.5171244740486145e-06, 1.8980354070663452e-06, 2.278946340084076e-06, 2.6598572731018066e-06, 3.0407682061195374e-06, 3.421679139137268e-06, 3.8025900721549988e-06, 4.1835010051727295e-06, 4.56441193819046e-06, 4.945322871208191e-06, 5.326233804225922e-06, 5.707144737243652e-06, 6.088055670261383e-06, 6.468966603279114e-06, 6.8498775362968445e-06, 7.230788469314575e-06, 7.611699402332306e-06, 7.992610335350037e-06, 8.373521268367767e-06, 8.754432201385498e-06, 9.135343134403229e-06, 9.51625406742096e-06, 9.89716500043869e-06, 1.0278075933456421e-05, 1.0658986866474152e-05, 1.1039897799491882e-05, 1.1420808732509613e-05, 1.1801719665527344e-05]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 15.0, 12.0, 18.0, 21.0, 45.0, 67.0, 145.0, 155.0, 208.0, 100.0, 77.0, 38.0, 27.0, 15.0, 16.0, 9.0, 4.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.185604095458984e-06, -4.978850483894348e-06, -4.772096872329712e-06, -4.565343260765076e-06, -4.3585896492004395e-06, -4.151836037635803e-06, -3.945082426071167e-06, -3.7383288145065308e-06, -3.5315752029418945e-06, -3.3248215913772583e-06, -3.118067979812622e-06, -2.911314368247986e-06, -2.7045607566833496e-06, -2.4978071451187134e-06, -2.291053533554077e-06, -2.084299921989441e-06, -1.8775463104248047e-06, -1.6707926988601685e-06, -1.4640390872955322e-06, -1.257285475730896e-06, -1.0505318641662598e-06, -8.437782526016235e-07, -6.370246410369873e-07, -4.302710294723511e-07, -2.2351741790771484e-07, -1.6763806343078613e-08, 1.8998980522155762e-07, 3.9674341678619385e-07, 6.034970283508301e-07, 8.102506399154663e-07, 1.0170042514801025e-06, 1.2237578630447388e-06, 1.430511474609375e-06, 1.6372650861740112e-06, 1.8440186977386475e-06, 2.0507723093032837e-06, 2.25752592086792e-06, 2.464279532432556e-06, 2.6710331439971924e-06, 2.8777867555618286e-06, 3.084540367126465e-06, 3.291293978691101e-06, 3.4980475902557373e-06, 3.7048012018203735e-06, 3.91155481338501e-06, 4.118308424949646e-06, 4.325062036514282e-06, 4.5318156480789185e-06, 4.738569259643555e-06, 4.945322871208191e-06, 5.152076482772827e-06, 5.358830094337463e-06, 5.5655837059021e-06, 5.772337317466736e-06, 5.979090929031372e-06, 6.185844540596008e-06, 6.3925981521606445e-06, 6.599351763725281e-06, 6.806105375289917e-06, 7.012858986854553e-06, 7.2196125984191895e-06, 7.426366209983826e-06, 7.633119821548462e-06, 7.839873433113098e-06, 8.046627044677734e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 4.0, 7.0, 2.0, 6.0, 5.0, 16.0, 17.0, 29.0, 41.0, 56.0, 62.0, 64.0, 118.0, 172.0, 223.0, 327.0, 461.0, 716.0, 1091.0, 1791.0, 2257.0, 4835.0, 9424.0, 20285.0, 51807.0, 191461.0, 559165.0, 128980.0, 39877.0, 13576.0, 9346.0, 4955.0, 2669.0, 1594.0, 962.0, 662.0, 450.0, 279.0, 157.0, 165.0, 109.0, 81.0, 46.0, 45.0, 50.0, 35.0, 15.0, 12.0, 7.0, 7.0, 5.0, 6.0, 8.0, 5.0, 7.0, 2.0, 3.0], "bins": [-7.748603820800781e-06, -7.516704499721527e-06, -7.284805178642273e-06, -7.052905857563019e-06, -6.821006536483765e-06, -6.5891072154045105e-06, -6.357207894325256e-06, -6.125308573246002e-06, -5.893409252166748e-06, -5.661509931087494e-06, -5.42961061000824e-06, -5.197711288928986e-06, -4.9658119678497314e-06, -4.733912646770477e-06, -4.502013325691223e-06, -4.270114004611969e-06, -4.038214683532715e-06, -3.8063153624534607e-06, -3.5744160413742065e-06, -3.3425167202949524e-06, -3.1106173992156982e-06, -2.878718078136444e-06, -2.64681875705719e-06, -2.414919435977936e-06, -2.1830201148986816e-06, -1.9511207938194275e-06, -1.7192214727401733e-06, -1.4873221516609192e-06, -1.255422830581665e-06, -1.0235235095024109e-06, -7.916241884231567e-07, -5.597248673439026e-07, -3.2782554626464844e-07, -9.592622518539429e-08, 1.3597309589385986e-07, 3.67872416973114e-07, 5.997717380523682e-07, 8.316710591316223e-07, 1.0635703802108765e-06, 1.2954697012901306e-06, 1.5273690223693848e-06, 1.759268343448639e-06, 1.991167664527893e-06, 2.2230669856071472e-06, 2.4549663066864014e-06, 2.6868656277656555e-06, 2.9187649488449097e-06, 3.150664269924164e-06, 3.382563591003418e-06, 3.614462912082672e-06, 3.846362233161926e-06, 4.07826155424118e-06, 4.3101608753204346e-06, 4.542060196399689e-06, 4.773959517478943e-06, 5.005858838558197e-06, 5.237758159637451e-06, 5.469657480716705e-06, 5.7015568017959595e-06, 5.933456122875214e-06, 6.165355443954468e-06, 6.397254765033722e-06, 6.629154086112976e-06, 6.86105340719223e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 13.0, 16.0, 27.0, 24.0, 33.0, 59.0, 89.0, 72.0, 117.0, 131.0, 73.0, 94.0, 60.0, 42.0, 20.0, 38.0, 19.0, 13.0, 9.0, 8.0, 5.0, 4.0, 6.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.827976226806641e-06, -4.667788743972778e-06, -4.507601261138916e-06, -4.347413778305054e-06, -4.187226295471191e-06, -4.027038812637329e-06, -3.866851329803467e-06, -3.7066638469696045e-06, -3.546476364135742e-06, -3.38628888130188e-06, -3.2261013984680176e-06, -3.0659139156341553e-06, -2.905726432800293e-06, -2.7455389499664307e-06, -2.5853514671325684e-06, -2.425163984298706e-06, -2.2649765014648438e-06, -2.1047890186309814e-06, -1.944601535797119e-06, -1.7844140529632568e-06, -1.6242265701293945e-06, -1.4640390872955322e-06, -1.30385160446167e-06, -1.1436641216278076e-06, -9.834766387939453e-07, -8.23289155960083e-07, -6.631016731262207e-07, -5.029141902923584e-07, -3.427267074584961e-07, -1.825392246246338e-07, -2.2351741790771484e-08, 1.3783574104309082e-07, 2.980232238769531e-07, 4.5821070671081543e-07, 6.183981895446777e-07, 7.7858567237854e-07, 9.387731552124023e-07, 1.0989606380462646e-06, 1.259148120880127e-06, 1.4193356037139893e-06, 1.5795230865478516e-06, 1.7397105693817139e-06, 1.8998980522155762e-06, 2.0600855350494385e-06, 2.2202730178833008e-06, 2.380460500717163e-06, 2.5406479835510254e-06, 2.7008354663848877e-06, 2.86102294921875e-06, 3.0212104320526123e-06, 3.1813979148864746e-06, 3.341585397720337e-06, 3.5017728805541992e-06, 3.6619603633880615e-06, 3.822147846221924e-06, 3.982335329055786e-06, 4.1425228118896484e-06, 4.302710294723511e-06, 4.462897777557373e-06, 4.623085260391235e-06, 4.783272743225098e-06, 4.94346022605896e-06, 5.103647708892822e-06, 5.2638351917266846e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 8.0, 10.0, 15.0, 18.0, 26.0, 38.0, 56.0, 96.0, 195.0, 183.0, 97.0, 90.0, 47.0, 28.0, 29.0, 11.0, 14.0, 11.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005425370181910694, -0.0005289708497002721, -0.0005154046812094748, -0.0005018385127186775, -0.00048827234422788024, -0.00047470617573708296, -0.0004611400072462857, -0.0004475738387554884, -0.0004340076702646911, -0.00042044150177389383, -0.00040687533328309655, -0.00039330916479229927, -0.000379742996301502, -0.0003661768278107047, -0.0003526106593199074, -0.00033904449082911015, -0.0003254782932344824, -0.0003119121247436851, -0.00029834595625288785, -0.00028477978776209056, -0.0002712136192712933, -0.000257647450780496, -0.0002440812677377835, -0.0002305150992469862, -0.00021694893075618893, -0.00020338276226539165, -0.00018981659377459437, -0.00017625041073188186, -0.00016268424224108458, -0.0001491180737502873, -0.00013555190525949, -0.00012198573676869273, -0.00010841956827789545, -9.485339978709817e-05, -8.128723129630089e-05, -6.772105552954599e-05, -5.415488703874871e-05, -4.058871854795143e-05, -2.7022542781196535e-05, -1.3456374290399253e-05, 1.097942003980279e-07, 1.3675964510184713e-05, 2.7242134819971398e-05, 4.0808306948747486e-05, 5.437447543954477e-05, 6.794064393034205e-05, 8.150681969709694e-05, 9.507298818789423e-05, 0.0001086391566786915, 0.0001222053251694888, 0.00013577149366028607, 0.00014933766215108335, 0.00016290383064188063, 0.0001764699991326779, 0.00019003618217539042, 0.0002036023506661877, 0.00021716851915698498, 0.00023073468764778227, 0.0002443008706904948, 0.00025786703918129206, 0.00027143320767208934, 0.0002849993761628866, 0.0002985655446536839, 0.0003121317131444812, 0.00032569788163527846]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 1.0, 2.0, 4.0, 11.0, 10.0, 15.0, 16.0, 8.0, 21.0, 25.0, 33.0, 22.0, 24.0, 30.0, 41.0, 32.0, 42.0, 45.0, 23.0, 28.0, 38.0, 44.0, 32.0, 38.0, 38.0, 51.0, 42.0, 38.0, 29.0, 30.0, 39.0, 21.0, 26.0, 18.0, 10.0, 15.0, 12.0, 18.0, 9.0, 5.0, 5.0, 6.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00017303228378295898, -0.00016720406711101532, -0.00016137585043907166, -0.000155547633767128, -0.00014971941709518433, -0.00014389120042324066, -0.000138062983751297, -0.00013223476707935333, -0.00012640655040740967, -0.000120578333735466, -0.00011475011706352234, -0.00010892190039157867, -0.00010309368371963501, -9.726546704769135e-05, -9.143725037574768e-05, -8.560903370380402e-05, -7.978081703186035e-05, -7.395260035991669e-05, -6.812438368797302e-05, -6.229616701602936e-05, -5.646795034408569e-05, -5.063973367214203e-05, -4.4811517000198364e-05, -3.89833003282547e-05, -3.3155083656311035e-05, -2.732686698436737e-05, -2.1498650312423706e-05, -1.567043364048004e-05, -9.842216968536377e-06, -4.014000296592712e-06, 1.8142163753509521e-06, 7.642433047294617e-06, 1.3470649719238281e-05, 1.9298866391181946e-05, 2.512708306312561e-05, 3.0955299735069275e-05, 3.678351640701294e-05, 4.2611733078956604e-05, 4.843994975090027e-05, 5.426816642284393e-05, 6.00963830947876e-05, 6.592459976673126e-05, 7.175281643867493e-05, 7.758103311061859e-05, 8.340924978256226e-05, 8.923746645450592e-05, 9.506568312644958e-05, 0.00010089389979839325, 0.00010672211647033691, 0.00011255033314228058, 0.00011837854981422424, 0.0001242067664861679, 0.00013003498315811157, 0.00013586319983005524, 0.0001416914165019989, 0.00014751963317394257, 0.00015334784984588623, 0.0001591760665178299, 0.00016500428318977356, 0.00017083249986171722, 0.0001766607165336609, 0.00018248893320560455, 0.00018831714987754822, 0.00019414536654949188, 0.00019997358322143555]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 10.0, 8.0, 16.0, 19.0, 22.0, 51.0, 89.0, 94.0, 148.0, 186.0, 342.0, 466.0, 695.0, 1090.0, 1614.0, 2610.0, 4054.0, 6725.0, 11962.0, 21340.0, 42173.0, 95352.0, 696152.0, 3071205.0, 132872.0, 48971.0, 23552.0, 12683.0, 7315.0, 4248.0, 2714.0, 1739.0, 1113.0, 771.0, 568.0, 394.0, 258.0, 178.0, 141.0, 115.0, 53.0, 53.0, 28.0, 31.0, 25.0, 15.0, 9.0, 12.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011485815048217773, -0.00011117197573184967, -0.0001074858009815216, -0.00010379962623119354, -0.00010011345148086548, -9.642727673053741e-05, -9.274110198020935e-05, -8.905492722988129e-05, -8.536875247955322e-05, -8.168257772922516e-05, -7.79964029788971e-05, -7.431022822856903e-05, -7.062405347824097e-05, -6.69378787279129e-05, -6.325170397758484e-05, -5.9565529227256775e-05, -5.587935447692871e-05, -5.219317972660065e-05, -4.850700497627258e-05, -4.482083022594452e-05, -4.1134655475616455e-05, -3.744848072528839e-05, -3.376230597496033e-05, -3.0076131224632263e-05, -2.63899564743042e-05, -2.2703781723976135e-05, -1.901760697364807e-05, -1.5331432223320007e-05, -1.1645257472991943e-05, -7.95908272266388e-06, -4.2729079723358154e-06, -5.867332220077515e-07, 3.0994415283203125e-06, 6.7856162786483765e-06, 1.047179102897644e-05, 1.4157965779304504e-05, 1.784414052963257e-05, 2.1530315279960632e-05, 2.5216490030288696e-05, 2.890266478061676e-05, 3.2588839530944824e-05, 3.627501428127289e-05, 3.996118903160095e-05, 4.3647363781929016e-05, 4.733353853225708e-05, 5.1019713282585144e-05, 5.470588803291321e-05, 5.839206278324127e-05, 6.207823753356934e-05, 6.57644122838974e-05, 6.945058703422546e-05, 7.313676178455353e-05, 7.682293653488159e-05, 8.050911128520966e-05, 8.419528603553772e-05, 8.788146078586578e-05, 9.156763553619385e-05, 9.525381028652191e-05, 9.893998503684998e-05, 0.00010262615978717804, 0.0001063123345375061, 0.00010999850928783417, 0.00011368468403816223, 0.0001173708587884903, 0.00012105703353881836]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 12.0, 10.0, 11.0, 7.0, 17.0, 27.0, 32.0, 37.0, 43.0, 46.0, 59.0, 77.0, 77.0, 85.0, 83.0, 83.0, 63.0, 37.0, 49.0, 23.0, 21.0, 20.0, 20.0, 13.0, 7.0, 12.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3543834686279297e-05, -2.2768042981624603e-05, -2.199225127696991e-05, -2.1216459572315216e-05, -2.0440667867660522e-05, -1.966487616300583e-05, -1.8889084458351135e-05, -1.811329275369644e-05, -1.7337501049041748e-05, -1.6561709344387054e-05, -1.578591763973236e-05, -1.5010125935077667e-05, -1.4234334230422974e-05, -1.345854252576828e-05, -1.2682750821113586e-05, -1.1906959116458893e-05, -1.11311674118042e-05, -1.0355375707149506e-05, -9.579584002494812e-06, -8.803792297840118e-06, -8.028000593185425e-06, -7.252208888530731e-06, -6.476417183876038e-06, -5.700625479221344e-06, -4.92483377456665e-06, -4.149042069911957e-06, -3.373250365257263e-06, -2.5974586606025696e-06, -1.821666955947876e-06, -1.0458752512931824e-06, -2.7008354663848877e-07, 5.057081580162048e-07, 1.2814998626708984e-06, 2.057291567325592e-06, 2.8330832719802856e-06, 3.6088749766349792e-06, 4.384666681289673e-06, 5.1604583859443665e-06, 5.93625009059906e-06, 6.712041795253754e-06, 7.487833499908447e-06, 8.263625204563141e-06, 9.039416909217834e-06, 9.815208613872528e-06, 1.0591000318527222e-05, 1.1366792023181915e-05, 1.2142583727836609e-05, 1.2918375432491302e-05, 1.3694167137145996e-05, 1.446995884180069e-05, 1.5245750546455383e-05, 1.6021542251110077e-05, 1.679733395576477e-05, 1.7573125660419464e-05, 1.8348917365074158e-05, 1.912470906972885e-05, 1.9900500774383545e-05, 2.067629247903824e-05, 2.1452084183692932e-05, 2.2227875888347626e-05, 2.300366759300232e-05, 2.3779459297657013e-05, 2.4555251002311707e-05, 2.53310427069664e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 4.0, 6.0, 6.0, 9.0, 11.0, 22.0, 24.0, 38.0, 62.0, 83.0, 113.0, 188.0, 228.0, 368.0, 559.0, 821.0, 1311.0, 1849.0, 2883.0, 4431.0, 7010.0, 11273.0, 18501.0, 30776.0, 54791.0, 106288.0, 276662.0, 2594066.0, 730286.0, 168885.0, 76874.0, 41392.0, 24200.0, 14706.0, 8968.0, 5703.0, 3642.0, 2410.0, 1651.0, 1036.0, 691.0, 445.0, 323.0, 227.0, 148.0, 92.0, 74.0, 59.0, 24.0, 28.0, 10.0, 13.0, 13.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0], "bins": [-6.604194641113281e-05, -6.396323442459106e-05, -6.188452243804932e-05, -5.980581045150757e-05, -5.772709846496582e-05, -5.564838647842407e-05, -5.3569674491882324e-05, -5.1490962505340576e-05, -4.941225051879883e-05, -4.733353853225708e-05, -4.525482654571533e-05, -4.3176114559173584e-05, -4.1097402572631836e-05, -3.901869058609009e-05, -3.693997859954834e-05, -3.486126661300659e-05, -3.2782554626464844e-05, -3.0703842639923096e-05, -2.8625130653381348e-05, -2.65464186668396e-05, -2.446770668029785e-05, -2.2388994693756104e-05, -2.0310282707214355e-05, -1.8231570720672607e-05, -1.615285873413086e-05, -1.4074146747589111e-05, -1.1995434761047363e-05, -9.916722774505615e-06, -7.838010787963867e-06, -5.759298801422119e-06, -3.680586814880371e-06, -1.601874828338623e-06, 4.76837158203125e-07, 2.555549144744873e-06, 4.634261131286621e-06, 6.712973117828369e-06, 8.791685104370117e-06, 1.0870397090911865e-05, 1.2949109077453613e-05, 1.5027821063995361e-05, 1.710653305053711e-05, 1.9185245037078857e-05, 2.1263957023620605e-05, 2.3342669010162354e-05, 2.54213809967041e-05, 2.750009298324585e-05, 2.9578804969787598e-05, 3.1657516956329346e-05, 3.3736228942871094e-05, 3.581494092941284e-05, 3.789365291595459e-05, 3.997236490249634e-05, 4.2051076889038086e-05, 4.4129788875579834e-05, 4.620850086212158e-05, 4.828721284866333e-05, 5.036592483520508e-05, 5.2444636821746826e-05, 5.4523348808288574e-05, 5.660206079483032e-05, 5.868077278137207e-05, 6.075948476791382e-05, 6.283819675445557e-05, 6.491690874099731e-05, 6.699562072753906e-05]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 15.0, 14.0, 12.0, 18.0, 16.0, 27.0, 34.0, 35.0, 49.0, 52.0, 72.0, 83.0, 118.0, 165.0, 340.0, 895.0, 956.0, 374.0, 170.0, 89.0, 84.0, 75.0, 50.0, 44.0, 49.0, 31.0, 41.0, 27.0, 21.0, 23.0, 18.0, 12.0, 13.0, 11.0, 7.0, 3.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.638599395751953e-05, -5.462765693664551e-05, -5.2869319915771484e-05, -5.111098289489746e-05, -4.935264587402344e-05, -4.7594308853149414e-05, -4.583597183227539e-05, -4.407763481140137e-05, -4.2319297790527344e-05, -4.056096076965332e-05, -3.88026237487793e-05, -3.7044286727905273e-05, -3.528594970703125e-05, -3.3527612686157227e-05, -3.17692756652832e-05, -3.001093864440918e-05, -2.8252601623535156e-05, -2.6494264602661133e-05, -2.473592758178711e-05, -2.2977590560913086e-05, -2.1219253540039062e-05, -1.946091651916504e-05, -1.7702579498291016e-05, -1.5944242477416992e-05, -1.4185905456542969e-05, -1.2427568435668945e-05, -1.0669231414794922e-05, -8.910894393920898e-06, -7.152557373046875e-06, -5.3942203521728516e-06, -3.635883331298828e-06, -1.8775463104248047e-06, -1.1920928955078125e-07, 1.6391277313232422e-06, 3.3974647521972656e-06, 5.155801773071289e-06, 6.9141387939453125e-06, 8.672475814819336e-06, 1.043081283569336e-05, 1.2189149856567383e-05, 1.3947486877441406e-05, 1.570582389831543e-05, 1.7464160919189453e-05, 1.9222497940063477e-05, 2.09808349609375e-05, 2.2739171981811523e-05, 2.4497509002685547e-05, 2.625584602355957e-05, 2.8014183044433594e-05, 2.9772520065307617e-05, 3.153085708618164e-05, 3.3289194107055664e-05, 3.504753112792969e-05, 3.680586814880371e-05, 3.8564205169677734e-05, 4.032254219055176e-05, 4.208087921142578e-05, 4.3839216232299805e-05, 4.559755325317383e-05, 4.735589027404785e-05, 4.9114227294921875e-05, 5.08725643157959e-05, 5.263090133666992e-05, 5.4389238357543945e-05, 5.614757537841797e-05]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 8.0, 8.0, 12.0, 11.0, 21.0, 30.0, 37.0, 52.0, 85.0, 117.0, 121.0, 94.0, 78.0, 62.0, 68.0, 32.0, 29.0, 28.0, 25.0, 9.0, 13.0, 8.0, 6.0, 9.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002769384882412851, -0.0002659406163729727, -0.00025494274450466037, -0.000243944872636348, -0.00023294700076803565, -0.0002219491288997233, -0.00021095127158332616, -0.0001999533997150138, -0.00018895552784670144, -0.00017795765597838908, -0.00016695978411007673, -0.0001559619267936796, -0.00014496405492536724, -0.00013396618305705488, -0.00012296831118874252, -0.00011197043932043016, -0.0001009725674521178, -8.997469558380544e-05, -7.897682371549308e-05, -6.797895912313834e-05, -5.698108725482598e-05, -4.598321538651362e-05, -3.4985350794158876e-05, -2.3987478925846517e-05, -1.2989607057534158e-05, -1.991737008211203e-06, 9.006133041111752e-06, 2.0004001271445304e-05, 3.100187313975766e-05, 4.199974500807002e-05, 5.2997609600424767e-05, 6.399548146873713e-05, 7.499335333704948e-05, 8.599122520536184e-05, 9.69890970736742e-05, 0.00010798696166602895, 0.0001189848335343413, 0.00012998271267861128, 0.0001409805699950084, 0.00015197844186332077, 0.00016297631373163313, 0.00017397418559994549, 0.00018497205746825784, 0.00019596991478465497, 0.00020696778665296733, 0.0002179656585212797, 0.00022896353038959205, 0.0002399614022579044, 0.00025095927412621677, 0.00026195714599452913, 0.0002729550178628415, 0.00028395288973115385, 0.0002949507615994662, 0.00030594863346777856, 0.00031694647623226047, 0.0003279443481005728, 0.0003389422199688852, 0.00034994009183719754, 0.0003609379637055099, 0.00037193583557382226, 0.0003829337074421346, 0.000393931579310447, 0.00040492945117875934, 0.0004159273230470717, 0.00042692519491538405]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 0.0, 3.0, 6.0, 14.0, 10.0, 9.0, 15.0, 19.0, 21.0, 15.0, 26.0, 33.0, 26.0, 39.0, 44.0, 35.0, 35.0, 47.0, 38.0, 37.0, 44.0, 34.0, 45.0, 29.0, 35.0, 44.0, 36.0, 30.0, 28.0, 27.0, 20.0, 18.0, 14.0, 22.0, 19.0, 12.0, 10.0, 15.0, 6.0, 11.0, 6.0, 12.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00018846988677978516, -0.00018220487982034683, -0.0001759398728609085, -0.00016967486590147018, -0.00016340985894203186, -0.00015714485198259354, -0.0001508798450231552, -0.0001446148380637169, -0.00013834983110427856, -0.00013208482414484024, -0.00012581981718540192, -0.00011955481022596359, -0.00011328980326652527, -0.00010702479630708694, -0.00010075978934764862, -9.44947823882103e-05, -8.822977542877197e-05, -8.196476846933365e-05, -7.569976150989532e-05, -6.9434754550457e-05, -6.316974759101868e-05, -5.690474063158035e-05, -5.063973367214203e-05, -4.4374726712703705e-05, -3.810971975326538e-05, -3.184471279382706e-05, -2.5579705834388733e-05, -1.931469887495041e-05, -1.3049691915512085e-05, -6.784684956073761e-06, -5.19677996635437e-07, 5.745328962802887e-06, 1.2010335922241211e-05, 1.8275342881679535e-05, 2.454034984111786e-05, 3.080535680055618e-05, 3.707036375999451e-05, 4.333537071943283e-05, 4.9600377678871155e-05, 5.586538463830948e-05, 6.21303915977478e-05, 6.839539855718613e-05, 7.466040551662445e-05, 8.092541247606277e-05, 8.71904194355011e-05, 9.345542639493942e-05, 9.972043335437775e-05, 0.00010598544031381607, 0.0001122504472732544, 0.00011851545423269272, 0.00012478046119213104, 0.00013104546815156937, 0.0001373104751110077, 0.00014357548207044601, 0.00014984048902988434, 0.00015610549598932266, 0.00016237050294876099, 0.0001686355099081993, 0.00017490051686763763, 0.00018116552382707596, 0.00018743053078651428, 0.0001936955377459526, 0.00019996054470539093, 0.00020622555166482925, 0.00021249055862426758]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 11.0, 12.0, 22.0, 23.0, 37.0, 34.0, 68.0, 93.0, 118.0, 161.0, 258.0, 380.0, 578.0, 870.0, 1286.0, 2241.0, 4046.0, 7428.0, 15067.0, 36607.0, 104052.0, 538670.0, 227321.0, 61187.0, 23875.0, 10501.0, 5660.0, 3005.0, 1687.0, 1038.0, 694.0, 450.0, 323.0, 213.0, 144.0, 118.0, 68.0, 47.0, 30.0, 30.0, 21.0, 13.0, 13.0, 7.0, 7.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.0001709461212158203, -0.0001657288521528244, -0.0001605115830898285, -0.00015529431402683258, -0.00015007704496383667, -0.00014485977590084076, -0.00013964250683784485, -0.00013442523777484894, -0.00012920796871185303, -0.00012399069964885712, -0.0001187734305858612, -0.0001135561615228653, -0.00010833889245986938, -0.00010312162339687347, -9.790435433387756e-05, -9.268708527088165e-05, -8.746981620788574e-05, -8.225254714488983e-05, -7.703527808189392e-05, -7.181800901889801e-05, -6.66007399559021e-05, -6.138347089290619e-05, -5.616620182991028e-05, -5.094893276691437e-05, -4.573166370391846e-05, -4.0514394640922546e-05, -3.5297125577926636e-05, -3.0079856514930725e-05, -2.4862587451934814e-05, -1.9645318388938904e-05, -1.4428049325942993e-05, -9.210780262947083e-06, -3.993511199951172e-06, 1.2237578630447388e-06, 6.441026926040649e-06, 1.165829598903656e-05, 1.687556505203247e-05, 2.209283411502838e-05, 2.7310103178024292e-05, 3.25273722410202e-05, 3.774464130401611e-05, 4.2961910367012024e-05, 4.8179179430007935e-05, 5.3396448493003845e-05, 5.8613717555999756e-05, 6.383098661899567e-05, 6.904825568199158e-05, 7.426552474498749e-05, 7.94827938079834e-05, 8.470006287097931e-05, 8.991733193397522e-05, 9.513460099697113e-05, 0.00010035187005996704, 0.00010556913912296295, 0.00011078640818595886, 0.00011600367724895477, 0.00012122094631195068, 0.0001264382153749466, 0.0001316554844379425, 0.00013687275350093842, 0.00014209002256393433, 0.00014730729162693024, 0.00015252456068992615, 0.00015774182975292206, 0.00016295909881591797]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 9.0, 19.0, 19.0, 28.0, 36.0, 42.0, 54.0, 61.0, 109.0, 83.0, 105.0, 97.0, 73.0, 58.0, 47.0, 40.0, 26.0, 20.0, 16.0, 8.0, 10.0, 5.0, 3.0, 1.0, 5.0, 3.0, 0.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181529998779297e-05, -2.095010131597519e-05, -2.008490264415741e-05, -1.921970397233963e-05, -1.835450530052185e-05, -1.748930662870407e-05, -1.662410795688629e-05, -1.5758909285068512e-05, -1.4893710613250732e-05, -1.4028511941432953e-05, -1.3163313269615173e-05, -1.2298114597797394e-05, -1.1432915925979614e-05, -1.0567717254161835e-05, -9.702518582344055e-06, -8.837319910526276e-06, -7.972121238708496e-06, -7.1069225668907166e-06, -6.241723895072937e-06, -5.3765252232551575e-06, -4.511326551437378e-06, -3.6461278796195984e-06, -2.780929207801819e-06, -1.9157305359840393e-06, -1.0505318641662598e-06, -1.8533319234848022e-07, 6.798654794692993e-07, 1.5450641512870789e-06, 2.4102628231048584e-06, 3.275461494922638e-06, 4.1406601667404175e-06, 5.005858838558197e-06, 5.8710575103759766e-06, 6.736256182193756e-06, 7.601454854011536e-06, 8.466653525829315e-06, 9.331852197647095e-06, 1.0197050869464874e-05, 1.1062249541282654e-05, 1.1927448213100433e-05, 1.2792646884918213e-05, 1.3657845556735992e-05, 1.4523044228553772e-05, 1.538824290037155e-05, 1.625344157218933e-05, 1.711864024400711e-05, 1.798383891582489e-05, 1.884903758764267e-05, 1.971423625946045e-05, 2.057943493127823e-05, 2.1444633603096008e-05, 2.2309832274913788e-05, 2.3175030946731567e-05, 2.4040229618549347e-05, 2.4905428290367126e-05, 2.5770626962184906e-05, 2.6635825634002686e-05, 2.7501024305820465e-05, 2.8366222977638245e-05, 2.9231421649456024e-05, 3.0096620321273804e-05, 3.096181899309158e-05, 3.182701766490936e-05, 3.269221633672714e-05, 3.355741500854492e-05]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 4.0, 11.0, 12.0, 19.0, 26.0, 29.0, 49.0, 89.0, 84.0, 159.0, 178.0, 288.0, 401.0, 557.0, 792.0, 1172.0, 1563.0, 2365.0, 3283.0, 4720.0, 6764.0, 10127.0, 14106.0, 21281.0, 30310.0, 47786.0, 74871.0, 142927.0, 291775.0, 157443.0, 80883.0, 50744.0, 32048.0, 22454.0, 14919.0, 10657.0, 7101.0, 5052.0, 3392.0, 2413.0, 1711.0, 1170.0, 810.0, 588.0, 427.0, 281.0, 231.0, 141.0, 103.0, 65.0, 60.0, 39.0, 24.0, 24.0, 14.0, 6.0, 3.0, 7.0, 3.0, 3.0, 1.0], "bins": [-5.549192428588867e-05, -5.373358726501465e-05, -5.1975250244140625e-05, -5.02169132232666e-05, -4.845857620239258e-05, -4.6700239181518555e-05, -4.494190216064453e-05, -4.318356513977051e-05, -4.1425228118896484e-05, -3.966689109802246e-05, -3.790855407714844e-05, -3.6150217056274414e-05, -3.439188003540039e-05, -3.263354301452637e-05, -3.0875205993652344e-05, -2.911686897277832e-05, -2.7358531951904297e-05, -2.5600194931030273e-05, -2.384185791015625e-05, -2.2083520889282227e-05, -2.0325183868408203e-05, -1.856684684753418e-05, -1.6808509826660156e-05, -1.5050172805786133e-05, -1.329183578491211e-05, -1.1533498764038086e-05, -9.775161743164062e-06, -8.016824722290039e-06, -6.258487701416016e-06, -4.500150680541992e-06, -2.7418136596679688e-06, -9.834766387939453e-07, 7.748603820800781e-07, 2.5331974029541016e-06, 4.291534423828125e-06, 6.0498714447021484e-06, 7.808208465576172e-06, 9.566545486450195e-06, 1.1324882507324219e-05, 1.3083219528198242e-05, 1.4841556549072266e-05, 1.659989356994629e-05, 1.8358230590820312e-05, 2.0116567611694336e-05, 2.187490463256836e-05, 2.3633241653442383e-05, 2.5391578674316406e-05, 2.714991569519043e-05, 2.8908252716064453e-05, 3.0666589736938477e-05, 3.24249267578125e-05, 3.4183263778686523e-05, 3.594160079956055e-05, 3.769993782043457e-05, 3.9458274841308594e-05, 4.121661186218262e-05, 4.297494888305664e-05, 4.4733285903930664e-05, 4.649162292480469e-05, 4.824995994567871e-05, 5.0008296966552734e-05, 5.176663398742676e-05, 5.352497100830078e-05, 5.5283308029174805e-05, 5.704164505004883e-05]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 8.0, 5.0, 7.0, 6.0, 8.0, 13.0, 15.0, 16.0, 17.0, 14.0, 25.0, 25.0, 12.0, 31.0, 18.0, 31.0, 27.0, 36.0, 42.0, 34.0, 38.0, 31.0, 32.0, 36.0, 46.0, 33.0, 51.0, 34.0, 34.0, 30.0, 19.0, 29.0, 19.0, 25.0, 19.0, 22.0, 26.0, 11.0, 10.0, 15.0, 10.0, 9.0, 12.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.404783248901367e-05, -4.268251359462738e-05, -4.131719470024109e-05, -3.99518758058548e-05, -3.8586556911468506e-05, -3.7221238017082214e-05, -3.585591912269592e-05, -3.449060022830963e-05, -3.312528133392334e-05, -3.175996243953705e-05, -3.0394643545150757e-05, -2.9029324650764465e-05, -2.7664005756378174e-05, -2.6298686861991882e-05, -2.493336796760559e-05, -2.35680490732193e-05, -2.2202730178833008e-05, -2.0837411284446716e-05, -1.9472092390060425e-05, -1.8106773495674133e-05, -1.6741454601287842e-05, -1.537613570690155e-05, -1.4010816812515259e-05, -1.2645497918128967e-05, -1.1280179023742676e-05, -9.914860129356384e-06, -8.549541234970093e-06, -7.184222340583801e-06, -5.81890344619751e-06, -4.453584551811218e-06, -3.0882656574249268e-06, -1.7229467630386353e-06, -3.5762786865234375e-07, 1.0076910257339478e-06, 2.3730099201202393e-06, 3.7383288145065308e-06, 5.103647708892822e-06, 6.468966603279114e-06, 7.834285497665405e-06, 9.199604392051697e-06, 1.0564923286437988e-05, 1.193024218082428e-05, 1.3295561075210571e-05, 1.4660879969596863e-05, 1.6026198863983154e-05, 1.7391517758369446e-05, 1.8756836652755737e-05, 2.012215554714203e-05, 2.148747444152832e-05, 2.2852793335914612e-05, 2.4218112230300903e-05, 2.5583431124687195e-05, 2.6948750019073486e-05, 2.8314068913459778e-05, 2.967938780784607e-05, 3.104470670223236e-05, 3.241002559661865e-05, 3.3775344491004944e-05, 3.5140663385391235e-05, 3.650598227977753e-05, 3.787130117416382e-05, 3.923662006855011e-05, 4.06019389629364e-05, 4.196725785732269e-05, 4.3332576751708984e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 11.0, 16.0, 13.0, 20.0, 15.0, 59.0, 74.0, 73.0, 123.0, 108.0, 235.0, 350.0, 355.0, 734.0, 1150.0, 1122.0, 2609.0, 2800.0, 6717.0, 13339.0, 16219.0, 50110.0, 72002.0, 274540.0, 377254.0, 102539.0, 67860.0, 21069.0, 16809.0, 8546.0, 3356.0, 3163.0, 1370.0, 1358.0, 811.0, 394.0, 407.0, 238.0, 122.0, 132.0, 56.0, 77.0, 53.0, 33.0, 26.0, 22.0, 27.0, 8.0, 6.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.0067901611328125e-06, -4.851259291172028e-06, -4.695728421211243e-06, -4.540197551250458e-06, -4.384666681289673e-06, -4.229135811328888e-06, -4.073604941368103e-06, -3.918074071407318e-06, -3.762543201446533e-06, -3.6070123314857483e-06, -3.4514814615249634e-06, -3.2959505915641785e-06, -3.1404197216033936e-06, -2.9848888516426086e-06, -2.8293579816818237e-06, -2.673827111721039e-06, -2.518296241760254e-06, -2.362765371799469e-06, -2.207234501838684e-06, -2.051703631877899e-06, -1.8961727619171143e-06, -1.7406418919563293e-06, -1.5851110219955444e-06, -1.4295801520347595e-06, -1.2740492820739746e-06, -1.1185184121131897e-06, -9.629875421524048e-07, -8.074566721916199e-07, -6.51925802230835e-07, -4.9639493227005e-07, -3.4086406230926514e-07, -1.8533319234848022e-07, -2.9802322387695312e-08, 1.257285475730896e-07, 2.812594175338745e-07, 4.367902874946594e-07, 5.923211574554443e-07, 7.478520274162292e-07, 9.033828973770142e-07, 1.058913767337799e-06, 1.214444637298584e-06, 1.369975507259369e-06, 1.5255063772201538e-06, 1.6810372471809387e-06, 1.8365681171417236e-06, 1.9920989871025085e-06, 2.1476298570632935e-06, 2.3031607270240784e-06, 2.4586915969848633e-06, 2.614222466945648e-06, 2.769753336906433e-06, 2.925284206867218e-06, 3.080815076828003e-06, 3.236345946788788e-06, 3.3918768167495728e-06, 3.5474076867103577e-06, 3.7029385566711426e-06, 3.8584694266319275e-06, 4.014000296592712e-06, 4.169531166553497e-06, 4.325062036514282e-06, 4.480592906475067e-06, 4.636123776435852e-06, 4.791654646396637e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 6.0, 2.0, 4.0, 5.0, 18.0, 19.0, 20.0, 21.0, 34.0, 36.0, 35.0, 83.0, 42.0, 48.0, 55.0, 55.0, 54.0, 48.0, 106.0, 55.0, 34.0, 39.0, 38.0, 31.0, 24.0, 40.0, 14.0, 4.0, 4.0, 5.0, 5.0, 3.0, 10.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.196989953517914e-06, -2.129003405570984e-06, -2.061016857624054e-06, -1.993030309677124e-06, -1.925043761730194e-06, -1.8570572137832642e-06, -1.7890706658363342e-06, -1.7210841178894043e-06, -1.6530975699424744e-06, -1.5851110219955444e-06, -1.5171244740486145e-06, -1.4491379261016846e-06, -1.3811513781547546e-06, -1.3131648302078247e-06, -1.2451782822608948e-06, -1.1771917343139648e-06, -1.109205186367035e-06, -1.041218638420105e-06, -9.73232090473175e-07, -9.052455425262451e-07, -8.372589945793152e-07, -7.692724466323853e-07, -7.012858986854553e-07, -6.332993507385254e-07, -5.653128027915955e-07, -4.973262548446655e-07, -4.293397068977356e-07, -3.6135315895080566e-07, -2.9336661100387573e-07, -2.253800630569458e-07, -1.5739351511001587e-07, -8.940696716308594e-08, -2.1420419216156006e-08, 4.6566128730773926e-08, 1.1455267667770386e-07, 1.825392246246338e-07, 2.505257725715637e-07, 3.1851232051849365e-07, 3.864988684654236e-07, 4.544854164123535e-07, 5.224719643592834e-07, 5.904585123062134e-07, 6.584450602531433e-07, 7.264316082000732e-07, 7.944181561470032e-07, 8.624047040939331e-07, 9.30391252040863e-07, 9.98377799987793e-07, 1.066364347934723e-06, 1.1343508958816528e-06, 1.2023374438285828e-06, 1.2703239917755127e-06, 1.3383105397224426e-06, 1.4062970876693726e-06, 1.4742836356163025e-06, 1.5422701835632324e-06, 1.6102567315101624e-06, 1.6782432794570923e-06, 1.7462298274040222e-06, 1.8142163753509521e-06, 1.882202923297882e-06, 1.950189471244812e-06, 2.018176019191742e-06, 2.086162567138672e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 5.0, 10.0, 4.0, 3.0, 16.0, 16.0, 43.0, 49.0, 72.0, 96.0, 270.0, 329.0, 492.0, 854.0, 1373.0, 3743.0, 5892.0, 12295.0, 29362.0, 77509.0, 501755.0, 281617.0, 77840.0, 29007.0, 15002.0, 4795.0, 2529.0, 1423.0, 834.0, 568.0, 237.0, 183.0, 103.0, 77.0, 39.0, 34.0, 22.0, 13.0, 11.0, 13.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.318092346191406e-06, -6.126239895820618e-06, -5.934387445449829e-06, -5.7425349950790405e-06, -5.550682544708252e-06, -5.358830094337463e-06, -5.166977643966675e-06, -4.975125193595886e-06, -4.783272743225098e-06, -4.591420292854309e-06, -4.3995678424835205e-06, -4.207715392112732e-06, -4.015862941741943e-06, -3.824010491371155e-06, -3.632158041000366e-06, -3.4403055906295776e-06, -3.248453140258789e-06, -3.0566006898880005e-06, -2.864748239517212e-06, -2.6728957891464233e-06, -2.4810433387756348e-06, -2.289190888404846e-06, -2.0973384380340576e-06, -1.905485987663269e-06, -1.7136335372924805e-06, -1.521781086921692e-06, -1.3299286365509033e-06, -1.1380761861801147e-06, -9.462237358093262e-07, -7.543712854385376e-07, -5.62518835067749e-07, -3.7066638469696045e-07, -1.7881393432617188e-07, 1.30385160446167e-08, 2.0489096641540527e-07, 3.9674341678619385e-07, 5.885958671569824e-07, 7.80448317527771e-07, 9.723007678985596e-07, 1.1641532182693481e-06, 1.3560056686401367e-06, 1.5478581190109253e-06, 1.7397105693817139e-06, 1.9315630197525024e-06, 2.123415470123291e-06, 2.3152679204940796e-06, 2.507120370864868e-06, 2.6989728212356567e-06, 2.8908252716064453e-06, 3.082677721977234e-06, 3.2745301723480225e-06, 3.466382622718811e-06, 3.6582350730895996e-06, 3.850087523460388e-06, 4.041939973831177e-06, 4.233792424201965e-06, 4.425644874572754e-06, 4.6174973249435425e-06, 4.809349775314331e-06, 5.00120222568512e-06, 5.193054676055908e-06, 5.384907126426697e-06, 5.576759576797485e-06, 5.768612027168274e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 13.0, 12.0, 22.0, 33.0, 50.0, 28.0, 56.0, 60.0, 87.0, 95.0, 96.0, 73.0, 67.0, 71.0, 27.0, 45.0, 33.0, 38.0, 19.0, 13.0, 15.0, 5.0, 6.0, 0.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5099143385887146e-06, -2.3972243070602417e-06, -2.284534275531769e-06, -2.171844244003296e-06, -2.059154212474823e-06, -1.94646418094635e-06, -1.8337741494178772e-06, -1.7210841178894043e-06, -1.6083940863609314e-06, -1.4957040548324585e-06, -1.3830140233039856e-06, -1.2703239917755127e-06, -1.1576339602470398e-06, -1.044943928718567e-06, -9.32253897190094e-07, -8.195638656616211e-07, -7.068738341331482e-07, -5.941838026046753e-07, -4.814937710762024e-07, -3.688037395477295e-07, -2.561137080192566e-07, -1.434236764907837e-07, -3.073364496231079e-08, 8.195638656616211e-08, 1.94646418094635e-07, 3.073364496231079e-07, 4.200264811515808e-07, 5.327165126800537e-07, 6.454065442085266e-07, 7.580965757369995e-07, 8.707866072654724e-07, 9.834766387939453e-07, 1.0961666703224182e-06, 1.2088567018508911e-06, 1.321546733379364e-06, 1.434236764907837e-06, 1.5469267964363098e-06, 1.6596168279647827e-06, 1.7723068594932556e-06, 1.8849968910217285e-06, 1.9976869225502014e-06, 2.1103769540786743e-06, 2.2230669856071472e-06, 2.33575701713562e-06, 2.448447048664093e-06, 2.561137080192566e-06, 2.673827111721039e-06, 2.7865171432495117e-06, 2.8992071747779846e-06, 3.0118972063064575e-06, 3.1245872378349304e-06, 3.2372772693634033e-06, 3.3499673008918762e-06, 3.462657332420349e-06, 3.575347363948822e-06, 3.688037395477295e-06, 3.800727427005768e-06, 3.913417458534241e-06, 4.026107490062714e-06, 4.1387975215911865e-06, 4.2514875531196594e-06, 4.364177584648132e-06, 4.476867616176605e-06, 4.589557647705078e-06]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 14.0, 16.0, 34.0, 69.0, 112.0, 278.0, 165.0, 105.0, 59.0, 47.0, 31.0, 20.0, 18.0, 11.0, 8.0, 2.0, 5.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000478080241009593, -0.0004634204087778926, -0.00044876057654619217, -0.00043410074431449175, -0.00041944091208279133, -0.0004047810798510909, -0.0003901212476193905, -0.0003754613862838596, -0.0003608015540521592, -0.00034614172182045877, -0.00033148188958875835, -0.00031682205735705793, -0.0003021622251253575, -0.00028750236378982663, -0.0002728425315581262, -0.0002581826993264258, -0.0002435228816466406, -0.00022886304941494018, -0.00021420321718323976, -0.0001995433703996241, -0.0001848835381679237, -0.00017022370593622327, -0.00015556387370452285, -0.00014090404147282243, -0.000126244209241122, -0.00011158437700942159, -9.692453750176355e-05, -8.226470527006313e-05, -6.76048657624051e-05, -5.294503353070468e-05, -3.828520129900426e-05, -2.3625361791346222e-05, -8.965522283688188e-06, 5.694312676496338e-06, 2.0354147636680864e-05, 3.501398168737069e-05, 4.9673817557049915e-05, 6.433365342672914e-05, 7.899348565842956e-05, 9.36533251660876e-05, 0.00010831315739778802, 0.00012297299690544605, 0.00013763282913714647, 0.0001522926613688469, 0.00016695249360054731, 0.00018161232583224773, 0.00019627215806394815, 0.0002109320048475638, 0.00022559183707926422, 0.00024025166931096464, 0.0002549115160945803, 0.0002695713483262807, 0.00028423118055798113, 0.00029889101278968155, 0.000313550845021382, 0.0003282106772530824, 0.0003428705094847828, 0.00035753034171648324, 0.00037219017394818366, 0.0003868500061798841, 0.0004015098384115845, 0.0004161696997471154, 0.0004308295319788158, 0.0004454893642105162, 0.00046014919644221663]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 15.0, 17.0, 13.0, 16.0, 30.0, 27.0, 30.0, 27.0, 47.0, 46.0, 46.0, 42.0, 31.0, 41.0, 37.0, 45.0, 34.0, 43.0, 30.0, 34.0, 36.0, 24.0, 31.0, 23.0, 25.0, 35.0, 18.0, 20.0, 16.0, 21.0, 12.0, 13.0, 8.0, 6.0, 3.0, 9.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0001575946807861328, -0.00015260186046361923, -0.00014760904014110565, -0.00014261621981859207, -0.0001376233994960785, -0.0001326305791735649, -0.00012763775885105133, -0.00012264493852853775, -0.00011765211820602417, -0.00011265929788351059, -0.00010766647756099701, -0.00010267365723848343, -9.768083691596985e-05, -9.268801659345627e-05, -8.769519627094269e-05, -8.270237594842911e-05, -7.770955562591553e-05, -7.271673530340195e-05, -6.772391498088837e-05, -6.273109465837479e-05, -5.7738274335861206e-05, -5.2745454013347626e-05, -4.7752633690834045e-05, -4.2759813368320465e-05, -3.7766993045806885e-05, -3.2774172723293304e-05, -2.7781352400779724e-05, -2.2788532078266144e-05, -1.7795711755752563e-05, -1.2802891433238983e-05, -7.810071110725403e-06, -2.8172507882118225e-06, 2.175569534301758e-06, 7.168389856815338e-06, 1.2161210179328918e-05, 1.71540305018425e-05, 2.214685082435608e-05, 2.713967114686966e-05, 3.213249146938324e-05, 3.712531179189682e-05, 4.21181321144104e-05, 4.711095243692398e-05, 5.210377275943756e-05, 5.709659308195114e-05, 6.208941340446472e-05, 6.70822337269783e-05, 7.207505404949188e-05, 7.706787437200546e-05, 8.206069469451904e-05, 8.705351501703262e-05, 9.20463353395462e-05, 9.703915566205978e-05, 0.00010203197598457336, 0.00010702479630708694, 0.00011201761662960052, 0.0001170104369521141, 0.00012200325727462769, 0.00012699607759714127, 0.00013198889791965485, 0.00013698171824216843, 0.000141974538564682, 0.0001469673588871956, 0.00015196017920970917, 0.00015695299953222275, 0.00016194581985473633]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 9.0, 3.0, 7.0, 17.0, 12.0, 12.0, 16.0, 36.0, 32.0, 58.0, 112.0, 177.0, 250.0, 383.0, 610.0, 849.0, 1324.0, 2235.0, 3640.0, 6169.0, 10949.0, 21062.0, 45139.0, 125338.0, 3167874.0, 658249.0, 79485.0, 32594.0, 15999.0, 8455.0, 4638.0, 2845.0, 1734.0, 1136.0, 751.0, 519.0, 361.0, 276.0, 218.0, 199.0, 128.0, 94.0, 76.0, 43.0, 44.0, 32.0, 14.0, 15.0, 17.0, 22.0, 8.0, 9.0, 4.0, 7.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0001227855682373047, -0.00011880509555339813, -0.00011482462286949158, -0.00011084415018558502, -0.00010686367750167847, -0.00010288320481777191, -9.890273213386536e-05, -9.49222594499588e-05, -9.094178676605225e-05, -8.696131408214569e-05, -8.298084139823914e-05, -7.900036871433258e-05, -7.501989603042603e-05, -7.103942334651947e-05, -6.705895066261292e-05, -6.307847797870636e-05, -5.9098005294799805e-05, -5.511753261089325e-05, -5.1137059926986694e-05, -4.715658724308014e-05, -4.3176114559173584e-05, -3.919564187526703e-05, -3.5215169191360474e-05, -3.123469650745392e-05, -2.7254223823547363e-05, -2.3273751139640808e-05, -1.9293278455734253e-05, -1.5312805771827698e-05, -1.1332333087921143e-05, -7.351860404014587e-06, -3.3713877201080322e-06, 6.09084963798523e-07, 4.589557647705078e-06, 8.570030331611633e-06, 1.2550503015518188e-05, 1.6530975699424744e-05, 2.05114483833313e-05, 2.4491921067237854e-05, 2.847239375114441e-05, 3.2452866435050964e-05, 3.643333911895752e-05, 4.0413811802864075e-05, 4.439428448677063e-05, 4.8374757170677185e-05, 5.235522985458374e-05, 5.6335702538490295e-05, 6.031617522239685e-05, 6.42966479063034e-05, 6.827712059020996e-05, 7.225759327411652e-05, 7.623806595802307e-05, 8.021853864192963e-05, 8.419901132583618e-05, 8.817948400974274e-05, 9.215995669364929e-05, 9.614042937755585e-05, 0.0001001209020614624, 0.00010410137474536896, 0.00010808184742927551, 0.00011206232011318207, 0.00011604279279708862, 0.00012002326548099518, 0.00012400373816490173, 0.0001279842108488083, 0.00013196468353271484]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 9.0, 4.0, 3.0, 8.0, 14.0, 15.0, 26.0, 34.0, 43.0, 53.0, 63.0, 87.0, 108.0, 115.0, 93.0, 82.0, 58.0, 41.0, 33.0, 34.0, 19.0, 17.0, 10.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9325485229492188e-05, -2.8392300009727478e-05, -2.745911478996277e-05, -2.652592957019806e-05, -2.559274435043335e-05, -2.465955913066864e-05, -2.372637391090393e-05, -2.279318869113922e-05, -2.1860003471374512e-05, -2.0926818251609802e-05, -1.9993633031845093e-05, -1.9060447812080383e-05, -1.8127262592315674e-05, -1.7194077372550964e-05, -1.6260892152786255e-05, -1.5327706933021545e-05, -1.4394521713256836e-05, -1.3461336493492126e-05, -1.2528151273727417e-05, -1.1594966053962708e-05, -1.0661780834197998e-05, -9.728595614433289e-06, -8.795410394668579e-06, -7.86222517490387e-06, -6.92903995513916e-06, -5.995854735374451e-06, -5.062669515609741e-06, -4.129484295845032e-06, -3.1962990760803223e-06, -2.263113856315613e-06, -1.3299286365509033e-06, -3.9674341678619385e-07, 5.364418029785156e-07, 1.469627022743225e-06, 2.4028122425079346e-06, 3.335997462272644e-06, 4.2691826820373535e-06, 5.202367901802063e-06, 6.1355531215667725e-06, 7.068738341331482e-06, 8.001923561096191e-06, 8.935108780860901e-06, 9.86829400062561e-06, 1.080147922039032e-05, 1.173466444015503e-05, 1.2667849659919739e-05, 1.3601034879684448e-05, 1.4534220099449158e-05, 1.5467405319213867e-05, 1.6400590538978577e-05, 1.7333775758743286e-05, 1.8266960978507996e-05, 1.9200146198272705e-05, 2.0133331418037415e-05, 2.1066516637802124e-05, 2.1999701857566833e-05, 2.2932887077331543e-05, 2.3866072297096252e-05, 2.4799257516860962e-05, 2.573244273662567e-05, 2.666562795639038e-05, 2.759881317615509e-05, 2.85319983959198e-05, 2.946518361568451e-05, 3.039836883544922e-05]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 6.0, 6.0, 25.0, 23.0, 36.0, 43.0, 63.0, 88.0, 136.0, 209.0, 395.0, 538.0, 871.0, 1316.0, 2067.0, 3469.0, 5762.0, 9553.0, 16731.0, 31228.0, 57847.0, 119991.0, 348983.0, 2877448.0, 440325.0, 135034.0, 63196.0, 33332.0, 18775.0, 10479.0, 6210.0, 3767.0, 2268.0, 1471.0, 904.0, 522.0, 400.0, 250.0, 163.0, 115.0, 88.0, 39.0, 35.0, 20.0, 17.0, 16.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.794929504394531e-05, -6.579700857400894e-05, -6.364472210407257e-05, -6.14924356341362e-05, -5.934014916419983e-05, -5.718786269426346e-05, -5.503557622432709e-05, -5.2883289754390717e-05, -5.0731003284454346e-05, -4.8578716814517975e-05, -4.6426430344581604e-05, -4.427414387464523e-05, -4.212185740470886e-05, -3.996957093477249e-05, -3.781728446483612e-05, -3.566499799489975e-05, -3.351271152496338e-05, -3.136042505502701e-05, -2.9208138585090637e-05, -2.7055852115154266e-05, -2.4903565645217896e-05, -2.2751279175281525e-05, -2.0598992705345154e-05, -1.8446706235408783e-05, -1.6294419765472412e-05, -1.4142133295536041e-05, -1.198984682559967e-05, -9.8375603556633e-06, -7.685273885726929e-06, -5.532987415790558e-06, -3.380700945854187e-06, -1.2284144759178162e-06, 9.238719940185547e-07, 3.0761584639549255e-06, 5.228444933891296e-06, 7.380731403827667e-06, 9.533017873764038e-06, 1.1685304343700409e-05, 1.383759081363678e-05, 1.598987728357315e-05, 1.814216375350952e-05, 2.0294450223445892e-05, 2.2446736693382263e-05, 2.4599023163318634e-05, 2.6751309633255005e-05, 2.8903596103191376e-05, 3.1055882573127747e-05, 3.320816904306412e-05, 3.536045551300049e-05, 3.751274198293686e-05, 3.966502845287323e-05, 4.18173149228096e-05, 4.396960139274597e-05, 4.612188786268234e-05, 4.827417433261871e-05, 5.0426460802555084e-05, 5.2578747272491455e-05, 5.4731033742427826e-05, 5.68833202123642e-05, 5.903560668230057e-05, 6.118789315223694e-05, 6.334017962217331e-05, 6.549246609210968e-05, 6.764475256204605e-05, 6.979703903198242e-05]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 10.0, 12.0, 16.0, 15.0, 24.0, 20.0, 44.0, 42.0, 45.0, 77.0, 79.0, 89.0, 147.0, 217.0, 652.0, 1162.0, 544.0, 210.0, 98.0, 87.0, 84.0, 63.0, 72.0, 46.0, 39.0, 40.0, 21.0, 29.0, 20.0, 15.0, 13.0, 12.0, 5.0, 5.0, 3.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.340576171875e-05, -5.1530078053474426e-05, -4.965439438819885e-05, -4.777871072292328e-05, -4.5903027057647705e-05, -4.402734339237213e-05, -4.215165972709656e-05, -4.0275976061820984e-05, -3.840029239654541e-05, -3.6524608731269836e-05, -3.464892506599426e-05, -3.277324140071869e-05, -3.0897557735443115e-05, -2.902187407016754e-05, -2.7146190404891968e-05, -2.5270506739616394e-05, -2.339482307434082e-05, -2.1519139409065247e-05, -1.9643455743789673e-05, -1.77677720785141e-05, -1.5892088413238525e-05, -1.4016404747962952e-05, -1.2140721082687378e-05, -1.0265037417411804e-05, -8.38935375213623e-06, -6.513670086860657e-06, -4.637986421585083e-06, -2.7623027563095093e-06, -8.866190910339355e-07, 9.890645742416382e-07, 2.864748239517212e-06, 4.740431904792786e-06, 6.616115570068359e-06, 8.491799235343933e-06, 1.0367482900619507e-05, 1.224316656589508e-05, 1.4118850231170654e-05, 1.5994533896446228e-05, 1.7870217561721802e-05, 1.9745901226997375e-05, 2.162158489227295e-05, 2.3497268557548523e-05, 2.5372952222824097e-05, 2.724863588809967e-05, 2.9124319553375244e-05, 3.100000321865082e-05, 3.287568688392639e-05, 3.4751370549201965e-05, 3.662705421447754e-05, 3.850273787975311e-05, 4.0378421545028687e-05, 4.225410521030426e-05, 4.4129788875579834e-05, 4.600547254085541e-05, 4.788115620613098e-05, 4.9756839871406555e-05, 5.163252353668213e-05, 5.35082072019577e-05, 5.5383890867233276e-05, 5.725957453250885e-05, 5.9135258197784424e-05, 6.101094186306e-05, 6.288662552833557e-05, 6.476230919361115e-05, 6.663799285888672e-05]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 42.0, 74.0, 136.0, 229.0, 181.0, 112.0, 73.0, 50.0, 25.0, 23.0, 13.0, 17.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00046351822675205767, -0.0004386507789604366, -0.0004137833311688155, -0.0003889158833771944, -0.00036404840648174286, -0.00033918095869012177, -0.0003143135108985007, -0.00028944603400304914, -0.0002645786153152585, -0.00023971116752363741, -0.0002148437051801011, -0.00018997625738848, -0.0001651087950449437, -0.0001402413472533226, -0.00011537389946170151, -9.05064371181652e-05, -6.563897477462888e-05, -4.0771519707050174e-05, -1.590406827745028e-05, 8.963383152149618e-06, 3.383083821972832e-05, 5.8698293287307024e-05, 8.356574107892811e-05, 0.00010843320342246443, 0.00013330065121408552, 0.0001581680990057066, 0.00018303556134924293, 0.00020790300914086401, 0.0002327704569324851, 0.00025763793382793665, 0.0002825053525157273, 0.00030737282941117883, 0.0003322403063066304, 0.00035710775409825146, 0.00038197520188987255, 0.0004068426787853241, 0.0004317101265769452, 0.0004565775743685663, 0.00048144502216018736, 0.0005063124699518085, 0.00053117994684726, 0.0005560474237427115, 0.0005809148424305022, 0.0006057823193259537, 0.0006306497380137444, 0.0006555172149091959, 0.0006803846918046474, 0.0007052521104924381, 0.0007301195291802287, 0.0007549870060756803, 0.0007798544247634709, 0.0008047219016589224, 0.0008295893203467131, 0.0008544567972421646, 0.0008793242741376162, 0.0009041916928254068, 0.0009290591697208583, 0.0009539266466163099, 0.0009787940653041005, 0.001003661542199552, 0.0010285290190950036, 0.0010533963795751333, 0.0010782638564705849, 0.0011031313333660364, 0.001127998810261488]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 10.0, 7.0, 15.0, 8.0, 12.0, 12.0, 14.0, 22.0, 29.0, 25.0, 19.0, 21.0, 27.0, 31.0, 44.0, 33.0, 35.0, 35.0, 35.0, 37.0, 42.0, 48.0, 28.0, 42.0, 40.0, 26.0, 39.0, 24.0, 29.0, 25.0, 23.0, 25.0, 22.0, 17.0, 16.0, 10.0, 8.0, 13.0, 13.0, 9.0, 5.0, 2.0, 3.0, 7.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00022464990615844727, -0.0002176305279135704, -0.00021061114966869354, -0.00020359177142381668, -0.00019657239317893982, -0.00018955301493406296, -0.0001825336366891861, -0.00017551425844430923, -0.00016849488019943237, -0.0001614755019545555, -0.00015445612370967865, -0.0001474367454648018, -0.00014041736721992493, -0.00013339798897504807, -0.0001263786107301712, -0.00011935923248529434, -0.00011233985424041748, -0.00010532047599554062, -9.830109775066376e-05, -9.12817195057869e-05, -8.426234126091003e-05, -7.724296301603317e-05, -7.022358477115631e-05, -6.320420652627945e-05, -5.618482828140259e-05, -4.9165450036525726e-05, -4.2146071791648865e-05, -3.5126693546772e-05, -2.810731530189514e-05, -2.108793705701828e-05, -1.4068558812141418e-05, -7.049180567264557e-06, -2.9802322387695312e-08, 6.989575922489166e-06, 1.4008954167366028e-05, 2.102833241224289e-05, 2.804771065711975e-05, 3.506708890199661e-05, 4.2086467146873474e-05, 4.9105845391750336e-05, 5.61252236366272e-05, 6.314460188150406e-05, 7.016398012638092e-05, 7.718335837125778e-05, 8.420273661613464e-05, 9.12221148610115e-05, 9.824149310588837e-05, 0.00010526087135076523, 0.00011228024959564209, 0.00011929962784051895, 0.0001263190060853958, 0.00013333838433027267, 0.00014035776257514954, 0.0001473771408200264, 0.00015439651906490326, 0.00016141589730978012, 0.00016843527555465698, 0.00017545465379953384, 0.0001824740320444107, 0.00018949341028928757, 0.00019651278853416443, 0.0002035321667790413, 0.00021055154502391815, 0.000217570923268795, 0.00022459030151367188]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 0.0, 4.0, 0.0, 3.0, 12.0, 7.0, 15.0, 12.0, 18.0, 12.0, 18.0, 23.0, 23.0, 46.0, 70.0, 86.0, 133.0, 192.0, 317.0, 500.0, 794.0, 1333.0, 2443.0, 4729.0, 9836.0, 23318.0, 67112.0, 315768.0, 493622.0, 78586.0, 26870.0, 10903.0, 5156.0, 2696.0, 1449.0, 852.0, 517.0, 352.0, 216.0, 142.0, 94.0, 68.0, 50.0, 39.0, 25.0, 23.0, 15.0, 12.0, 13.0, 10.0, 8.0, 3.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0001710653305053711, -0.00016573071479797363, -0.00016039609909057617, -0.0001550614833831787, -0.00014972686767578125, -0.0001443922519683838, -0.00013905763626098633, -0.00013372302055358887, -0.0001283884048461914, -0.00012305378913879395, -0.00011771917343139648, -0.00011238455772399902, -0.00010704994201660156, -0.0001017153263092041, -9.638071060180664e-05, -9.104609489440918e-05, -8.571147918701172e-05, -8.037686347961426e-05, -7.50422477722168e-05, -6.970763206481934e-05, -6.437301635742188e-05, -5.9038400650024414e-05, -5.370378494262695e-05, -4.836916923522949e-05, -4.303455352783203e-05, -3.769993782043457e-05, -3.236532211303711e-05, -2.703070640563965e-05, -2.1696090698242188e-05, -1.6361474990844727e-05, -1.1026859283447266e-05, -5.692243576049805e-06, -3.5762786865234375e-07, 4.976987838745117e-06, 1.0311603546142578e-05, 1.564621925354004e-05, 2.09808349609375e-05, 2.631545066833496e-05, 3.165006637573242e-05, 3.698468208312988e-05, 4.2319297790527344e-05, 4.7653913497924805e-05, 5.2988529205322266e-05, 5.8323144912719727e-05, 6.365776062011719e-05, 6.899237632751465e-05, 7.432699203491211e-05, 7.966160774230957e-05, 8.499622344970703e-05, 9.033083915710449e-05, 9.566545486450195e-05, 0.00010100007057189941, 0.00010633468627929688, 0.00011166930198669434, 0.0001170039176940918, 0.00012233853340148926, 0.00012767314910888672, 0.00013300776481628418, 0.00013834238052368164, 0.0001436769962310791, 0.00014901161193847656, 0.00015434622764587402, 0.00015968084335327148, 0.00016501545906066895, 0.0001703500747680664]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 1.0, 4.0, 9.0, 6.0, 8.0, 9.0, 17.0, 22.0, 32.0, 40.0, 50.0, 76.0, 93.0, 94.0, 124.0, 95.0, 78.0, 55.0, 51.0, 40.0, 29.0, 15.0, 17.0, 10.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9490718841552734e-05, -1.857709139585495e-05, -1.7663463950157166e-05, -1.674983650445938e-05, -1.5836209058761597e-05, -1.4922581613063812e-05, -1.4008954167366028e-05, -1.3095326721668243e-05, -1.2181699275970459e-05, -1.1268071830272675e-05, -1.035444438457489e-05, -9.440816938877106e-06, -8.527189493179321e-06, -7.613562047481537e-06, -6.6999346017837524e-06, -5.786307156085968e-06, -4.872679710388184e-06, -3.959052264690399e-06, -3.0454248189926147e-06, -2.1317973732948303e-06, -1.218169927597046e-06, -3.045424818992615e-07, 6.09084963798523e-07, 1.5227124094963074e-06, 2.436339855194092e-06, 3.3499673008918762e-06, 4.263594746589661e-06, 5.177222192287445e-06, 6.0908496379852295e-06, 7.004477083683014e-06, 7.918104529380798e-06, 8.831731975078583e-06, 9.745359420776367e-06, 1.0658986866474152e-05, 1.1572614312171936e-05, 1.248624175786972e-05, 1.3399869203567505e-05, 1.431349664926529e-05, 1.5227124094963074e-05, 1.6140751540660858e-05, 1.7054378986358643e-05, 1.7968006432056427e-05, 1.888163387775421e-05, 1.9795261323451996e-05, 2.070888876914978e-05, 2.1622516214847565e-05, 2.253614366054535e-05, 2.3449771106243134e-05, 2.4363398551940918e-05, 2.5277025997638702e-05, 2.6190653443336487e-05, 2.710428088903427e-05, 2.8017908334732056e-05, 2.893153578042984e-05, 2.9845163226127625e-05, 3.075879067182541e-05, 3.167241811752319e-05, 3.258604556322098e-05, 3.349967300891876e-05, 3.441330045461655e-05, 3.532692790031433e-05, 3.6240555346012115e-05, 3.71541827917099e-05, 3.8067810237407684e-05, 3.898143768310547e-05]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 11.0, 21.0, 32.0, 37.0, 67.0, 91.0, 117.0, 186.0, 286.0, 470.0, 677.0, 992.0, 1499.0, 2343.0, 3496.0, 5423.0, 8622.0, 12981.0, 20179.0, 32822.0, 51765.0, 90022.0, 184506.0, 334300.0, 120825.0, 66111.0, 40831.0, 24308.0, 15587.0, 10480.0, 6673.0, 4312.0, 2950.0, 1848.0, 1242.0, 840.0, 511.0, 354.0, 250.0, 155.0, 112.0, 64.0, 53.0, 33.0, 22.0, 15.0, 11.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.823373794555664e-05, -5.642697215080261e-05, -5.4620206356048584e-05, -5.2813440561294556e-05, -5.100667476654053e-05, -4.91999089717865e-05, -4.739314317703247e-05, -4.558637738227844e-05, -4.3779611587524414e-05, -4.1972845792770386e-05, -4.016607999801636e-05, -3.835931420326233e-05, -3.65525484085083e-05, -3.474578261375427e-05, -3.2939016819000244e-05, -3.1132251024246216e-05, -2.9325485229492188e-05, -2.751871943473816e-05, -2.571195363998413e-05, -2.3905187845230103e-05, -2.2098422050476074e-05, -2.0291656255722046e-05, -1.8484890460968018e-05, -1.667812466621399e-05, -1.4871358871459961e-05, -1.3064593076705933e-05, -1.1257827281951904e-05, -9.451061487197876e-06, -7.644295692443848e-06, -5.837529897689819e-06, -4.030764102935791e-06, -2.2239983081817627e-06, -4.172325134277344e-07, 1.389533281326294e-06, 3.1962990760803223e-06, 5.003064870834351e-06, 6.809830665588379e-06, 8.616596460342407e-06, 1.0423362255096436e-05, 1.2230128049850464e-05, 1.4036893844604492e-05, 1.584365963935852e-05, 1.765042543411255e-05, 1.9457191228866577e-05, 2.1263957023620605e-05, 2.3070722818374634e-05, 2.4877488613128662e-05, 2.668425440788269e-05, 2.849102020263672e-05, 3.0297785997390747e-05, 3.2104551792144775e-05, 3.3911317586898804e-05, 3.571808338165283e-05, 3.752484917640686e-05, 3.933161497116089e-05, 4.113838076591492e-05, 4.2945146560668945e-05, 4.4751912355422974e-05, 4.6558678150177e-05, 4.836544394493103e-05, 5.017220973968506e-05, 5.197897553443909e-05, 5.3785741329193115e-05, 5.5592507123947144e-05, 5.739927291870117e-05]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 6.0, 8.0, 13.0, 6.0, 11.0, 13.0, 21.0, 13.0, 24.0, 28.0, 34.0, 24.0, 28.0, 43.0, 36.0, 55.0, 38.0, 38.0, 42.0, 58.0, 31.0, 35.0, 42.0, 41.0, 42.0, 28.0, 28.0, 30.0, 20.0, 27.0, 36.0, 24.0, 22.0, 8.0, 15.0, 9.0, 5.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.048513412475586e-05, -4.889722913503647e-05, -4.730932414531708e-05, -4.572141915559769e-05, -4.4133514165878296e-05, -4.2545609176158905e-05, -4.0957704186439514e-05, -3.936979919672012e-05, -3.778189420700073e-05, -3.619398921728134e-05, -3.460608422756195e-05, -3.301817923784256e-05, -3.143027424812317e-05, -2.9842369258403778e-05, -2.8254464268684387e-05, -2.6666559278964996e-05, -2.5078654289245605e-05, -2.3490749299526215e-05, -2.1902844309806824e-05, -2.0314939320087433e-05, -1.8727034330368042e-05, -1.713912934064865e-05, -1.555122435092926e-05, -1.396331936120987e-05, -1.2375414371490479e-05, -1.0787509381771088e-05, -9.199604392051697e-06, -7.611699402332306e-06, -6.023794412612915e-06, -4.435889422893524e-06, -2.8479844331741333e-06, -1.2600794434547424e-06, 3.2782554626464844e-07, 1.9157305359840393e-06, 3.50363552570343e-06, 5.091540515422821e-06, 6.679445505142212e-06, 8.267350494861603e-06, 9.855255484580994e-06, 1.1443160474300385e-05, 1.3031065464019775e-05, 1.4618970453739166e-05, 1.6206875443458557e-05, 1.7794780433177948e-05, 1.938268542289734e-05, 2.097059041261673e-05, 2.255849540233612e-05, 2.414640039205551e-05, 2.5734305381774902e-05, 2.7322210371494293e-05, 2.8910115361213684e-05, 3.0498020350933075e-05, 3.2085925340652466e-05, 3.367383033037186e-05, 3.526173532009125e-05, 3.684964030981064e-05, 3.843754529953003e-05, 4.002545028924942e-05, 4.161335527896881e-05, 4.32012602686882e-05, 4.478916525840759e-05, 4.6377070248126984e-05, 4.7964975237846375e-05, 4.9552880227565765e-05, 5.1140785217285156e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 12.0, 15.0, 25.0, 39.0, 59.0, 92.0, 75.0, 195.0, 315.0, 538.0, 923.0, 1472.0, 1618.0, 3938.0, 7333.0, 14850.0, 33620.0, 47019.0, 180926.0, 462515.0, 180659.0, 61791.0, 18905.0, 14844.0, 7466.0, 3947.0, 2186.0, 1257.0, 527.0, 530.0, 295.0, 182.0, 148.0, 67.0, 66.0, 34.0, 24.0, 10.0, 6.0, 13.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.600733518600464e-06, -4.433095455169678e-06, -4.265457391738892e-06, -4.0978193283081055e-06, -3.930181264877319e-06, -3.762543201446533e-06, -3.594905138015747e-06, -3.427267074584961e-06, -3.259629011154175e-06, -3.0919909477233887e-06, -2.9243528842926025e-06, -2.7567148208618164e-06, -2.5890767574310303e-06, -2.421438694000244e-06, -2.253800630569458e-06, -2.086162567138672e-06, -1.9185245037078857e-06, -1.7508864402770996e-06, -1.5832483768463135e-06, -1.4156103134155273e-06, -1.2479722499847412e-06, -1.080334186553955e-06, -9.126961231231689e-07, -7.450580596923828e-07, -5.774199962615967e-07, -4.0978193283081055e-07, -2.421438694000244e-07, -7.450580596923828e-08, 9.313225746154785e-08, 2.60770320892334e-07, 4.284083843231201e-07, 5.960464477539062e-07, 7.636845111846924e-07, 9.313225746154785e-07, 1.0989606380462646e-06, 1.2665987014770508e-06, 1.434236764907837e-06, 1.601874828338623e-06, 1.7695128917694092e-06, 1.9371509552001953e-06, 2.1047890186309814e-06, 2.2724270820617676e-06, 2.4400651454925537e-06, 2.60770320892334e-06, 2.775341272354126e-06, 2.942979335784912e-06, 3.1106173992156982e-06, 3.2782554626464844e-06, 3.4458935260772705e-06, 3.6135315895080566e-06, 3.7811696529388428e-06, 3.948807716369629e-06, 4.116445779800415e-06, 4.284083843231201e-06, 4.451721906661987e-06, 4.6193599700927734e-06, 4.7869980335235596e-06, 4.954636096954346e-06, 5.122274160385132e-06, 5.289912223815918e-06, 5.457550287246704e-06, 5.62518835067749e-06, 5.792826414108276e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 8.0, 3.0, 17.0, 11.0, 9.0, 21.0, 12.0, 25.0, 49.0, 42.0, 29.0, 93.0, 42.0, 57.0, 128.0, 64.0, 57.0, 86.0, 32.0, 41.0, 50.0, 24.0, 21.0, 19.0, 13.0, 8.0, 17.0, 3.0, 4.0, 11.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.6030465960502625e-06, -2.5238841772079468e-06, -2.444721758365631e-06, -2.3655593395233154e-06, -2.2863969206809998e-06, -2.207234501838684e-06, -2.1280720829963684e-06, -2.0489096641540527e-06, -1.969747245311737e-06, -1.8905848264694214e-06, -1.8114224076271057e-06, -1.73225998878479e-06, -1.6530975699424744e-06, -1.5739351511001587e-06, -1.494772732257843e-06, -1.4156103134155273e-06, -1.3364478945732117e-06, -1.257285475730896e-06, -1.1781230568885803e-06, -1.0989606380462646e-06, -1.019798219203949e-06, -9.406358003616333e-07, -8.614733815193176e-07, -7.82310962677002e-07, -7.031485438346863e-07, -6.239861249923706e-07, -5.448237061500549e-07, -4.6566128730773926e-07, -3.864988684654236e-07, -3.073364496231079e-07, -2.2817403078079224e-07, -1.4901161193847656e-07, -6.984919309616089e-08, 9.313225746154785e-09, 8.847564458847046e-08, 1.6763806343078613e-07, 2.468004822731018e-07, 3.259629011154175e-07, 4.0512531995773315e-07, 4.842877388000488e-07, 5.634501576423645e-07, 6.426125764846802e-07, 7.217749953269958e-07, 8.009374141693115e-07, 8.800998330116272e-07, 9.592622518539429e-07, 1.0384246706962585e-06, 1.1175870895385742e-06, 1.1967495083808899e-06, 1.2759119272232056e-06, 1.3550743460655212e-06, 1.434236764907837e-06, 1.5133991837501526e-06, 1.5925616025924683e-06, 1.671724021434784e-06, 1.7508864402770996e-06, 1.8300488591194153e-06, 1.909211277961731e-06, 1.9883736968040466e-06, 2.0675361156463623e-06, 2.146698534488678e-06, 2.2258609533309937e-06, 2.3050233721733093e-06, 2.384185791015625e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 13.0, 9.0, 9.0, 30.0, 22.0, 48.0, 97.0, 58.0, 148.0, 112.0, 290.0, 455.0, 317.0, 889.0, 1340.0, 936.0, 2654.0, 1933.0, 5483.0, 9421.0, 7270.0, 23530.0, 49685.0, 46614.0, 237056.0, 272341.0, 236580.0, 76390.0, 19846.0, 23688.0, 12395.0, 4018.0, 5436.0, 1906.0, 2676.0, 1722.0, 598.0, 895.0, 581.0, 192.0, 302.0, 107.0, 156.0, 103.0, 42.0, 61.0, 39.0, 8.0, 25.0, 9.0, 9.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.039836883544922e-06, -2.942979335784912e-06, -2.8461217880249023e-06, -2.7492642402648926e-06, -2.652406692504883e-06, -2.555549144744873e-06, -2.4586915969848633e-06, -2.3618340492248535e-06, -2.2649765014648438e-06, -2.168118953704834e-06, -2.0712614059448242e-06, -1.9744038581848145e-06, -1.8775463104248047e-06, -1.780688762664795e-06, -1.6838312149047852e-06, -1.5869736671447754e-06, -1.4901161193847656e-06, -1.3932585716247559e-06, -1.296401023864746e-06, -1.1995434761047363e-06, -1.1026859283447266e-06, -1.0058283805847168e-06, -9.08970832824707e-07, -8.121132850646973e-07, -7.152557373046875e-07, -6.183981895446777e-07, -5.21540641784668e-07, -4.246830940246582e-07, -3.2782554626464844e-07, -2.3096799850463867e-07, -1.341104507446289e-07, -3.725290298461914e-08, 5.960464477539063e-08, 1.564621925354004e-07, 2.5331974029541016e-07, 3.501772880554199e-07, 4.470348358154297e-07, 5.438923835754395e-07, 6.407499313354492e-07, 7.37607479095459e-07, 8.344650268554688e-07, 9.313225746154785e-07, 1.0281801223754883e-06, 1.125037670135498e-06, 1.2218952178955078e-06, 1.3187527656555176e-06, 1.4156103134155273e-06, 1.5124678611755371e-06, 1.6093254089355469e-06, 1.7061829566955566e-06, 1.8030405044555664e-06, 1.8998980522155762e-06, 1.996755599975586e-06, 2.0936131477355957e-06, 2.1904706954956055e-06, 2.2873282432556152e-06, 2.384185791015625e-06, 2.4810433387756348e-06, 2.5779008865356445e-06, 2.6747584342956543e-06, 2.771615982055664e-06, 2.868473529815674e-06, 2.9653310775756836e-06, 3.0621886253356934e-06, 3.159046173095703e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 3.0, 6.0, 6.0, 5.0, 14.0, 7.0, 31.0, 15.0, 41.0, 38.0, 62.0, 35.0, 105.0, 41.0, 57.0, 98.0, 45.0, 77.0, 34.0, 52.0, 28.0, 48.0, 13.0, 29.0, 13.0, 9.0, 15.0, 10.0, 10.0, 6.0, 9.0, 2.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.7744099497795105e-06, -2.687796950340271e-06, -2.6011839509010315e-06, -2.514570951461792e-06, -2.4279579520225525e-06, -2.341344952583313e-06, -2.2547319531440735e-06, -2.168118953704834e-06, -2.0815059542655945e-06, -1.994892954826355e-06, -1.9082799553871155e-06, -1.821666955947876e-06, -1.7350539565086365e-06, -1.648440957069397e-06, -1.5618279576301575e-06, -1.475214958190918e-06, -1.3886019587516785e-06, -1.301988959312439e-06, -1.2153759598731995e-06, -1.12876296043396e-06, -1.0421499609947205e-06, -9.55536961555481e-07, -8.689239621162415e-07, -7.82310962677002e-07, -6.956979632377625e-07, -6.09084963798523e-07, -5.224719643592834e-07, -4.3585896492004395e-07, -3.4924596548080444e-07, -2.6263296604156494e-07, -1.7601996660232544e-07, -8.940696716308594e-08, -2.7939677238464355e-09, 8.381903171539307e-08, 1.7043203115463257e-07, 2.5704503059387207e-07, 3.4365803003311157e-07, 4.302710294723511e-07, 5.168840289115906e-07, 6.034970283508301e-07, 6.901100277900696e-07, 7.767230272293091e-07, 8.633360266685486e-07, 9.499490261077881e-07, 1.0365620255470276e-06, 1.123175024986267e-06, 1.2097880244255066e-06, 1.296401023864746e-06, 1.3830140233039856e-06, 1.469627022743225e-06, 1.5562400221824646e-06, 1.642853021621704e-06, 1.7294660210609436e-06, 1.816079020500183e-06, 1.9026920199394226e-06, 1.989305019378662e-06, 2.0759180188179016e-06, 2.162531018257141e-06, 2.2491440176963806e-06, 2.33575701713562e-06, 2.4223700165748596e-06, 2.508983016014099e-06, 2.5955960154533386e-06, 2.682209014892578e-06]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 8.0, 8.0, 7.0, 18.0, 23.0, 27.0, 46.0, 51.0, 85.0, 189.0, 166.0, 91.0, 73.0, 52.0, 24.0, 22.0, 14.0, 17.0, 7.0, 9.0, 12.0, 7.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00027030555065721273, -0.0002618401194922626, -0.000253374659223482, -0.0002449092280585319, -0.00023644379689358175, -0.0002279783511767164, -0.00021951290545985103, -0.0002110474742949009, -0.00020258204312995076, -0.0001941165974130854, -0.00018565116624813527, -0.0001771857205312699, -0.00016872028936631978, -0.00016025484364945441, -0.00015178939793258905, -0.00014332396676763892, -0.00013485852105077356, -0.0001263930753339082, -0.00011792764416895807, -0.00010946219845209271, -0.00010099676728714257, -9.253132157027721e-05, -8.406588312936947e-05, -7.560044468846172e-05, -6.713500624755397e-05, -5.866956780664623e-05, -5.020412936573848e-05, -4.173868728685193e-05, -3.327324884594418e-05, -2.4807810405036435e-05, -1.634236832614988e-05, -7.876929885242134e-06, 5.885085556656122e-07, 9.05394790606806e-06, 1.751938725647051e-05, 2.598482751636766e-05, 3.4450265957275406e-05, 4.291570439818315e-05, 5.1381146477069706e-05, 5.984658491797745e-05, 6.83120233588852e-05, 7.677746179979295e-05, 8.524290024070069e-05, 9.370833868160844e-05, 0.0001021737843984738, 0.00011063921556342393, 0.00011910466128028929, 0.00012757009244523942, 0.00013603553816210479, 0.00014450098387897015, 0.00015296641504392028, 0.00016143186076078564, 0.00016989729192573577, 0.00017836273764260113, 0.00018682816880755126, 0.00019529361452441663, 0.00020375906024128199, 0.00021222450595814735, 0.00022068993712309748, 0.00022915538283996284, 0.00023762081400491297, 0.0002460862451698631, 0.0002545517054386437, 0.0002630171366035938, 0.00027148256776854396]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 7.0, 6.0, 7.0, 4.0, 13.0, 19.0, 19.0, 27.0, 28.0, 22.0, 24.0, 27.0, 26.0, 38.0, 39.0, 45.0, 30.0, 37.0, 43.0, 43.0, 46.0, 47.0, 48.0, 40.0, 28.0, 31.0, 37.0, 35.0, 33.0, 23.0, 20.0, 26.0, 23.0, 14.0, 10.0, 3.0, 10.0, 4.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001538395881652832, -0.00014900416135787964, -0.00014416873455047607, -0.0001393333077430725, -0.00013449788093566895, -0.00012966245412826538, -0.00012482702732086182, -0.00011999160051345825, -0.00011515617370605469, -0.00011032074689865112, -0.00010548532009124756, -0.000100649893283844, -9.581446647644043e-05, -9.097903966903687e-05, -8.61436128616333e-05, -8.130818605422974e-05, -7.647275924682617e-05, -7.163733243942261e-05, -6.680190563201904e-05, -6.196647882461548e-05, -5.7131052017211914e-05, -5.229562520980835e-05, -4.7460198402404785e-05, -4.262477159500122e-05, -3.7789344787597656e-05, -3.295391798019409e-05, -2.8118491172790527e-05, -2.3283064365386963e-05, -1.84476375579834e-05, -1.3612210750579834e-05, -8.77678394317627e-06, -3.941357135772705e-06, 8.940696716308594e-07, 5.729496479034424e-06, 1.0564923286437988e-05, 1.5400350093841553e-05, 2.0235776901245117e-05, 2.507120370864868e-05, 2.9906630516052246e-05, 3.474205732345581e-05, 3.9577484130859375e-05, 4.441291093826294e-05, 4.9248337745666504e-05, 5.408376455307007e-05, 5.891919136047363e-05, 6.37546181678772e-05, 6.859004497528076e-05, 7.342547178268433e-05, 7.826089859008789e-05, 8.309632539749146e-05, 8.793175220489502e-05, 9.276717901229858e-05, 9.760260581970215e-05, 0.00010243803262710571, 0.00010727345943450928, 0.00011210888624191284, 0.0001169443130493164, 0.00012177973985671997, 0.00012661516666412354, 0.0001314505934715271, 0.00013628602027893066, 0.00014112144708633423, 0.0001459568738937378, 0.00015079230070114136, 0.00015562772750854492]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 8.0, 9.0, 15.0, 38.0, 69.0, 96.0, 190.0, 318.0, 563.0, 1053.0, 1952.0, 4047.0, 8683.0, 21448.0, 59952.0, 272743.0, 3633247.0, 125654.0, 36925.0, 14013.0, 6169.0, 2930.0, 1411.0, 820.0, 480.0, 362.0, 227.0, 145.0, 133.0, 103.0, 77.0, 49.0, 52.0, 48.0, 42.0, 39.0, 15.0, 25.0, 21.0, 16.0, 20.0, 14.0, 8.0, 10.0, 10.0, 7.0, 9.0, 8.0, 7.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00012242794036865234, -0.00011573918163776398, -0.00010905042290687561, -0.00010236166417598724, -9.567290544509888e-05, -8.898414671421051e-05, -8.229538798332214e-05, -7.560662925243378e-05, -6.891787052154541e-05, -6.222911179065704e-05, -5.554035305976868e-05, -4.885159432888031e-05, -4.216283559799194e-05, -3.547407686710358e-05, -2.878531813621521e-05, -2.2096559405326843e-05, -1.5407800674438477e-05, -8.71904194355011e-06, -2.030283212661743e-06, 4.6584755182266235e-06, 1.134723424911499e-05, 1.8035992980003357e-05, 2.4724751710891724e-05, 3.141351044178009e-05, 3.810226917266846e-05, 4.4791027903556824e-05, 5.147978663444519e-05, 5.816854536533356e-05, 6.485730409622192e-05, 7.154606282711029e-05, 7.823482155799866e-05, 8.492358028888702e-05, 9.161233901977539e-05, 9.830109775066376e-05, 0.00010498985648155212, 0.00011167861521244049, 0.00011836737394332886, 0.00012505613267421722, 0.0001317448914051056, 0.00013843365013599396, 0.00014512240886688232, 0.0001518111675977707, 0.00015849992632865906, 0.00016518868505954742, 0.0001718774437904358, 0.00017856620252132416, 0.00018525496125221252, 0.0001919437199831009, 0.00019863247871398926, 0.00020532123744487762, 0.000212009996175766, 0.00021869875490665436, 0.00022538751363754272, 0.0002320762723684311, 0.00023876503109931946, 0.0002454537898302078, 0.0002521425485610962, 0.00025883130729198456, 0.0002655200660228729, 0.0002722088247537613, 0.00027889758348464966, 0.000285586342215538, 0.0002922751009464264, 0.00029896385967731476, 0.0003056526184082031]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 7.0, 6.0, 5.0, 12.0, 17.0, 19.0, 41.0, 58.0, 63.0, 94.0, 141.0, 161.0, 120.0, 78.0, 59.0, 43.0, 29.0, 19.0, 15.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2351741790771484e-05, -2.112891525030136e-05, -1.9906088709831238e-05, -1.8683262169361115e-05, -1.746043562889099e-05, -1.6237609088420868e-05, -1.5014782547950745e-05, -1.3791956007480621e-05, -1.2569129467010498e-05, -1.1346302926540375e-05, -1.0123476386070251e-05, -8.900649845600128e-06, -7.677823305130005e-06, -6.454996764659882e-06, -5.232170224189758e-06, -4.009343683719635e-06, -2.7865171432495117e-06, -1.5636906027793884e-06, -3.4086406230926514e-07, 8.819624781608582e-07, 2.1047890186309814e-06, 3.3276155591011047e-06, 4.550442099571228e-06, 5.773268640041351e-06, 6.996095180511475e-06, 8.218921720981598e-06, 9.441748261451721e-06, 1.0664574801921844e-05, 1.1887401342391968e-05, 1.3110227882862091e-05, 1.4333054423332214e-05, 1.5555880963802338e-05, 1.677870750427246e-05, 1.8001534044742584e-05, 1.9224360585212708e-05, 2.044718712568283e-05, 2.1670013666152954e-05, 2.2892840206623077e-05, 2.41156667470932e-05, 2.5338493287563324e-05, 2.6561319828033447e-05, 2.778414636850357e-05, 2.9006972908973694e-05, 3.0229799449443817e-05, 3.145262598991394e-05, 3.2675452530384064e-05, 3.389827907085419e-05, 3.512110561132431e-05, 3.6343932151794434e-05, 3.756675869226456e-05, 3.878958523273468e-05, 4.0012411773204803e-05, 4.123523831367493e-05, 4.245806485414505e-05, 4.368089139461517e-05, 4.49037179350853e-05, 4.612654447555542e-05, 4.734937101602554e-05, 4.8572197556495667e-05, 4.979502409696579e-05, 5.101785063743591e-05, 5.2240677177906036e-05, 5.346350371837616e-05, 5.468633025884628e-05, 5.5909156799316406e-05]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 16.0, 9.0, 20.0, 26.0, 26.0, 59.0, 71.0, 139.0, 186.0, 337.0, 548.0, 955.0, 1590.0, 2816.0, 4829.0, 8565.0, 16591.0, 33721.0, 73233.0, 198739.0, 2430086.0, 1128484.0, 166175.0, 63656.0, 29537.0, 14966.0, 7938.0, 4621.0, 2686.0, 1441.0, 917.0, 463.0, 343.0, 199.0, 99.0, 73.0, 36.0, 23.0, 19.0, 7.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.28640365600586e-05, -8.995458483695984e-05, -8.704513311386108e-05, -8.413568139076233e-05, -8.122622966766357e-05, -7.831677794456482e-05, -7.540732622146606e-05, -7.249787449836731e-05, -6.958842277526855e-05, -6.66789710521698e-05, -6.376951932907104e-05, -6.086006760597229e-05, -5.7950615882873535e-05, -5.504116415977478e-05, -5.2131712436676025e-05, -4.922226071357727e-05, -4.6312808990478516e-05, -4.340335726737976e-05, -4.0493905544281006e-05, -3.758445382118225e-05, -3.4675002098083496e-05, -3.176555037498474e-05, -2.8856098651885986e-05, -2.594664692878723e-05, -2.3037195205688477e-05, -2.012774348258972e-05, -1.7218291759490967e-05, -1.4308840036392212e-05, -1.1399388313293457e-05, -8.489936590194702e-06, -5.580484867095947e-06, -2.6710331439971924e-06, 2.384185791015625e-07, 3.1478703022003174e-06, 6.057322025299072e-06, 8.966773748397827e-06, 1.1876225471496582e-05, 1.4785677194595337e-05, 1.7695128917694092e-05, 2.0604580640792847e-05, 2.35140323638916e-05, 2.6423484086990356e-05, 2.933293581008911e-05, 3.2242387533187866e-05, 3.515183925628662e-05, 3.8061290979385376e-05, 4.097074270248413e-05, 4.3880194425582886e-05, 4.678964614868164e-05, 4.9699097871780396e-05, 5.260854959487915e-05, 5.5518001317977905e-05, 5.842745304107666e-05, 6.133690476417542e-05, 6.424635648727417e-05, 6.715580821037292e-05, 7.006525993347168e-05, 7.297471165657043e-05, 7.588416337966919e-05, 7.879361510276794e-05, 8.17030668258667e-05, 8.461251854896545e-05, 8.752197027206421e-05, 9.043142199516296e-05, 9.334087371826172e-05]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 7.0, 10.0, 14.0, 20.0, 37.0, 39.0, 54.0, 85.0, 95.0, 138.0, 227.0, 652.0, 1393.0, 460.0, 202.0, 123.0, 98.0, 76.0, 57.0, 53.0, 45.0, 43.0, 30.0, 29.0, 16.0, 18.0, 12.0, 8.0, 6.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.612871170043945e-05, -8.375942707061768e-05, -8.13901424407959e-05, -7.902085781097412e-05, -7.665157318115234e-05, -7.428228855133057e-05, -7.191300392150879e-05, -6.954371929168701e-05, -6.717443466186523e-05, -6.480515003204346e-05, -6.243586540222168e-05, -6.00665807723999e-05, -5.7697296142578125e-05, -5.532801151275635e-05, -5.295872688293457e-05, -5.058944225311279e-05, -4.8220157623291016e-05, -4.585087299346924e-05, -4.348158836364746e-05, -4.1112303733825684e-05, -3.8743019104003906e-05, -3.637373447418213e-05, -3.400444984436035e-05, -3.1635165214538574e-05, -2.9265880584716797e-05, -2.689659595489502e-05, -2.4527311325073242e-05, -2.2158026695251465e-05, -1.9788742065429688e-05, -1.741945743560791e-05, -1.5050172805786133e-05, -1.2680888175964355e-05, -1.0311603546142578e-05, -7.9423189163208e-06, -5.5730342864990234e-06, -3.203749656677246e-06, -8.344650268554688e-07, 1.5348196029663086e-06, 3.904104232788086e-06, 6.273388862609863e-06, 8.64267349243164e-06, 1.1011958122253418e-05, 1.3381242752075195e-05, 1.5750527381896973e-05, 1.811981201171875e-05, 2.0489096641540527e-05, 2.2858381271362305e-05, 2.5227665901184082e-05, 2.759695053100586e-05, 2.9966235160827637e-05, 3.2335519790649414e-05, 3.470480442047119e-05, 3.707408905029297e-05, 3.9443373680114746e-05, 4.1812658309936523e-05, 4.41819429397583e-05, 4.655122756958008e-05, 4.8920512199401855e-05, 5.128979682922363e-05, 5.365908145904541e-05, 5.602836608886719e-05, 5.8397650718688965e-05, 6.076693534851074e-05, 6.313621997833252e-05, 6.55055046081543e-05]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 10.0, 13.0, 18.0, 18.0, 34.0, 57.0, 114.0, 128.0, 143.0, 106.0, 70.0, 64.0, 47.0, 38.0, 34.0, 27.0, 15.0, 14.0, 5.0, 4.0, 11.0, 4.0, 4.0, 5.0, 7.0, 5.0, 1.0, 1.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033581358729861677, -0.0003188868286088109, -0.00030196006991900504, -0.00028503331122919917, -0.0002681065525393933, -0.00025117979384958744, -0.0002342530497116968, -0.00021732629102189094, -0.00020039953233208507, -0.0001834727736422792, -0.00016654601495247334, -0.0001496192708145827, -0.00013269251212477684, -0.00011576574615901336, -9.883899474516511e-05, -8.191223605535924e-05, -6.498547736555338e-05, -4.8058718675747514e-05, -3.1131963623920456e-05, -1.4205208572093397e-05, 2.721550117712468e-06, 1.9648308807518333e-05, 3.6575060221366584e-05, 5.350181891117245e-05, 7.042857760097831e-05, 8.735533629078418e-05, 0.00010428209498059005, 0.0001212088463944383, 0.00013813559780828655, 0.0001550623564980924, 0.00017198911518789828, 0.00018891587387770414, 0.00020584260346367955, 0.00022276936215348542, 0.00023969612084329128, 0.00025662287953309715, 0.000273549638222903, 0.0002904763969127089, 0.00030740315560251474, 0.00032432988518849015, 0.0003412566729821265, 0.00035818343167193234, 0.0003751101903617382, 0.00039203694905154407, 0.00040896370774134994, 0.0004258904664311558, 0.00044281722512096167, 0.0004597439547069371, 0.00047667071339674294, 0.0004935974720865488, 0.0005105242016725242, 0.0005274509894661605, 0.0005443777190521359, 0.0005613045068457723, 0.0005782312364317477, 0.000595158024225384, 0.0006120847538113594, 0.0006290114833973348, 0.0006459382711909711, 0.0006628650007769465, 0.0006797917885705829, 0.0006967185181565583, 0.0007136453059501946, 0.00073057203553617, 0.0007474988233298063]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 8.0, 11.0, 12.0, 11.0, 18.0, 17.0, 19.0, 16.0, 22.0, 29.0, 22.0, 19.0, 24.0, 42.0, 27.0, 31.0, 31.0, 39.0, 48.0, 30.0, 36.0, 36.0, 41.0, 38.0, 25.0, 30.0, 23.0, 37.0, 28.0, 31.0, 25.0, 26.0, 18.0, 22.0, 15.0, 16.0, 12.0, 14.0, 2.0, 11.0, 2.0, 5.0, 2.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0002683401107788086, -0.0002605859190225601, -0.00025283172726631165, -0.00024507753551006317, -0.0002373233437538147, -0.00022956915199756622, -0.00022181496024131775, -0.00021406076848506927, -0.0002063065767288208, -0.00019855238497257233, -0.00019079819321632385, -0.00018304400146007538, -0.0001752898097038269, -0.00016753561794757843, -0.00015978142619132996, -0.00015202723443508148, -0.000144273042678833, -0.00013651885092258453, -0.00012876465916633606, -0.00012101046741008759, -0.00011325627565383911, -0.00010550208389759064, -9.774789214134216e-05, -8.999370038509369e-05, -8.223950862884521e-05, -7.448531687259674e-05, -6.673112511634827e-05, -5.897693336009979e-05, -5.122274160385132e-05, -4.3468549847602844e-05, -3.571435809135437e-05, -2.7960166335105896e-05, -2.0205974578857422e-05, -1.2451782822608948e-05, -4.697591066360474e-06, 3.0566006898880005e-06, 1.0810792446136475e-05, 1.856498420238495e-05, 2.6319175958633423e-05, 3.40733677148819e-05, 4.182755947113037e-05, 4.9581751227378845e-05, 5.733594298362732e-05, 6.50901347398758e-05, 7.284432649612427e-05, 8.059851825237274e-05, 8.835271000862122e-05, 9.610690176486969e-05, 0.00010386109352111816, 0.00011161528527736664, 0.00011936947703361511, 0.00012712366878986359, 0.00013487786054611206, 0.00014263205230236053, 0.000150386244058609, 0.00015814043581485748, 0.00016589462757110596, 0.00017364881932735443, 0.0001814030110836029, 0.00018915720283985138, 0.00019691139459609985, 0.00020466558635234833, 0.0002124197781085968, 0.00022017396986484528, 0.00022792816162109375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 10.0, 10.0, 22.0, 22.0, 37.0, 37.0, 89.0, 100.0, 149.0, 247.0, 362.0, 585.0, 908.0, 1532.0, 2656.0, 4989.0, 10061.0, 23035.0, 60348.0, 217041.0, 549411.0, 108542.0, 37324.0, 15298.0, 6937.0, 3541.0, 1993.0, 1149.0, 747.0, 436.0, 307.0, 203.0, 136.0, 80.0, 63.0, 38.0, 30.0, 18.0, 12.0, 13.0, 8.0, 9.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001569986343383789, -0.00015180930495262146, -0.00014661997556686401, -0.00014143064618110657, -0.00013624131679534912, -0.00013105198740959167, -0.00012586265802383423, -0.00012067332863807678, -0.00011548399925231934, -0.00011029466986656189, -0.00010510534048080444, -9.9916011095047e-05, -9.472668170928955e-05, -8.95373523235321e-05, -8.434802293777466e-05, -7.915869355201721e-05, -7.396936416625977e-05, -6.878003478050232e-05, -6.359070539474487e-05, -5.840137600898743e-05, -5.321204662322998e-05, -4.8022717237472534e-05, -4.283338785171509e-05, -3.764405846595764e-05, -3.2454729080200195e-05, -2.726539969444275e-05, -2.2076070308685303e-05, -1.6886740922927856e-05, -1.169741153717041e-05, -6.508082151412964e-06, -1.3187527656555176e-06, 3.870576620101929e-06, 9.059906005859375e-06, 1.4249235391616821e-05, 1.9438564777374268e-05, 2.4627894163131714e-05, 2.981722354888916e-05, 3.5006552934646606e-05, 4.019588232040405e-05, 4.53852117061615e-05, 5.0574541091918945e-05, 5.576387047767639e-05, 6.095319986343384e-05, 6.614252924919128e-05, 7.133185863494873e-05, 7.652118802070618e-05, 8.171051740646362e-05, 8.689984679222107e-05, 9.208917617797852e-05, 9.727850556373596e-05, 0.00010246783494949341, 0.00010765716433525085, 0.0001128464937210083, 0.00011803582310676575, 0.0001232251524925232, 0.00012841448187828064, 0.00013360381126403809, 0.00013879314064979553, 0.00014398247003555298, 0.00014917179942131042, 0.00015436112880706787, 0.00015955045819282532, 0.00016473978757858276, 0.0001699291169643402, 0.00017511844635009766]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 7.0, 8.0, 19.0, 26.0, 18.0, 41.0, 38.0, 62.0, 65.0, 88.0, 95.0, 94.0, 91.0, 76.0, 62.0, 50.0, 42.0, 32.0, 21.0, 17.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.199411392211914e-05, -2.1126121282577515e-05, -2.025812864303589e-05, -1.9390136003494263e-05, -1.8522143363952637e-05, -1.765415072441101e-05, -1.6786158084869385e-05, -1.591816544532776e-05, -1.5050172805786133e-05, -1.4182180166244507e-05, -1.3314187526702881e-05, -1.2446194887161255e-05, -1.1578202247619629e-05, -1.0710209608078003e-05, -9.842216968536377e-06, -8.974224328994751e-06, -8.106231689453125e-06, -7.238239049911499e-06, -6.370246410369873e-06, -5.502253770828247e-06, -4.634261131286621e-06, -3.766268491744995e-06, -2.898275852203369e-06, -2.030283212661743e-06, -1.1622905731201172e-06, -2.942979335784912e-07, 5.736947059631348e-07, 1.4416873455047607e-06, 2.3096799850463867e-06, 3.1776726245880127e-06, 4.045665264129639e-06, 4.913657903671265e-06, 5.781650543212891e-06, 6.649643182754517e-06, 7.517635822296143e-06, 8.385628461837769e-06, 9.253621101379395e-06, 1.012161374092102e-05, 1.0989606380462646e-05, 1.1857599020004272e-05, 1.2725591659545898e-05, 1.3593584299087524e-05, 1.446157693862915e-05, 1.5329569578170776e-05, 1.6197562217712402e-05, 1.706555485725403e-05, 1.7933547496795654e-05, 1.880154013633728e-05, 1.9669532775878906e-05, 2.0537525415420532e-05, 2.1405518054962158e-05, 2.2273510694503784e-05, 2.314150333404541e-05, 2.4009495973587036e-05, 2.4877488613128662e-05, 2.5745481252670288e-05, 2.6613473892211914e-05, 2.748146653175354e-05, 2.8349459171295166e-05, 2.9217451810836792e-05, 3.0085444450378418e-05, 3.0953437089920044e-05, 3.182142972946167e-05, 3.2689422369003296e-05, 3.355741500854492e-05]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 10.0, 17.0, 42.0, 62.0, 73.0, 109.0, 161.0, 228.0, 335.0, 440.0, 682.0, 928.0, 1424.0, 2117.0, 2946.0, 4153.0, 6391.0, 9587.0, 14368.0, 22282.0, 35132.0, 57311.0, 98941.0, 222802.0, 290217.0, 108363.0, 60762.0, 37478.0, 23992.0, 15536.0, 10217.0, 6954.0, 4545.0, 3069.0, 2071.0, 1524.0, 994.0, 717.0, 474.0, 356.0, 229.0, 140.0, 130.0, 69.0, 64.0, 37.0, 25.0, 15.0, 12.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.167722702026367e-05, -5.0066038966178894e-05, -4.8454850912094116e-05, -4.684366285800934e-05, -4.523247480392456e-05, -4.362128674983978e-05, -4.2010098695755005e-05, -4.039891064167023e-05, -3.878772258758545e-05, -3.717653453350067e-05, -3.5565346479415894e-05, -3.3954158425331116e-05, -3.234297037124634e-05, -3.073178231716156e-05, -2.9120594263076782e-05, -2.7509406208992004e-05, -2.5898218154907227e-05, -2.428703010082245e-05, -2.267584204673767e-05, -2.1064653992652893e-05, -1.9453465938568115e-05, -1.7842277884483337e-05, -1.623108983039856e-05, -1.4619901776313782e-05, -1.3008713722229004e-05, -1.1397525668144226e-05, -9.786337614059448e-06, -8.17514955997467e-06, -6.563961505889893e-06, -4.952773451805115e-06, -3.341585397720337e-06, -1.730397343635559e-06, -1.1920928955078125e-07, 1.4919787645339966e-06, 3.1031668186187744e-06, 4.714354872703552e-06, 6.32554292678833e-06, 7.936730980873108e-06, 9.547919034957886e-06, 1.1159107089042664e-05, 1.2770295143127441e-05, 1.438148319721222e-05, 1.5992671251296997e-05, 1.7603859305381775e-05, 1.9215047359466553e-05, 2.082623541355133e-05, 2.243742346763611e-05, 2.4048611521720886e-05, 2.5659799575805664e-05, 2.7270987629890442e-05, 2.888217568397522e-05, 3.0493363738059998e-05, 3.2104551792144775e-05, 3.371573984622955e-05, 3.532692790031433e-05, 3.693811595439911e-05, 3.854930400848389e-05, 4.0160492062568665e-05, 4.177168011665344e-05, 4.338286817073822e-05, 4.4994056224823e-05, 4.6605244278907776e-05, 4.8216432332992554e-05, 4.982762038707733e-05, 5.143880844116211e-05]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 4.0, 14.0, 14.0, 8.0, 14.0, 15.0, 15.0, 20.0, 17.0, 24.0, 23.0, 26.0, 34.0, 35.0, 36.0, 40.0, 51.0, 45.0, 38.0, 37.0, 46.0, 47.0, 31.0, 38.0, 34.0, 38.0, 41.0, 35.0, 31.0, 20.0, 18.0, 18.0, 19.0, 16.0, 20.0, 4.0, 5.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-05, -4.388391971588135e-05, -4.246830940246582e-05, -4.105269908905029e-05, -3.9637088775634766e-05, -3.822147846221924e-05, -3.680586814880371e-05, -3.5390257835388184e-05, -3.3974647521972656e-05, -3.255903720855713e-05, -3.11434268951416e-05, -2.9727816581726074e-05, -2.8312206268310547e-05, -2.689659595489502e-05, -2.5480985641479492e-05, -2.4065375328063965e-05, -2.2649765014648438e-05, -2.123415470123291e-05, -1.9818544387817383e-05, -1.8402934074401855e-05, -1.6987323760986328e-05, -1.55717134475708e-05, -1.4156103134155273e-05, -1.2740492820739746e-05, -1.1324882507324219e-05, -9.909272193908691e-06, -8.493661880493164e-06, -7.078051567077637e-06, -5.662441253662109e-06, -4.246830940246582e-06, -2.8312206268310547e-06, -1.4156103134155273e-06, 0.0, 1.4156103134155273e-06, 2.8312206268310547e-06, 4.246830940246582e-06, 5.662441253662109e-06, 7.078051567077637e-06, 8.493661880493164e-06, 9.909272193908691e-06, 1.1324882507324219e-05, 1.2740492820739746e-05, 1.4156103134155273e-05, 1.55717134475708e-05, 1.6987323760986328e-05, 1.8402934074401855e-05, 1.9818544387817383e-05, 2.123415470123291e-05, 2.2649765014648438e-05, 2.4065375328063965e-05, 2.5480985641479492e-05, 2.689659595489502e-05, 2.8312206268310547e-05, 2.9727816581726074e-05, 3.11434268951416e-05, 3.255903720855713e-05, 3.3974647521972656e-05, 3.5390257835388184e-05, 3.680586814880371e-05, 3.822147846221924e-05, 3.9637088775634766e-05, 4.105269908905029e-05, 4.246830940246582e-05, 4.388391971588135e-05, 4.5299530029296875e-05]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [6.0, 7.0, 5.0, 5.0, 6.0, 20.0, 33.0, 31.0, 43.0, 71.0, 90.0, 157.0, 156.0, 191.0, 270.0, 405.0, 449.0, 1116.0, 1052.0, 1498.0, 2156.0, 3159.0, 4761.0, 12875.0, 16183.0, 29858.0, 61633.0, 144771.0, 343474.0, 287607.0, 62154.0, 29818.0, 16030.0, 9477.0, 8055.0, 3131.0, 2209.0, 1513.0, 1093.0, 785.0, 801.0, 334.0, 271.0, 195.0, 136.0, 121.0, 107.0, 49.0, 46.0, 39.0, 33.0, 25.0, 37.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.5660341382026672e-06, -3.4365803003311157e-06, -3.307126462459564e-06, -3.1776726245880127e-06, -3.048218786716461e-06, -2.9187649488449097e-06, -2.789311110973358e-06, -2.6598572731018066e-06, -2.530403435230255e-06, -2.4009495973587036e-06, -2.271495759487152e-06, -2.1420419216156006e-06, -2.012588083744049e-06, -1.8831342458724976e-06, -1.753680408000946e-06, -1.6242265701293945e-06, -1.494772732257843e-06, -1.3653188943862915e-06, -1.23586505651474e-06, -1.1064112186431885e-06, -9.76957380771637e-07, -8.475035429000854e-07, -7.180497050285339e-07, -5.885958671569824e-07, -4.591420292854309e-07, -3.296881914138794e-07, -2.0023435354232788e-07, -7.078051567077637e-08, 5.8673322200775146e-08, 1.8812716007232666e-07, 3.175809979438782e-07, 4.470348358154297e-07, 5.764886736869812e-07, 7.059425115585327e-07, 8.353963494300842e-07, 9.648501873016357e-07, 1.0943040251731873e-06, 1.2237578630447388e-06, 1.3532117009162903e-06, 1.4826655387878418e-06, 1.6121193766593933e-06, 1.7415732145309448e-06, 1.8710270524024963e-06, 2.000480890274048e-06, 2.1299347281455994e-06, 2.259388566017151e-06, 2.3888424038887024e-06, 2.518296241760254e-06, 2.6477500796318054e-06, 2.777203917503357e-06, 2.9066577553749084e-06, 3.03611159324646e-06, 3.1655654311180115e-06, 3.295019268989563e-06, 3.4244731068611145e-06, 3.553926944732666e-06, 3.6833807826042175e-06, 3.812834620475769e-06, 3.9422884583473206e-06, 4.071742296218872e-06, 4.201196134090424e-06, 4.330649971961975e-06, 4.460103809833527e-06, 4.589557647705078e-06]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 11.0, 8.0, 10.0, 8.0, 11.0, 28.0, 32.0, 48.0, 47.0, 84.0, 43.0, 52.0, 138.0, 62.0, 105.0, 49.0, 89.0, 22.0, 23.0, 28.0, 13.0, 13.0, 4.0, 10.0, 9.0, 8.0, 9.0, 3.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.86102294921875e-06, -2.7762725949287415e-06, -2.691522240638733e-06, -2.6067718863487244e-06, -2.522021532058716e-06, -2.4372711777687073e-06, -2.3525208234786987e-06, -2.26777046918869e-06, -2.1830201148986816e-06, -2.098269760608673e-06, -2.0135194063186646e-06, -1.928769052028656e-06, -1.8440186977386475e-06, -1.759268343448639e-06, -1.6745179891586304e-06, -1.5897676348686218e-06, -1.5050172805786133e-06, -1.4202669262886047e-06, -1.3355165719985962e-06, -1.2507662177085876e-06, -1.166015863418579e-06, -1.0812655091285706e-06, -9.96515154838562e-07, -9.117648005485535e-07, -8.270144462585449e-07, -7.422640919685364e-07, -6.575137376785278e-07, -5.727633833885193e-07, -4.880130290985107e-07, -4.032626748085022e-07, -3.1851232051849365e-07, -2.337619662284851e-07, -1.4901161193847656e-07, -6.426125764846802e-08, 2.0489096641540527e-08, 1.0523945093154907e-07, 1.8998980522155762e-07, 2.7474015951156616e-07, 3.594905138015747e-07, 4.4424086809158325e-07, 5.289912223815918e-07, 6.137415766716003e-07, 6.984919309616089e-07, 7.832422852516174e-07, 8.67992639541626e-07, 9.527429938316345e-07, 1.037493348121643e-06, 1.1222437024116516e-06, 1.2069940567016602e-06, 1.2917444109916687e-06, 1.3764947652816772e-06, 1.4612451195716858e-06, 1.5459954738616943e-06, 1.6307458281517029e-06, 1.7154961824417114e-06, 1.80024653673172e-06, 1.8849968910217285e-06, 1.969747245311737e-06, 2.0544975996017456e-06, 2.139247953891754e-06, 2.2239983081817627e-06, 2.3087486624717712e-06, 2.3934990167617798e-06, 2.4782493710517883e-06, 2.562999725341797e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 13.0, 22.0, 18.0, 30.0, 30.0, 36.0, 60.0, 87.0, 101.0, 151.0, 191.0, 248.0, 329.0, 482.0, 633.0, 957.0, 1331.0, 2006.0, 3101.0, 5022.0, 8440.0, 16081.0, 32422.0, 76148.0, 240670.0, 271548.0, 240053.0, 76610.0, 32478.0, 15936.0, 8528.0, 5039.0, 2955.0, 2014.0, 1380.0, 927.0, 598.0, 501.0, 355.0, 265.0, 191.0, 137.0, 116.0, 74.0, 62.0, 40.0, 44.0, 30.0, 20.0, 12.0, 13.0, 6.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6954879760742188e-06, -3.5781413316726685e-06, -3.460794687271118e-06, -3.343448042869568e-06, -3.2261013984680176e-06, -3.1087547540664673e-06, -2.991408109664917e-06, -2.8740614652633667e-06, -2.7567148208618164e-06, -2.639368176460266e-06, -2.522021532058716e-06, -2.4046748876571655e-06, -2.2873282432556152e-06, -2.169981598854065e-06, -2.0526349544525146e-06, -1.9352883100509644e-06, -1.817941665649414e-06, -1.7005950212478638e-06, -1.5832483768463135e-06, -1.4659017324447632e-06, -1.3485550880432129e-06, -1.2312084436416626e-06, -1.1138617992401123e-06, -9.96515154838562e-07, -8.791685104370117e-07, -7.618218660354614e-07, -6.444752216339111e-07, -5.271285772323608e-07, -4.0978193283081055e-07, -2.9243528842926025e-07, -1.7508864402770996e-07, -5.774199962615967e-08, 5.960464477539063e-08, 1.7695128917694092e-07, 2.942979335784912e-07, 4.116445779800415e-07, 5.289912223815918e-07, 6.463378667831421e-07, 7.636845111846924e-07, 8.810311555862427e-07, 9.98377799987793e-07, 1.1157244443893433e-06, 1.2330710887908936e-06, 1.3504177331924438e-06, 1.4677643775939941e-06, 1.5851110219955444e-06, 1.7024576663970947e-06, 1.819804310798645e-06, 1.9371509552001953e-06, 2.0544975996017456e-06, 2.171844244003296e-06, 2.289190888404846e-06, 2.4065375328063965e-06, 2.5238841772079468e-06, 2.641230821609497e-06, 2.7585774660110474e-06, 2.8759241104125977e-06, 2.993270754814148e-06, 3.1106173992156982e-06, 3.2279640436172485e-06, 3.345310688018799e-06, 3.462657332420349e-06, 3.5800039768218994e-06, 3.6973506212234497e-06, 3.814697265625e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 7.0, 9.0, 15.0, 3.0, 14.0, 22.0, 19.0, 35.0, 54.0, 27.0, 80.0, 89.0, 106.0, 54.0, 99.0, 78.0, 39.0, 66.0, 47.0, 44.0, 12.0, 19.0, 10.0, 6.0, 13.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0994415283203125e-06, -2.9979273676872253e-06, -2.896413207054138e-06, -2.794899046421051e-06, -2.693384885787964e-06, -2.5918707251548767e-06, -2.4903565645217896e-06, -2.3888424038887024e-06, -2.2873282432556152e-06, -2.185814082622528e-06, -2.084299921989441e-06, -1.9827857613563538e-06, -1.8812716007232666e-06, -1.7797574400901794e-06, -1.6782432794570923e-06, -1.5767291188240051e-06, -1.475214958190918e-06, -1.3737007975578308e-06, -1.2721866369247437e-06, -1.1706724762916565e-06, -1.0691583156585693e-06, -9.676441550254822e-07, -8.66129994392395e-07, -7.646158337593079e-07, -6.631016731262207e-07, -5.615875124931335e-07, -4.600733518600464e-07, -3.5855919122695923e-07, -2.5704503059387207e-07, -1.555308699607849e-07, -5.4016709327697754e-08, 4.7497451305389404e-08, 1.4901161193847656e-07, 2.505257725715637e-07, 3.520399332046509e-07, 4.5355409383773804e-07, 5.550682544708252e-07, 6.565824151039124e-07, 7.580965757369995e-07, 8.596107363700867e-07, 9.611248970031738e-07, 1.062639057636261e-06, 1.1641532182693481e-06, 1.2656673789024353e-06, 1.3671815395355225e-06, 1.4686957001686096e-06, 1.5702098608016968e-06, 1.671724021434784e-06, 1.773238182067871e-06, 1.8747523427009583e-06, 1.9762665033340454e-06, 2.0777806639671326e-06, 2.1792948246002197e-06, 2.280808985233307e-06, 2.382323145866394e-06, 2.483837306499481e-06, 2.5853514671325684e-06, 2.6868656277656555e-06, 2.7883797883987427e-06, 2.88989394903183e-06, 2.991408109664917e-06, 3.092922270298004e-06, 3.1944364309310913e-06, 3.2959505915641785e-06, 3.3974647521972656e-06]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 11.0, 11.0, 17.0, 18.0, 14.0, 20.0, 42.0, 59.0, 115.0, 194.0, 125.0, 70.0, 60.0, 41.0, 31.0, 28.0, 24.0, 15.0, 20.0, 19.0, 9.0, 10.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002257805026602, -0.00021864150767214596, -0.0002115024981321767, -0.00020436350314412266, -0.00019722450815606862, -0.00019008549861609936, -0.00018294650362804532, -0.00017580750863999128, -0.00016866851365193725, -0.0001615295186638832, -0.00015439050912391394, -0.0001472515141358599, -0.00014011251914780587, -0.0001329735096078366, -0.00012583451461978257, -0.00011869551963172853, -0.00011155651736771688, -0.00010441751510370523, -9.727852011565119e-05, -9.013951785163954e-05, -8.30005228635855e-05, -7.586152059957385e-05, -6.872252561151981e-05, -6.158352334750816e-05, -5.444452472147532e-05, -4.7305526095442474e-05, -4.016652746940963e-05, -3.3027528843376786e-05, -2.5888528398354538e-05, -1.874952795333229e-05, -1.1610529327299446e-05, -4.471530701266602e-06, 2.6674679247662425e-06, 9.806466550799087e-06, 1.694546517683193e-05, 2.408446562185418e-05, 3.122346242889762e-05, 3.836246469290927e-05, 4.5501463318942115e-05, 5.264046194497496e-05, 5.97794605710078e-05, 6.691845919704065e-05, 7.40574614610523e-05, 8.119645644910634e-05, 8.833545871311799e-05, 9.547446097712964e-05, 0.00010261345596518368, 0.00010975245095323771, 0.00011689145321724936, 0.00012403045548126101, 0.00013116945046931505, 0.0001383084454573691, 0.00014544745499733835, 0.0001525864499853924, 0.00015972544497344643, 0.0001668644545134157, 0.00017400344950146973, 0.00018114244448952377, 0.00018828145402949303, 0.00019542044901754707, 0.0002025594440056011, 0.00020969845354557037, 0.0002168374485336244, 0.00022397644352167845, 0.00023111543850973248]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 4.0, 8.0, 11.0, 7.0, 11.0, 17.0, 10.0, 15.0, 16.0, 26.0, 18.0, 32.0, 25.0, 38.0, 24.0, 33.0, 35.0, 44.0, 32.0, 36.0, 32.0, 43.0, 37.0, 39.0, 38.0, 37.0, 25.0, 32.0, 23.0, 26.0, 24.0, 24.0, 24.0, 18.0, 24.0, 15.0, 14.0, 15.0, 10.0, 11.0, 11.0, 3.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.00012475252151489258, -0.00012094993144273758, -0.00011714734137058258, -0.00011334475129842758, -0.00010954216122627258, -0.00010573957115411758, -0.00010193698108196259, -9.813439100980759e-05, -9.433180093765259e-05, -9.052921086549759e-05, -8.672662079334259e-05, -8.292403072118759e-05, -7.912144064903259e-05, -7.53188505768776e-05, -7.15162605047226e-05, -6.77136704325676e-05, -6.39110803604126e-05, -6.01084902882576e-05, -5.63059002161026e-05, -5.25033101439476e-05, -4.87007200717926e-05, -4.4898129999637604e-05, -4.1095539927482605e-05, -3.7292949855327606e-05, -3.349035978317261e-05, -2.968776971101761e-05, -2.588517963886261e-05, -2.208258956670761e-05, -1.8279999494552612e-05, -1.4477409422397614e-05, -1.0674819350242615e-05, -6.872229278087616e-06, -3.069639205932617e-06, 7.329508662223816e-07, 4.53554093837738e-06, 8.338131010532379e-06, 1.2140721082687378e-05, 1.5943311154842377e-05, 1.9745901226997375e-05, 2.3548491299152374e-05, 2.7351081371307373e-05, 3.115367144346237e-05, 3.495626151561737e-05, 3.875885158777237e-05, 4.256144165992737e-05, 4.636403173208237e-05, 5.0166621804237366e-05, 5.3969211876392365e-05, 5.777180194854736e-05, 6.157439202070236e-05, 6.537698209285736e-05, 6.917957216501236e-05, 7.298216223716736e-05, 7.678475230932236e-05, 8.058734238147736e-05, 8.438993245363235e-05, 8.819252252578735e-05, 9.199511259794235e-05, 9.579770267009735e-05, 9.960029274225235e-05, 0.00010340288281440735, 0.00010720547288656235, 0.00011100806295871735, 0.00011481065303087234, 0.00011861324310302734]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 9.0, 15.0, 23.0, 40.0, 72.0, 96.0, 172.0, 241.0, 394.0, 597.0, 1008.0, 1694.0, 2952.0, 5619.0, 10986.0, 22142.0, 50992.0, 174162.0, 3666485.0, 162763.0, 49410.0, 21213.0, 10377.0, 5033.0, 2695.0, 1505.0, 972.0, 620.0, 420.0, 338.0, 250.0, 183.0, 137.0, 119.0, 91.0, 66.0, 76.0, 49.0, 54.0, 39.0, 30.0, 25.0, 35.0, 14.0, 17.0, 9.0, 17.0, 11.0, 4.0, 3.0, 2.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010925531387329102, -0.00010417494922876358, -9.909458458423615e-05, -9.401421993970871e-05, -8.893385529518127e-05, -8.385349065065384e-05, -7.87731260061264e-05, -7.369276136159897e-05, -6.861239671707153e-05, -6.35320320725441e-05, -5.845166742801666e-05, -5.337130278348923e-05, -4.829093813896179e-05, -4.321057349443436e-05, -3.813020884990692e-05, -3.3049844205379486e-05, -2.796947956085205e-05, -2.2889114916324615e-05, -1.780875027179718e-05, -1.2728385627269745e-05, -7.64802098274231e-06, -2.5676563382148743e-06, 2.512708306312561e-06, 7.593072950839996e-06, 1.2673437595367432e-05, 1.7753802239894867e-05, 2.2834166884422302e-05, 2.7914531528949738e-05, 3.299489617347717e-05, 3.807526081800461e-05, 4.3155625462532043e-05, 4.823599010705948e-05, 5.3316354751586914e-05, 5.839671939611435e-05, 6.347708404064178e-05, 6.855744868516922e-05, 7.363781332969666e-05, 7.871817797422409e-05, 8.379854261875153e-05, 8.887890726327896e-05, 9.39592719078064e-05, 9.903963655233383e-05, 0.00010412000119686127, 0.0001092003658413887, 0.00011428073048591614, 0.00011936109513044357, 0.000124441459774971, 0.00012952182441949844, 0.00013460218906402588, 0.00013968255370855331, 0.00014476291835308075, 0.00014984328299760818, 0.00015492364764213562, 0.00016000401228666306, 0.0001650843769311905, 0.00017016474157571793, 0.00017524510622024536, 0.0001803254708647728, 0.00018540583550930023, 0.00019048620015382767, 0.0001955665647983551, 0.00020064692944288254, 0.00020572729408740997, 0.0002108076587319374, 0.00021588802337646484]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 10.0, 17.0, 11.0, 25.0, 31.0, 39.0, 47.0, 67.0, 87.0, 104.0, 98.0, 82.0, 89.0, 82.0, 45.0, 44.0, 26.0, 40.0, 15.0, 16.0, 7.0, 0.0, 6.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0325183868408203e-05, -1.9390136003494263e-05, -1.8455088138580322e-05, -1.7520040273666382e-05, -1.658499240875244e-05, -1.56499445438385e-05, -1.471489667892456e-05, -1.377984881401062e-05, -1.284480094909668e-05, -1.190975308418274e-05, -1.0974705219268799e-05, -1.0039657354354858e-05, -9.104609489440918e-06, -8.169561624526978e-06, -7.234513759613037e-06, -6.299465894699097e-06, -5.364418029785156e-06, -4.429370164871216e-06, -3.4943222999572754e-06, -2.559274435043335e-06, -1.6242265701293945e-06, -6.891787052154541e-07, 2.4586915969848633e-07, 1.1809170246124268e-06, 2.115964889526367e-06, 3.0510127544403076e-06, 3.986060619354248e-06, 4.9211084842681885e-06, 5.856156349182129e-06, 6.791204214096069e-06, 7.72625207901001e-06, 8.66129994392395e-06, 9.59634780883789e-06, 1.0531395673751831e-05, 1.1466443538665771e-05, 1.2401491403579712e-05, 1.3336539268493652e-05, 1.4271587133407593e-05, 1.5206634998321533e-05, 1.6141682863235474e-05, 1.7076730728149414e-05, 1.8011778593063354e-05, 1.8946826457977295e-05, 1.9881874322891235e-05, 2.0816922187805176e-05, 2.1751970052719116e-05, 2.2687017917633057e-05, 2.3622065782546997e-05, 2.4557113647460938e-05, 2.5492161512374878e-05, 2.642720937728882e-05, 2.736225724220276e-05, 2.82973051071167e-05, 2.923235297203064e-05, 3.016740083694458e-05, 3.110244870185852e-05, 3.203749656677246e-05, 3.29725444316864e-05, 3.390759229660034e-05, 3.484264016151428e-05, 3.577768802642822e-05, 3.671273589134216e-05, 3.7647783756256104e-05, 3.8582831621170044e-05, 3.9517879486083984e-05]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 11.0, 14.0, 24.0, 29.0, 43.0, 74.0, 100.0, 132.0, 241.0, 328.0, 512.0, 787.0, 1269.0, 1989.0, 3065.0, 5142.0, 8920.0, 15747.0, 28132.0, 57949.0, 132211.0, 505120.0, 3008455.0, 240989.0, 89137.0, 41645.0, 21797.0, 12294.0, 6877.0, 4171.0, 2519.0, 1657.0, 1004.0, 636.0, 422.0, 282.0, 175.0, 113.0, 93.0, 59.0, 43.0, 21.0, 21.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-8.118152618408203e-05, -7.881317287683487e-05, -7.644481956958771e-05, -7.407646626234055e-05, -7.170811295509338e-05, -6.933975964784622e-05, -6.697140634059906e-05, -6.46030530333519e-05, -6.223469972610474e-05, -5.9866346418857574e-05, -5.749799311161041e-05, -5.512963980436325e-05, -5.276128649711609e-05, -5.039293318986893e-05, -4.8024579882621765e-05, -4.56562265753746e-05, -4.328787326812744e-05, -4.091951996088028e-05, -3.855116665363312e-05, -3.6182813346385956e-05, -3.3814460039138794e-05, -3.144610673189163e-05, -2.907775342464447e-05, -2.670940011739731e-05, -2.4341046810150146e-05, -2.1972693502902985e-05, -1.9604340195655823e-05, -1.723598688840866e-05, -1.4867633581161499e-05, -1.2499280273914337e-05, -1.0130926966667175e-05, -7.762573659420013e-06, -5.3942203521728516e-06, -3.0258670449256897e-06, -6.575137376785278e-07, 1.710839569568634e-06, 4.079192876815796e-06, 6.447546184062958e-06, 8.81589949131012e-06, 1.1184252798557281e-05, 1.3552606105804443e-05, 1.5920959413051605e-05, 1.8289312720298767e-05, 2.065766602754593e-05, 2.302601933479309e-05, 2.5394372642040253e-05, 2.7762725949287415e-05, 3.0131079256534576e-05, 3.249943256378174e-05, 3.48677858710289e-05, 3.723613917827606e-05, 3.9604492485523224e-05, 4.1972845792770386e-05, 4.434119910001755e-05, 4.670955240726471e-05, 4.907790571451187e-05, 5.144625902175903e-05, 5.3814612329006195e-05, 5.618296563625336e-05, 5.855131894350052e-05, 6.091967225074768e-05, 6.328802555799484e-05, 6.5656378865242e-05, 6.802473217248917e-05, 7.039308547973633e-05]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 7.0, 8.0, 9.0, 16.0, 23.0, 31.0, 27.0, 36.0, 62.0, 76.0, 73.0, 110.0, 191.0, 555.0, 1528.0, 541.0, 185.0, 115.0, 79.0, 54.0, 60.0, 56.0, 35.0, 33.0, 34.0, 27.0, 21.0, 9.0, 13.0, 8.0, 5.0, 8.0, 7.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.221366882324219e-05, -5.0445087254047394e-05, -4.86765056848526e-05, -4.6907924115657806e-05, -4.513934254646301e-05, -4.337076097726822e-05, -4.1602179408073425e-05, -3.983359783887863e-05, -3.806501626968384e-05, -3.6296434700489044e-05, -3.452785313129425e-05, -3.275927156209946e-05, -3.099068999290466e-05, -2.922210842370987e-05, -2.7453526854515076e-05, -2.5684945285320282e-05, -2.3916363716125488e-05, -2.2147782146930695e-05, -2.03792005777359e-05, -1.8610619008541107e-05, -1.6842037439346313e-05, -1.507345587015152e-05, -1.3304874300956726e-05, -1.1536292731761932e-05, -9.767711162567139e-06, -7.999129593372345e-06, -6.230548024177551e-06, -4.4619664549827576e-06, -2.693384885787964e-06, -9.248033165931702e-07, 8.437782526016235e-07, 2.6123598217964172e-06, 4.380941390991211e-06, 6.149522960186005e-06, 7.918104529380798e-06, 9.686686098575592e-06, 1.1455267667770386e-05, 1.322384923696518e-05, 1.4992430806159973e-05, 1.6761012375354767e-05, 1.852959394454956e-05, 2.0298175513744354e-05, 2.2066757082939148e-05, 2.383533865213394e-05, 2.5603920221328735e-05, 2.737250179052353e-05, 2.9141083359718323e-05, 3.0909664928913116e-05, 3.267824649810791e-05, 3.4446828067302704e-05, 3.62154096364975e-05, 3.798399120569229e-05, 3.9752572774887085e-05, 4.152115434408188e-05, 4.328973591327667e-05, 4.5058317482471466e-05, 4.682689905166626e-05, 4.8595480620861053e-05, 5.036406219005585e-05, 5.213264375925064e-05, 5.3901225328445435e-05, 5.566980689764023e-05, 5.743838846683502e-05, 5.9206970036029816e-05, 6.097555160522461e-05]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 2.0, 19.0, 18.0, 24.0, 32.0, 64.0, 93.0, 165.0, 138.0, 112.0, 83.0, 61.0, 42.0, 29.0, 24.0, 14.0, 14.0, 15.0, 9.0, 13.0, 6.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004161005490459502, -0.0004025893867947161, -0.0003890781954396516, -0.0003755670040845871, -0.00036205584183335304, -0.000348544679582119, -0.0003350334882270545, -0.00032152229687198997, -0.0003080111346207559, -0.00029449997236952186, -0.00028098878101445735, -0.00026747758965939283, -0.0002539664274081588, -0.0002404552506050095, -0.0002269440738018602, -0.00021343289699871093, -0.00019992172019556165, -0.00018641054339241236, -0.00017289936658926308, -0.0001593881897861138, -0.00014587701298296452, -0.00013236583617981523, -0.00011885465937666595, -0.00010534348257351667, -9.183230577036738e-05, -7.83211289672181e-05, -6.480995216406882e-05, -5.1298775360919535e-05, -3.778759855777025e-05, -2.427642175462097e-05, -1.0765244951471686e-05, 2.7459318516775966e-06, 1.625710865482688e-05, 2.9768285457976162e-05, 4.3279462261125445e-05, 5.679063906427473e-05, 7.030181586742401e-05, 8.38129926705733e-05, 9.732416947372258e-05, 0.00011083534627687186, 0.00012434652308002114, 0.00013785769988317043, 0.0001513688766863197, 0.000164880053489469, 0.00017839123029261827, 0.00019190240709576756, 0.00020541358389891684, 0.00021892476070206612, 0.0002324359375052154, 0.00024594709975644946, 0.00025945829111151397, 0.0002729694824665785, 0.00028648064471781254, 0.0002999918069690466, 0.0003135029983241111, 0.0003270141896791756, 0.00034052535193040967, 0.0003540365141816437, 0.00036754770553670824, 0.00038105889689177275, 0.0003945700591430068, 0.00040808122139424086, 0.00042159241274930537, 0.0004351036041043699, 0.00044861476635560393]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 14.0, 14.0, 8.0, 21.0, 14.0, 31.0, 20.0, 36.0, 26.0, 26.0, 33.0, 32.0, 45.0, 48.0, 50.0, 28.0, 55.0, 30.0, 34.0, 44.0, 34.0, 38.0, 30.0, 27.0, 26.0, 21.0, 28.0, 25.0, 27.0, 11.0, 25.0, 9.0, 12.0, 19.0, 5.0, 16.0, 6.0, 8.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001920461654663086, -0.00018588639795780182, -0.00017972663044929504, -0.00017356686294078827, -0.0001674070954322815, -0.00016124732792377472, -0.00015508756041526794, -0.00014892779290676117, -0.0001427680253982544, -0.00013660825788974762, -0.00013044849038124084, -0.00012428872287273407, -0.0001181289553642273, -0.00011196918785572052, -0.00010580942034721375, -9.964965283870697e-05, -9.34898853302002e-05, -8.733011782169342e-05, -8.117035031318665e-05, -7.501058280467987e-05, -6.88508152961731e-05, -6.269104778766632e-05, -5.6531280279159546e-05, -5.037151277065277e-05, -4.4211745262145996e-05, -3.805197775363922e-05, -3.1892210245132446e-05, -2.573244273662567e-05, -1.9572675228118896e-05, -1.3412907719612122e-05, -7.253140211105347e-06, -1.0933727025985718e-06, 5.066394805908203e-06, 1.1226162314414978e-05, 1.7385929822921753e-05, 2.3545697331428528e-05, 2.9705464839935303e-05, 3.586523234844208e-05, 4.202499985694885e-05, 4.818476736545563e-05, 5.43445348739624e-05, 6.050430238246918e-05, 6.666406989097595e-05, 7.282383739948273e-05, 7.89836049079895e-05, 8.514337241649628e-05, 9.130313992500305e-05, 9.746290743350983e-05, 0.0001036226749420166, 0.00010978244245052338, 0.00011594220995903015, 0.00012210197746753693, 0.0001282617449760437, 0.00013442151248455048, 0.00014058127999305725, 0.00014674104750156403, 0.0001529008150100708, 0.00015906058251857758, 0.00016522035002708435, 0.00017138011753559113, 0.0001775398850440979, 0.00018369965255260468, 0.00018985942006111145, 0.00019601918756961823, 0.000202178955078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 11.0, 16.0, 25.0, 33.0, 32.0, 42.0, 74.0, 105.0, 120.0, 263.0, 516.0, 1249.0, 3399.0, 10343.0, 34249.0, 179974.0, 694332.0, 91144.0, 21322.0, 6915.0, 2425.0, 960.0, 443.0, 182.0, 119.0, 82.0, 58.0, 28.0, 23.0, 19.0, 9.0, 12.0, 5.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027632713317871094, -0.0002680346369743347, -0.0002597421407699585, -0.0002514496445655823, -0.00024315714836120605, -0.00023486465215682983, -0.0002265721559524536, -0.0002182796597480774, -0.00020998716354370117, -0.00020169466733932495, -0.00019340217113494873, -0.0001851096749305725, -0.0001768171787261963, -0.00016852468252182007, -0.00016023218631744385, -0.00015193969011306763, -0.0001436471939086914, -0.00013535469770431519, -0.00012706220149993896, -0.00011876970529556274, -0.00011047720909118652, -0.0001021847128868103, -9.389221668243408e-05, -8.559972047805786e-05, -7.730722427368164e-05, -6.901472806930542e-05, -6.07222318649292e-05, -5.242973566055298e-05, -4.413723945617676e-05, -3.584474325180054e-05, -2.7552247047424316e-05, -1.9259750843048096e-05, -1.0967254638671875e-05, -2.6747584342956543e-06, 5.617737770080566e-06, 1.3910233974456787e-05, 2.2202730178833008e-05, 3.049522638320923e-05, 3.878772258758545e-05, 4.708021879196167e-05, 5.537271499633789e-05, 6.366521120071411e-05, 7.195770740509033e-05, 8.025020360946655e-05, 8.854269981384277e-05, 9.6835196018219e-05, 0.00010512769222259521, 0.00011342018842697144, 0.00012171268463134766, 0.00013000518083572388, 0.0001382976770401001, 0.00014659017324447632, 0.00015488266944885254, 0.00016317516565322876, 0.00017146766185760498, 0.0001797601580619812, 0.00018805265426635742, 0.00019634515047073364, 0.00020463764667510986, 0.00021293014287948608, 0.0002212226390838623, 0.00022951513528823853, 0.00023780763149261475, 0.00024610012769699097, 0.0002543926239013672]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 5.0, 8.0, 13.0, 15.0, 16.0, 21.0, 49.0, 47.0, 77.0, 95.0, 109.0, 118.0, 99.0, 86.0, 62.0, 56.0, 26.0, 18.0, 24.0, 14.0, 19.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.707114279270172e-05, -1.6082078218460083e-05, -1.5093013644218445e-05, -1.4103949069976807e-05, -1.3114884495735168e-05, -1.212581992149353e-05, -1.1136755347251892e-05, -1.0147690773010254e-05, -9.158626198768616e-06, -8.169561624526978e-06, -7.180497050285339e-06, -6.191432476043701e-06, -5.202367901802063e-06, -4.213303327560425e-06, -3.2242387533187866e-06, -2.2351741790771484e-06, -1.2461096048355103e-06, -2.5704503059387207e-07, 7.320195436477661e-07, 1.7210841178894043e-06, 2.7101486921310425e-06, 3.6992132663726807e-06, 4.688277840614319e-06, 5.677342414855957e-06, 6.666406989097595e-06, 7.655471563339233e-06, 8.644536137580872e-06, 9.63360071182251e-06, 1.0622665286064148e-05, 1.1611729860305786e-05, 1.2600794434547424e-05, 1.3589859008789062e-05, 1.45789235830307e-05, 1.556798815727234e-05, 1.6557052731513977e-05, 1.7546117305755615e-05, 1.8535181879997253e-05, 1.952424645423889e-05, 2.051331102848053e-05, 2.1502375602722168e-05, 2.2491440176963806e-05, 2.3480504751205444e-05, 2.4469569325447083e-05, 2.545863389968872e-05, 2.644769847393036e-05, 2.7436763048171997e-05, 2.8425827622413635e-05, 2.9414892196655273e-05, 3.040395677089691e-05, 3.139302134513855e-05, 3.238208591938019e-05, 3.3371150493621826e-05, 3.4360215067863464e-05, 3.53492796421051e-05, 3.633834421634674e-05, 3.732740879058838e-05, 3.831647336483002e-05, 3.9305537939071655e-05, 4.0294602513313293e-05, 4.128366708755493e-05, 4.227273166179657e-05, 4.326179623603821e-05, 4.4250860810279846e-05, 4.5239925384521484e-05]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 17.0, 25.0, 24.0, 39.0, 66.0, 84.0, 116.0, 181.0, 268.0, 413.0, 532.0, 818.0, 1202.0, 1855.0, 2674.0, 4125.0, 6632.0, 9993.0, 16221.0, 26641.0, 46157.0, 85564.0, 183420.0, 364461.0, 132762.0, 68228.0, 36839.0, 21520.0, 13160.0, 8450.0, 5472.0, 3596.0, 2301.0, 1529.0, 998.0, 685.0, 441.0, 325.0, 228.0, 130.0, 113.0, 82.0, 50.0, 30.0, 22.0, 19.0, 13.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.608797073364258e-05, -5.423650145530701e-05, -5.2385032176971436e-05, -5.0533562898635864e-05, -4.868209362030029e-05, -4.683062434196472e-05, -4.497915506362915e-05, -4.312768578529358e-05, -4.127621650695801e-05, -3.9424747228622437e-05, -3.7573277950286865e-05, -3.5721808671951294e-05, -3.387033939361572e-05, -3.201887011528015e-05, -3.016740083694458e-05, -2.831593155860901e-05, -2.6464462280273438e-05, -2.4612993001937866e-05, -2.2761523723602295e-05, -2.0910054445266724e-05, -1.9058585166931152e-05, -1.720711588859558e-05, -1.535564661026001e-05, -1.3504177331924438e-05, -1.1652708053588867e-05, -9.801238775253296e-06, -7.949769496917725e-06, -6.098300218582153e-06, -4.246830940246582e-06, -2.3953616619110107e-06, -5.438923835754395e-07, 1.3075768947601318e-06, 3.159046173095703e-06, 5.010515451431274e-06, 6.861984729766846e-06, 8.713454008102417e-06, 1.0564923286437988e-05, 1.241639256477356e-05, 1.4267861843109131e-05, 1.6119331121444702e-05, 1.7970800399780273e-05, 1.9822269678115845e-05, 2.1673738956451416e-05, 2.3525208234786987e-05, 2.537667751312256e-05, 2.722814679145813e-05, 2.90796160697937e-05, 3.093108534812927e-05, 3.2782554626464844e-05, 3.4634023904800415e-05, 3.6485493183135986e-05, 3.833696246147156e-05, 4.018843173980713e-05, 4.20399010181427e-05, 4.389137029647827e-05, 4.574283957481384e-05, 4.7594308853149414e-05, 4.9445778131484985e-05, 5.129724740982056e-05, 5.314871668815613e-05, 5.50001859664917e-05, 5.685165524482727e-05, 5.870312452316284e-05, 6.055459380149841e-05, 6.240606307983398e-05]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 8.0, 14.0, 13.0, 10.0, 9.0, 9.0, 20.0, 13.0, 29.0, 20.0, 35.0, 26.0, 44.0, 39.0, 42.0, 46.0, 40.0, 42.0, 60.0, 43.0, 48.0, 29.0, 54.0, 41.0, 32.0, 30.0, 30.0, 22.0, 27.0, 28.0, 8.0, 13.0, 7.0, 17.0, 12.0, 10.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.988908767700195e-05, -4.8412010073661804e-05, -4.6934932470321655e-05, -4.5457854866981506e-05, -4.398077726364136e-05, -4.250369966030121e-05, -4.102662205696106e-05, -3.954954445362091e-05, -3.807246685028076e-05, -3.659538924694061e-05, -3.5118311643600464e-05, -3.3641234040260315e-05, -3.2164156436920166e-05, -3.068707883358002e-05, -2.9210001230239868e-05, -2.773292362689972e-05, -2.625584602355957e-05, -2.477876842021942e-05, -2.3301690816879272e-05, -2.1824613213539124e-05, -2.0347535610198975e-05, -1.8870458006858826e-05, -1.7393380403518677e-05, -1.5916302800178528e-05, -1.4439225196838379e-05, -1.296214759349823e-05, -1.1485069990158081e-05, -1.0007992386817932e-05, -8.530914783477783e-06, -7.053837180137634e-06, -5.576759576797485e-06, -4.0996819734573364e-06, -2.6226043701171875e-06, -1.1455267667770386e-06, 3.3155083656311035e-07, 1.8086284399032593e-06, 3.285706043243408e-06, 4.762783646583557e-06, 6.239861249923706e-06, 7.716938853263855e-06, 9.194016456604004e-06, 1.0671094059944153e-05, 1.2148171663284302e-05, 1.362524926662445e-05, 1.51023268699646e-05, 1.657940447330475e-05, 1.8056482076644897e-05, 1.9533559679985046e-05, 2.1010637283325195e-05, 2.2487714886665344e-05, 2.3964792490005493e-05, 2.5441870093345642e-05, 2.691894769668579e-05, 2.839602530002594e-05, 2.987310290336609e-05, 3.135018050670624e-05, 3.282725811004639e-05, 3.4304335713386536e-05, 3.5781413316726685e-05, 3.7258490920066833e-05, 3.873556852340698e-05, 4.021264612674713e-05, 4.168972373008728e-05, 4.316680133342743e-05, 4.464387893676758e-05]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 10.0, 12.0, 20.0, 35.0, 42.0, 60.0, 78.0, 165.0, 168.0, 255.0, 410.0, 928.0, 1281.0, 2167.0, 3715.0, 10808.0, 18870.0, 45351.0, 129124.0, 531376.0, 190999.0, 62751.0, 24910.0, 13796.0, 4623.0, 2581.0, 1464.0, 1070.0, 487.0, 320.0, 230.0, 170.0, 89.0, 63.0, 44.0, 28.0, 14.0, 11.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.092952728271484e-06, -6.899237632751465e-06, -6.705522537231445e-06, -6.511807441711426e-06, -6.318092346191406e-06, -6.124377250671387e-06, -5.930662155151367e-06, -5.736947059631348e-06, -5.543231964111328e-06, -5.349516868591309e-06, -5.155801773071289e-06, -4.9620866775512695e-06, -4.76837158203125e-06, -4.5746564865112305e-06, -4.380941390991211e-06, -4.187226295471191e-06, -3.993511199951172e-06, -3.7997961044311523e-06, -3.606081008911133e-06, -3.4123659133911133e-06, -3.2186508178710938e-06, -3.0249357223510742e-06, -2.8312206268310547e-06, -2.637505531311035e-06, -2.4437904357910156e-06, -2.250075340270996e-06, -2.0563602447509766e-06, -1.862645149230957e-06, -1.6689300537109375e-06, -1.475214958190918e-06, -1.2814998626708984e-06, -1.087784767150879e-06, -8.940696716308594e-07, -7.003545761108398e-07, -5.066394805908203e-07, -3.129243850708008e-07, -1.1920928955078125e-07, 7.450580596923828e-08, 2.682209014892578e-07, 4.6193599700927734e-07, 6.556510925292969e-07, 8.493661880493164e-07, 1.043081283569336e-06, 1.2367963790893555e-06, 1.430511474609375e-06, 1.6242265701293945e-06, 1.817941665649414e-06, 2.0116567611694336e-06, 2.205371856689453e-06, 2.3990869522094727e-06, 2.592802047729492e-06, 2.7865171432495117e-06, 2.9802322387695312e-06, 3.1739473342895508e-06, 3.3676624298095703e-06, 3.56137752532959e-06, 3.7550926208496094e-06, 3.948807716369629e-06, 4.1425228118896484e-06, 4.336237907409668e-06, 4.5299530029296875e-06, 4.723668098449707e-06, 4.9173831939697266e-06, 5.111098289489746e-06, 5.304813385009766e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 12.0, 3.0, 5.0, 5.0, 14.0, 10.0, 10.0, 22.0, 46.0, 32.0, 37.0, 54.0, 97.0, 56.0, 51.0, 45.0, 139.0, 54.0, 50.0, 46.0, 64.0, 34.0, 19.0, 11.0, 26.0, 9.0, 6.0, 9.0, 10.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.952052116394043e-06, -1.8775463104248047e-06, -1.8030405044555664e-06, -1.7285346984863281e-06, -1.6540288925170898e-06, -1.5795230865478516e-06, -1.5050172805786133e-06, -1.430511474609375e-06, -1.3560056686401367e-06, -1.2814998626708984e-06, -1.2069940567016602e-06, -1.1324882507324219e-06, -1.0579824447631836e-06, -9.834766387939453e-07, -9.08970832824707e-07, -8.344650268554688e-07, -7.599592208862305e-07, -6.854534149169922e-07, -6.109476089477539e-07, -5.364418029785156e-07, -4.6193599700927734e-07, -3.8743019104003906e-07, -3.129243850708008e-07, -2.384185791015625e-07, -1.6391277313232422e-07, -8.940696716308594e-08, -1.4901161193847656e-08, 5.960464477539063e-08, 1.341104507446289e-07, 2.086162567138672e-07, 2.8312206268310547e-07, 3.5762786865234375e-07, 4.3213367462158203e-07, 5.066394805908203e-07, 5.811452865600586e-07, 6.556510925292969e-07, 7.301568984985352e-07, 8.046627044677734e-07, 8.791685104370117e-07, 9.5367431640625e-07, 1.0281801223754883e-06, 1.1026859283447266e-06, 1.1771917343139648e-06, 1.2516975402832031e-06, 1.3262033462524414e-06, 1.4007091522216797e-06, 1.475214958190918e-06, 1.5497207641601562e-06, 1.6242265701293945e-06, 1.6987323760986328e-06, 1.773238182067871e-06, 1.8477439880371094e-06, 1.9222497940063477e-06, 1.996755599975586e-06, 2.0712614059448242e-06, 2.1457672119140625e-06, 2.2202730178833008e-06, 2.294778823852539e-06, 2.3692846298217773e-06, 2.4437904357910156e-06, 2.518296241760254e-06, 2.592802047729492e-06, 2.6673078536987305e-06, 2.7418136596679688e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 10.0, 26.0, 26.0, 37.0, 65.0, 22.0, 105.0, 161.0, 255.0, 384.0, 584.0, 908.0, 1390.0, 2364.0, 1736.0, 5294.0, 9842.0, 18139.0, 36934.0, 82179.0, 238601.0, 405637.0, 132858.0, 32612.0, 36949.0, 18234.0, 9727.0, 5362.0, 3103.0, 1826.0, 1104.0, 711.0, 256.0, 361.0, 208.0, 149.0, 119.0, 85.0, 40.0, 35.0, 33.0, 9.0, 23.0, 10.0, 3.0, 8.0, 6.0, 7.0, 2.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.7616118788719177e-06, -3.648921847343445e-06, -3.536231815814972e-06, -3.423541784286499e-06, -3.310851752758026e-06, -3.1981617212295532e-06, -3.0854716897010803e-06, -2.9727816581726074e-06, -2.8600916266441345e-06, -2.7474015951156616e-06, -2.6347115635871887e-06, -2.522021532058716e-06, -2.409331500530243e-06, -2.29664146900177e-06, -2.183951437473297e-06, -2.0712614059448242e-06, -1.9585713744163513e-06, -1.8458813428878784e-06, -1.7331913113594055e-06, -1.6205012798309326e-06, -1.5078112483024597e-06, -1.3951212167739868e-06, -1.282431185245514e-06, -1.169741153717041e-06, -1.0570511221885681e-06, -9.443610906600952e-07, -8.316710591316223e-07, -7.189810276031494e-07, -6.062909960746765e-07, -4.936009645462036e-07, -3.809109330177307e-07, -2.682209014892578e-07, -1.555308699607849e-07, -4.284083843231201e-08, 6.984919309616089e-08, 1.825392246246338e-07, 2.952292561531067e-07, 4.079192876815796e-07, 5.206093192100525e-07, 6.332993507385254e-07, 7.459893822669983e-07, 8.586794137954712e-07, 9.71369445323944e-07, 1.084059476852417e-06, 1.1967495083808899e-06, 1.3094395399093628e-06, 1.4221295714378357e-06, 1.5348196029663086e-06, 1.6475096344947815e-06, 1.7601996660232544e-06, 1.8728896975517273e-06, 1.9855797290802e-06, 2.098269760608673e-06, 2.210959792137146e-06, 2.323649823665619e-06, 2.436339855194092e-06, 2.5490298867225647e-06, 2.6617199182510376e-06, 2.7744099497795105e-06, 2.8870999813079834e-06, 2.9997900128364563e-06, 3.112480044364929e-06, 3.225170075893402e-06, 3.337860107421875e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 6.0, 6.0, 14.0, 13.0, 22.0, 16.0, 31.0, 18.0, 58.0, 23.0, 38.0, 69.0, 34.0, 73.0, 55.0, 90.0, 45.0, 46.0, 74.0, 31.0, 58.0, 29.0, 38.0, 15.0, 21.0, 11.0, 6.0, 14.0, 5.0, 15.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4177134037017822e-06, -2.332031726837158e-06, -2.246350049972534e-06, -2.16066837310791e-06, -2.074986696243286e-06, -1.989305019378662e-06, -1.903623342514038e-06, -1.817941665649414e-06, -1.73225998878479e-06, -1.646578311920166e-06, -1.560896635055542e-06, -1.475214958190918e-06, -1.389533281326294e-06, -1.30385160446167e-06, -1.218169927597046e-06, -1.1324882507324219e-06, -1.0468065738677979e-06, -9.611248970031738e-07, -8.754432201385498e-07, -7.897615432739258e-07, -7.040798664093018e-07, -6.183981895446777e-07, -5.327165126800537e-07, -4.470348358154297e-07, -3.6135315895080566e-07, -2.7567148208618164e-07, -1.8998980522155762e-07, -1.043081283569336e-07, -1.862645149230957e-08, 6.705522537231445e-08, 1.5273690223693848e-07, 2.384185791015625e-07, 3.241002559661865e-07, 4.0978193283081055e-07, 4.954636096954346e-07, 5.811452865600586e-07, 6.668269634246826e-07, 7.525086402893066e-07, 8.381903171539307e-07, 9.238719940185547e-07, 1.0095536708831787e-06, 1.0952353477478027e-06, 1.1809170246124268e-06, 1.2665987014770508e-06, 1.3522803783416748e-06, 1.4379620552062988e-06, 1.5236437320709229e-06, 1.6093254089355469e-06, 1.695007085800171e-06, 1.780688762664795e-06, 1.866370439529419e-06, 1.952052116394043e-06, 2.037733793258667e-06, 2.123415470123291e-06, 2.209097146987915e-06, 2.294778823852539e-06, 2.380460500717163e-06, 2.466142177581787e-06, 2.551823854446411e-06, 2.637505531311035e-06, 2.723187208175659e-06, 2.808868885040283e-06, 2.8945505619049072e-06, 2.9802322387695312e-06]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 11.0, 18.0, 22.0, 56.0, 81.0, 143.0, 228.0, 112.0, 73.0, 53.0, 41.0, 44.0, 21.0, 20.0, 13.0, 11.0, 12.0, 4.0, 3.0, 6.0, 8.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017380519420839846, -0.0001642717543290928, -0.00015473831444978714, -0.00014520487457048148, -0.00013567143469117582, -0.00012613799481187016, -0.0001166045549325645, -0.00010707111505325884, -9.753767517395318e-05, -8.800423529464751e-05, -7.847079541534185e-05, -6.89373555360362e-05, -5.940391565673053e-05, -4.987047577742487e-05, -4.033703589811921e-05, -3.080359601881355e-05, -2.127015613950789e-05, -1.1736716260202229e-05, -2.2032763808965683e-06, 7.3301634984090924e-06, 1.6863603377714753e-05, 2.6397043257020414e-05, 3.5930483136326075e-05, 4.5463923015631735e-05, 5.4997362894937396e-05, 6.453080277424306e-05, 7.406424265354872e-05, 8.359768253285438e-05, 9.313112241216004e-05, 0.0001026645622914657, 0.00011219800217077136, 0.00012173144205007702, 0.00013126488192938268, 0.00014079832180868834, 0.000150331761687994, 0.00015986520156729966, 0.00016939864144660532, 0.00017893208132591099, 0.00018846552120521665, 0.0001979989610845223, 0.00020753240096382797, 0.00021706584084313363, 0.0002265992807224393, 0.00023613272060174495, 0.0002456661604810506, 0.0002551996149122715, 0.00026473304023966193, 0.00027426646556705236, 0.00028379991999827325, 0.00029333337442949414, 0.0003028667997568846, 0.000312400225084275, 0.0003219336795154959, 0.0003314671339467168, 0.0003410005592741072, 0.00035053398460149765, 0.00036006743903271854, 0.00036960089346393943, 0.00037913431879132986, 0.0003886677441187203, 0.0003982011985499412, 0.00040773465298116207, 0.0004172680783085525, 0.00042680150363594294, 0.0004363349580671638]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 3.0, 10.0, 12.0, 9.0, 11.0, 19.0, 19.0, 29.0, 33.0, 33.0, 30.0, 37.0, 37.0, 42.0, 42.0, 47.0, 57.0, 38.0, 54.0, 50.0, 29.0, 37.0, 32.0, 39.0, 31.0, 33.0, 35.0, 24.0, 29.0, 22.0, 13.0, 15.0, 12.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000152587890625, -0.0001474730670452118, -0.00014235824346542358, -0.00013724341988563538, -0.00013212859630584717, -0.00012701377272605896, -0.00012189894914627075, -0.00011678412556648254, -0.00011166930198669434, -0.00010655447840690613, -0.00010143965482711792, -9.632483124732971e-05, -9.12100076675415e-05, -8.60951840877533e-05, -8.098036050796509e-05, -7.586553692817688e-05, -7.075071334838867e-05, -6.563588976860046e-05, -6.0521066188812256e-05, -5.540624260902405e-05, -5.029141902923584e-05, -4.517659544944763e-05, -4.0061771869659424e-05, -3.4946948289871216e-05, -2.9832124710083008e-05, -2.47173011302948e-05, -1.9602477550506592e-05, -1.4487653970718384e-05, -9.372830390930176e-06, -4.258006811141968e-06, 8.568167686462402e-07, 5.971640348434448e-06, 1.1086463928222656e-05, 1.6201287508010864e-05, 2.1316111087799072e-05, 2.643093466758728e-05, 3.154575824737549e-05, 3.6660581827163696e-05, 4.1775405406951904e-05, 4.689022898674011e-05, 5.200505256652832e-05, 5.711987614631653e-05, 6.223469972610474e-05, 6.734952330589294e-05, 7.246434688568115e-05, 7.757917046546936e-05, 8.269399404525757e-05, 8.780881762504578e-05, 9.292364120483398e-05, 9.803846478462219e-05, 0.0001031532883644104, 0.00010826811194419861, 0.00011338293552398682, 0.00011849775910377502, 0.00012361258268356323, 0.00012872740626335144, 0.00013384222984313965, 0.00013895705342292786, 0.00014407187700271606, 0.00014918670058250427, 0.00015430152416229248, 0.0001594163477420807, 0.0001645311713218689, 0.0001696459949016571, 0.0001747608184814453]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 15.0, 20.0, 28.0, 33.0, 53.0, 122.0, 174.0, 302.0, 542.0, 985.0, 1939.0, 3801.0, 8207.0, 19272.0, 55776.0, 1416309.0, 2591369.0, 55547.0, 20569.0, 8988.0, 4345.0, 2381.0, 1261.0, 712.0, 472.0, 304.0, 198.0, 134.0, 87.0, 60.0, 51.0, 40.0, 28.0, 28.0, 19.0, 28.0, 10.0, 7.0, 13.0, 10.0, 8.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00015664100646972656, -0.00014983117580413818, -0.0001430213451385498, -0.00013621151447296143, -0.00012940168380737305, -0.00012259185314178467, -0.00011578202247619629, -0.00010897219181060791, -0.00010216236114501953, -9.535253047943115e-05, -8.854269981384277e-05, -8.17328691482544e-05, -7.492303848266602e-05, -6.811320781707764e-05, -6.130337715148926e-05, -5.449354648590088e-05, -4.76837158203125e-05, -4.087388515472412e-05, -3.406405448913574e-05, -2.7254223823547363e-05, -2.0444393157958984e-05, -1.3634562492370605e-05, -6.8247318267822266e-06, -1.4901161193847656e-08, 6.794929504394531e-06, 1.360476016998291e-05, 2.041459083557129e-05, 2.7224421501159668e-05, 3.403425216674805e-05, 4.0844082832336426e-05, 4.7653913497924805e-05, 5.4463744163513184e-05, 6.127357482910156e-05, 6.808340549468994e-05, 7.489323616027832e-05, 8.17030668258667e-05, 8.851289749145508e-05, 9.532272815704346e-05, 0.00010213255882263184, 0.00010894238948822021, 0.0001157522201538086, 0.00012256205081939697, 0.00012937188148498535, 0.00013618171215057373, 0.0001429915428161621, 0.0001498013734817505, 0.00015661120414733887, 0.00016342103481292725, 0.00017023086547851562, 0.000177040696144104, 0.00018385052680969238, 0.00019066035747528076, 0.00019747018814086914, 0.00020428001880645752, 0.0002110898494720459, 0.00021789968013763428, 0.00022470951080322266, 0.00023151934146881104, 0.00023832917213439941, 0.0002451390027999878, 0.00025194883346557617, 0.00025875866413116455, 0.00026556849479675293, 0.0002723783254623413, 0.0002791881561279297]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 16.0, 16.0, 33.0, 43.0, 62.0, 91.0, 103.0, 132.0, 109.0, 106.0, 70.0, 57.0, 44.0, 28.0, 20.0, 18.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-05, -2.280157059431076e-05, -2.176128327846527e-05, -2.072099596261978e-05, -1.9680708646774292e-05, -1.8640421330928802e-05, -1.7600134015083313e-05, -1.6559846699237823e-05, -1.5519559383392334e-05, -1.4479272067546844e-05, -1.3438984751701355e-05, -1.2398697435855865e-05, -1.1358410120010376e-05, -1.0318122804164886e-05, -9.277835488319397e-06, -8.237548172473907e-06, -7.197260856628418e-06, -6.1569735407829285e-06, -5.116686224937439e-06, -4.0763989090919495e-06, -3.03611159324646e-06, -1.9958242774009705e-06, -9.55536961555481e-07, 8.475035429000854e-08, 1.125037670135498e-06, 2.1653249859809875e-06, 3.205612301826477e-06, 4.2458996176719666e-06, 5.286186933517456e-06, 6.3264742493629456e-06, 7.366761565208435e-06, 8.407048881053925e-06, 9.447336196899414e-06, 1.0487623512744904e-05, 1.1527910828590393e-05, 1.2568198144435883e-05, 1.3608485460281372e-05, 1.4648772776126862e-05, 1.568906009197235e-05, 1.672934740781784e-05, 1.776963472366333e-05, 1.880992203950882e-05, 1.985020935535431e-05, 2.08904966711998e-05, 2.1930783987045288e-05, 2.2971071302890778e-05, 2.4011358618736267e-05, 2.5051645934581757e-05, 2.6091933250427246e-05, 2.7132220566272736e-05, 2.8172507882118225e-05, 2.9212795197963715e-05, 3.0253082513809204e-05, 3.1293369829654694e-05, 3.233365714550018e-05, 3.337394446134567e-05, 3.441423177719116e-05, 3.545451909303665e-05, 3.649480640888214e-05, 3.753509372472763e-05, 3.857538104057312e-05, 3.961566835641861e-05, 4.06559556722641e-05, 4.169624298810959e-05, 4.273653030395508e-05]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 5.0, 9.0, 13.0, 21.0, 20.0, 40.0, 68.0, 119.0, 155.0, 296.0, 456.0, 734.0, 1220.0, 2205.0, 3867.0, 6810.0, 12858.0, 24702.0, 55728.0, 156270.0, 3286951.0, 472250.0, 91068.0, 38162.0, 18078.0, 9774.0, 5276.0, 2907.0, 1658.0, 975.0, 640.0, 368.0, 198.0, 130.0, 97.0, 54.0, 31.0, 21.0, 17.0, 13.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.982419967651367e-05, -8.699670433998108e-05, -8.416920900344849e-05, -8.13417136669159e-05, -7.85142183303833e-05, -7.568672299385071e-05, -7.285922765731812e-05, -7.003173232078552e-05, -6.720423698425293e-05, -6.437674164772034e-05, -6.154924631118774e-05, -5.872175097465515e-05, -5.589425563812256e-05, -5.3066760301589966e-05, -5.023926496505737e-05, -4.741176962852478e-05, -4.458427429199219e-05, -4.1756778955459595e-05, -3.8929283618927e-05, -3.610178828239441e-05, -3.3274292945861816e-05, -3.0446797609329224e-05, -2.761930227279663e-05, -2.4791806936264038e-05, -2.1964311599731445e-05, -1.9136816263198853e-05, -1.630932092666626e-05, -1.3481825590133667e-05, -1.0654330253601074e-05, -7.826834917068481e-06, -4.999339580535889e-06, -2.171844244003296e-06, 6.556510925292969e-07, 3.4831464290618896e-06, 6.310641765594482e-06, 9.138137102127075e-06, 1.1965632438659668e-05, 1.479312777519226e-05, 1.7620623111724854e-05, 2.0448118448257446e-05, 2.327561378479004e-05, 2.6103109121322632e-05, 2.8930604457855225e-05, 3.175809979438782e-05, 3.458559513092041e-05, 3.7413090467453e-05, 4.0240585803985596e-05, 4.306808114051819e-05, 4.589557647705078e-05, 4.8723071813583374e-05, 5.155056715011597e-05, 5.437806248664856e-05, 5.720555782318115e-05, 6.0033053159713745e-05, 6.286054849624634e-05, 6.568804383277893e-05, 6.851553916931152e-05, 7.134303450584412e-05, 7.417052984237671e-05, 7.69980251789093e-05, 7.98255205154419e-05, 8.265301585197449e-05, 8.548051118850708e-05, 8.830800652503967e-05, 9.113550186157227e-05]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 2.0, 8.0, 12.0, 7.0, 10.0, 10.0, 8.0, 13.0, 24.0, 23.0, 32.0, 50.0, 60.0, 75.0, 155.0, 490.0, 1997.0, 520.0, 154.0, 80.0, 69.0, 51.0, 30.0, 24.0, 29.0, 34.0, 24.0, 15.0, 12.0, 19.0, 9.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.137920379638672e-05, -4.974938929080963e-05, -4.8119574785232544e-05, -4.6489760279655457e-05, -4.485994577407837e-05, -4.323013126850128e-05, -4.1600316762924194e-05, -3.997050225734711e-05, -3.834068775177002e-05, -3.671087324619293e-05, -3.5081058740615845e-05, -3.345124423503876e-05, -3.182142972946167e-05, -3.0191615223884583e-05, -2.8561800718307495e-05, -2.6931986212730408e-05, -2.530217170715332e-05, -2.3672357201576233e-05, -2.2042542695999146e-05, -2.0412728190422058e-05, -1.878291368484497e-05, -1.7153099179267883e-05, -1.5523284673690796e-05, -1.3893470168113708e-05, -1.2263655662536621e-05, -1.0633841156959534e-05, -9.004026651382446e-06, -7.374212145805359e-06, -5.7443976402282715e-06, -4.114583134651184e-06, -2.4847686290740967e-06, -8.549541234970093e-07, 7.748603820800781e-07, 2.4046748876571655e-06, 4.034489393234253e-06, 5.66430389881134e-06, 7.294118404388428e-06, 8.923932909965515e-06, 1.0553747415542603e-05, 1.218356192111969e-05, 1.3813376426696777e-05, 1.5443190932273865e-05, 1.7073005437850952e-05, 1.870281994342804e-05, 2.0332634449005127e-05, 2.1962448954582214e-05, 2.3592263460159302e-05, 2.522207796573639e-05, 2.6851892471313477e-05, 2.8481706976890564e-05, 3.011152148246765e-05, 3.174133598804474e-05, 3.3371150493621826e-05, 3.5000964999198914e-05, 3.6630779504776e-05, 3.826059401035309e-05, 3.9890408515930176e-05, 4.152022302150726e-05, 4.315003752708435e-05, 4.477985203266144e-05, 4.6409666538238525e-05, 4.803948104381561e-05, 4.96692955493927e-05, 5.129911005496979e-05, 5.2928924560546875e-05]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 7.0, 11.0, 8.0, 16.0, 20.0, 31.0, 40.0, 56.0, 95.0, 136.0, 121.0, 107.0, 75.0, 56.0, 44.0, 32.0, 21.0, 26.0, 14.0, 17.0, 21.0, 7.0, 7.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019153833272866905, -0.00018240278586745262, -0.00017326725355815142, -0.000164131706696935, -0.0001549961743876338, -0.00014586062752641737, -0.00013672508066520095, -0.00012758953380398452, -0.00011845400149468333, -0.00010931846190942451, -0.0001001829223241657, -9.104737546294928e-05, -8.191183587769046e-05, -7.277629629243165e-05, -6.364074943121523e-05, -5.4505209845956415e-05, -4.53696702606976e-05, -3.623413067543879e-05, -2.7098587452201173e-05, -1.7963046047952957e-05, -8.827504643704742e-06, 3.080349415540695e-07, 9.443578164791688e-06, 1.8579121388029307e-05, 2.771466097328812e-05, 3.685020055854693e-05, 4.598574378178455e-05, 5.512128700502217e-05, 6.425682659028098e-05, 7.339236617553979e-05, 8.252791303675622e-05, 9.166345262201503e-05, 0.0001007990213111043, 0.00010993456089636311, 0.00011907010048162192, 0.00012820564734283835, 0.00013734117965213954, 0.00014647672651335597, 0.0001556122733745724, 0.00016474782023578882, 0.00017388335254509002, 0.00018301889940630645, 0.00019215443171560764, 0.00020128997857682407, 0.0002104255254380405, 0.0002195610577473417, 0.00022869660460855812, 0.00023783213691785932, 0.00024696768377907574, 0.00025610323064029217, 0.0002652387775015086, 0.00027437429525889456, 0.000283509842120111, 0.0002926453889813274, 0.00030178093584254384, 0.00031091648270376027, 0.0003200520295649767, 0.0003291875764261931, 0.00033832312328740954, 0.0003474586410447955, 0.00035659418790601194, 0.00036572973476722836, 0.0003748652816284448, 0.0003840008284896612, 0.0003931363462470472]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 8.0, 2.0, 7.0, 11.0, 13.0, 16.0, 19.0, 22.0, 18.0, 12.0, 25.0, 21.0, 27.0, 36.0, 33.0, 38.0, 37.0, 42.0, 37.0, 43.0, 47.0, 31.0, 32.0, 34.0, 43.0, 52.0, 39.0, 34.0, 37.0, 22.0, 23.0, 23.0, 17.0, 7.0, 19.0, 18.0, 11.0, 9.0, 5.0, 6.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013959407806396484, -0.00013489089906215668, -0.0001301877200603485, -0.00012548454105854034, -0.00012078136205673218, -0.00011607818305492401, -0.00011137500405311584, -0.00010667182505130768, -0.00010196864604949951, -9.726546704769135e-05, -9.256228804588318e-05, -8.785910904407501e-05, -8.315593004226685e-05, -7.845275104045868e-05, -7.374957203865051e-05, -6.904639303684235e-05, -6.434321403503418e-05, -5.964003503322601e-05, -5.493685603141785e-05, -5.023367702960968e-05, -4.5530498027801514e-05, -4.082731902599335e-05, -3.612414002418518e-05, -3.1420961022377014e-05, -2.6717782020568848e-05, -2.201460301876068e-05, -1.7311424016952515e-05, -1.2608245015144348e-05, -7.905066013336182e-06, -3.201887011528015e-06, 1.5012919902801514e-06, 6.204470992088318e-06, 1.0907649993896484e-05, 1.561082899570465e-05, 2.0314007997512817e-05, 2.5017186999320984e-05, 2.972036600112915e-05, 3.442354500293732e-05, 3.9126724004745483e-05, 4.382990300655365e-05, 4.8533082008361816e-05, 5.323626101016998e-05, 5.793944001197815e-05, 6.264261901378632e-05, 6.734579801559448e-05, 7.204897701740265e-05, 7.675215601921082e-05, 8.145533502101898e-05, 8.615851402282715e-05, 9.086169302463531e-05, 9.556487202644348e-05, 0.00010026805102825165, 0.00010497123003005981, 0.00010967440903186798, 0.00011437758803367615, 0.00011908076703548431, 0.00012378394603729248, 0.00012848712503910065, 0.0001331903040409088, 0.00013789348304271698, 0.00014259666204452515, 0.0001472998410463333, 0.00015200302004814148, 0.00015670619904994965, 0.0001614093780517578]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 13.0, 9.0, 7.0, 8.0, 7.0, 17.0, 18.0, 18.0, 26.0, 35.0, 42.0, 81.0, 187.0, 324.0, 641.0, 1293.0, 2888.0, 7083.0, 21330.0, 91688.0, 690384.0, 181087.0, 33694.0, 10212.0, 4062.0, 1617.0, 812.0, 377.0, 229.0, 125.0, 71.0, 46.0, 28.0, 22.0, 10.0, 12.0, 10.0, 6.0, 12.0, 8.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002371072769165039, -0.0002288389950990677, -0.00022057071328163147, -0.00021230243146419525, -0.00020403414964675903, -0.00019576586782932281, -0.0001874975860118866, -0.00017922930419445038, -0.00017096102237701416, -0.00016269274055957794, -0.00015442445874214172, -0.0001461561769247055, -0.0001378878951072693, -0.00012961961328983307, -0.00012135133147239685, -0.00011308304965496063, -0.00010481476783752441, -9.65464860200882e-05, -8.827820420265198e-05, -8.000992238521576e-05, -7.174164056777954e-05, -6.347335875034332e-05, -5.5205076932907104e-05, -4.6936795115470886e-05, -3.866851329803467e-05, -3.040023148059845e-05, -2.213194966316223e-05, -1.3863667845726013e-05, -5.595386028289795e-06, 2.6728957891464233e-06, 1.0941177606582642e-05, 1.920945942401886e-05, 2.7477741241455078e-05, 3.5746023058891296e-05, 4.4014304876327515e-05, 5.228258669376373e-05, 6.055086851119995e-05, 6.881915032863617e-05, 7.708743214607239e-05, 8.53557139635086e-05, 9.362399578094482e-05, 0.00010189227759838104, 0.00011016055941581726, 0.00011842884123325348, 0.0001266971230506897, 0.00013496540486812592, 0.00014323368668556213, 0.00015150196850299835, 0.00015977025032043457, 0.0001680385321378708, 0.000176306813955307, 0.00018457509577274323, 0.00019284337759017944, 0.00020111165940761566, 0.00020937994122505188, 0.0002176482230424881, 0.00022591650485992432, 0.00023418478667736053, 0.00024245306849479675, 0.00025072135031223297, 0.0002589896321296692, 0.0002672579139471054, 0.0002755261957645416, 0.00028379447758197784, 0.00029206275939941406]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 8.0, 15.0, 10.0, 11.0, 25.0, 34.0, 68.0, 83.0, 116.0, 132.0, 125.0, 102.0, 93.0, 56.0, 35.0, 29.0, 19.0, 14.0, 5.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.187490463256836e-05, -2.072565257549286e-05, -1.957640051841736e-05, -1.8427148461341858e-05, -1.7277896404266357e-05, -1.6128644347190857e-05, -1.4979392290115356e-05, -1.3830140233039856e-05, -1.2680888175964355e-05, -1.1531636118888855e-05, -1.0382384061813354e-05, -9.233132004737854e-06, -8.083879947662354e-06, -6.934627890586853e-06, -5.7853758335113525e-06, -4.636123776435852e-06, -3.4868717193603516e-06, -2.337619662284851e-06, -1.1883676052093506e-06, -3.91155481338501e-08, 1.1101365089416504e-06, 2.259388566017151e-06, 3.4086406230926514e-06, 4.557892680168152e-06, 5.707144737243652e-06, 6.856396794319153e-06, 8.005648851394653e-06, 9.154900908470154e-06, 1.0304152965545654e-05, 1.1453405022621155e-05, 1.2602657079696655e-05, 1.3751909136772156e-05, 1.4901161193847656e-05, 1.6050413250923157e-05, 1.7199665307998657e-05, 1.8348917365074158e-05, 1.9498169422149658e-05, 2.064742147922516e-05, 2.179667353630066e-05, 2.294592559337616e-05, 2.409517765045166e-05, 2.524442970752716e-05, 2.639368176460266e-05, 2.754293382167816e-05, 2.8692185878753662e-05, 2.9841437935829163e-05, 3.099068999290466e-05, 3.2139942049980164e-05, 3.3289194107055664e-05, 3.4438446164131165e-05, 3.5587698221206665e-05, 3.6736950278282166e-05, 3.7886202335357666e-05, 3.9035454392433167e-05, 4.018470644950867e-05, 4.133395850658417e-05, 4.248321056365967e-05, 4.363246262073517e-05, 4.478171467781067e-05, 4.593096673488617e-05, 4.708021879196167e-05, 4.822947084903717e-05, 4.937872290611267e-05, 5.052797496318817e-05, 5.167722702026367e-05]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 3.0, 19.0, 16.0, 17.0, 41.0, 56.0, 119.0, 146.0, 297.0, 443.0, 788.0, 1186.0, 2234.0, 3569.0, 6431.0, 10477.0, 18760.0, 32170.0, 58390.0, 118185.0, 348259.0, 236384.0, 93745.0, 50892.0, 27499.0, 16234.0, 8948.0, 5510.0, 3108.0, 1862.0, 1123.0, 626.0, 367.0, 255.0, 128.0, 105.0, 69.0, 40.0, 16.0, 18.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.158517837524414e-05, -6.9471076130867e-05, -6.735697388648987e-05, -6.524287164211273e-05, -6.31287693977356e-05, -6.101466715335846e-05, -5.890056490898132e-05, -5.678646266460419e-05, -5.467236042022705e-05, -5.2558258175849915e-05, -5.044415593147278e-05, -4.833005368709564e-05, -4.6215951442718506e-05, -4.410184919834137e-05, -4.1987746953964233e-05, -3.98736447095871e-05, -3.775954246520996e-05, -3.5645440220832825e-05, -3.353133797645569e-05, -3.141723573207855e-05, -2.9303133487701416e-05, -2.718903124332428e-05, -2.5074928998947144e-05, -2.2960826754570007e-05, -2.084672451019287e-05, -1.8732622265815735e-05, -1.66185200214386e-05, -1.4504417777061462e-05, -1.2390315532684326e-05, -1.027621328830719e-05, -8.162111043930054e-06, -6.0480087995529175e-06, -3.933906555175781e-06, -1.819804310798645e-06, 2.942979335784912e-07, 2.4084001779556274e-06, 4.522502422332764e-06, 6.6366046667099e-06, 8.750706911087036e-06, 1.0864809155464172e-05, 1.2978911399841309e-05, 1.5093013644218445e-05, 1.720711588859558e-05, 1.9321218132972717e-05, 2.1435320377349854e-05, 2.354942262172699e-05, 2.5663524866104126e-05, 2.7777627110481262e-05, 2.98917293548584e-05, 3.2005831599235535e-05, 3.411993384361267e-05, 3.623403608798981e-05, 3.834813833236694e-05, 4.046224057674408e-05, 4.2576342821121216e-05, 4.469044506549835e-05, 4.680454730987549e-05, 4.8918649554252625e-05, 5.103275179862976e-05, 5.31468540430069e-05, 5.526095628738403e-05, 5.737505853176117e-05, 5.9489160776138306e-05, 6.160326302051544e-05, 6.371736526489258e-05]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 8.0, 4.0, 8.0, 16.0, 8.0, 13.0, 14.0, 23.0, 17.0, 27.0, 32.0, 21.0, 34.0, 31.0, 33.0, 42.0, 44.0, 40.0, 45.0, 45.0, 44.0, 44.0, 38.0, 38.0, 42.0, 43.0, 39.0, 21.0, 40.0, 26.0, 28.0, 19.0, 14.0, 13.0, 15.0, 6.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 5.0], "bins": [-5.924701690673828e-05, -5.771126598119736e-05, -5.617551505565643e-05, -5.463976413011551e-05, -5.3104013204574585e-05, -5.156826227903366e-05, -5.003251135349274e-05, -4.849676042795181e-05, -4.696100950241089e-05, -4.5425258576869965e-05, -4.388950765132904e-05, -4.2353756725788116e-05, -4.081800580024719e-05, -3.928225487470627e-05, -3.7746503949165344e-05, -3.621075302362442e-05, -3.4675002098083496e-05, -3.313925117254257e-05, -3.160350024700165e-05, -3.0067749321460724e-05, -2.85319983959198e-05, -2.6996247470378876e-05, -2.546049654483795e-05, -2.3924745619297028e-05, -2.2388994693756104e-05, -2.085324376821518e-05, -1.9317492842674255e-05, -1.778174191713333e-05, -1.6245990991592407e-05, -1.4710240066051483e-05, -1.3174489140510559e-05, -1.1638738214969635e-05, -1.0102987289428711e-05, -8.567236363887787e-06, -7.031485438346863e-06, -5.495734512805939e-06, -3.959983587265015e-06, -2.4242326617240906e-06, -8.884817361831665e-07, 6.472691893577576e-07, 2.1830201148986816e-06, 3.7187710404396057e-06, 5.25452196598053e-06, 6.790272891521454e-06, 8.326023817062378e-06, 9.861774742603302e-06, 1.1397525668144226e-05, 1.293327659368515e-05, 1.4469027519226074e-05, 1.6004778444766998e-05, 1.7540529370307922e-05, 1.9076280295848846e-05, 2.061203122138977e-05, 2.2147782146930695e-05, 2.368353307247162e-05, 2.5219283998012543e-05, 2.6755034923553467e-05, 2.829078584909439e-05, 2.9826536774635315e-05, 3.136228770017624e-05, 3.289803862571716e-05, 3.443378955125809e-05, 3.596954047679901e-05, 3.7505291402339935e-05, 3.904104232788086e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 9.0, 23.0, 15.0, 25.0, 50.0, 55.0, 84.0, 114.0, 247.0, 282.0, 406.0, 903.0, 1104.0, 1874.0, 4766.0, 7151.0, 13117.0, 43051.0, 90253.0, 273382.0, 448323.0, 89674.0, 36356.0, 16818.0, 10358.0, 3792.0, 2334.0, 1715.0, 735.0, 465.0, 388.0, 200.0, 131.0, 129.0, 69.0, 42.0, 39.0, 14.0, 12.0, 8.0, 11.0, 6.0, 7.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.543231964111328e-06, -5.345791578292847e-06, -5.148351192474365e-06, -4.950910806655884e-06, -4.753470420837402e-06, -4.556030035018921e-06, -4.3585896492004395e-06, -4.161149263381958e-06, -3.9637088775634766e-06, -3.766268491744995e-06, -3.5688281059265137e-06, -3.3713877201080322e-06, -3.1739473342895508e-06, -2.9765069484710693e-06, -2.779066562652588e-06, -2.5816261768341064e-06, -2.384185791015625e-06, -2.1867454051971436e-06, -1.989305019378662e-06, -1.7918646335601807e-06, -1.5944242477416992e-06, -1.3969838619232178e-06, -1.1995434761047363e-06, -1.0021030902862549e-06, -8.046627044677734e-07, -6.07222318649292e-07, -4.0978193283081055e-07, -2.123415470123291e-07, -1.4901161193847656e-08, 1.825392246246338e-07, 3.7997961044311523e-07, 5.774199962615967e-07, 7.748603820800781e-07, 9.723007678985596e-07, 1.169741153717041e-06, 1.3671815395355225e-06, 1.564621925354004e-06, 1.7620623111724854e-06, 1.959502696990967e-06, 2.1569430828094482e-06, 2.3543834686279297e-06, 2.551823854446411e-06, 2.7492642402648926e-06, 2.946704626083374e-06, 3.1441450119018555e-06, 3.341585397720337e-06, 3.5390257835388184e-06, 3.7364661693573e-06, 3.933906555175781e-06, 4.131346940994263e-06, 4.328787326812744e-06, 4.526227712631226e-06, 4.723668098449707e-06, 4.9211084842681885e-06, 5.11854887008667e-06, 5.315989255905151e-06, 5.513429641723633e-06, 5.710870027542114e-06, 5.908310413360596e-06, 6.105750799179077e-06, 6.303191184997559e-06, 6.50063157081604e-06, 6.6980719566345215e-06, 6.895512342453003e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 6.0, 9.0, 12.0, 19.0, 22.0, 21.0, 56.0, 26.0, 30.0, 36.0, 63.0, 49.0, 44.0, 55.0, 105.0, 46.0, 49.0, 41.0, 37.0, 30.0, 36.0, 33.0, 45.0, 20.0, 20.0, 14.0, 12.0, 4.0, 7.0, 10.0, 11.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.6151537895202637e-06, -2.5480985641479492e-06, -2.4810433387756348e-06, -2.4139881134033203e-06, -2.346932888031006e-06, -2.2798776626586914e-06, -2.212822437286377e-06, -2.1457672119140625e-06, -2.078711986541748e-06, -2.0116567611694336e-06, -1.944601535797119e-06, -1.8775463104248047e-06, -1.8104910850524902e-06, -1.7434358596801758e-06, -1.6763806343078613e-06, -1.6093254089355469e-06, -1.5422701835632324e-06, -1.475214958190918e-06, -1.4081597328186035e-06, -1.341104507446289e-06, -1.2740492820739746e-06, -1.2069940567016602e-06, -1.1399388313293457e-06, -1.0728836059570312e-06, -1.0058283805847168e-06, -9.387731552124023e-07, -8.717179298400879e-07, -8.046627044677734e-07, -7.37607479095459e-07, -6.705522537231445e-07, -6.034970283508301e-07, -5.364418029785156e-07, -4.6938657760620117e-07, -4.023313522338867e-07, -3.3527612686157227e-07, -2.682209014892578e-07, -2.0116567611694336e-07, -1.341104507446289e-07, -6.705522537231445e-08, 0.0, 6.705522537231445e-08, 1.341104507446289e-07, 2.0116567611694336e-07, 2.682209014892578e-07, 3.3527612686157227e-07, 4.023313522338867e-07, 4.6938657760620117e-07, 5.364418029785156e-07, 6.034970283508301e-07, 6.705522537231445e-07, 7.37607479095459e-07, 8.046627044677734e-07, 8.717179298400879e-07, 9.387731552124023e-07, 1.0058283805847168e-06, 1.0728836059570312e-06, 1.1399388313293457e-06, 1.2069940567016602e-06, 1.2740492820739746e-06, 1.341104507446289e-06, 1.4081597328186035e-06, 1.475214958190918e-06, 1.5422701835632324e-06, 1.6093254089355469e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 26.0, 12.0, 35.0, 37.0, 73.0, 91.0, 89.0, 267.0, 174.0, 468.0, 363.0, 1060.0, 1762.0, 1225.0, 3626.0, 2716.0, 8289.0, 14502.0, 11259.0, 37509.0, 32276.0, 133372.0, 153988.0, 396071.0, 133544.0, 32263.0, 37496.0, 11330.0, 14481.0, 4642.0, 6204.0, 3615.0, 1240.0, 1693.0, 570.0, 823.0, 492.0, 190.0, 258.0, 84.0, 120.0, 36.0, 64.0, 41.0, 13.0, 25.0, 8.0, 11.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.9206275939941406e-06, -2.8265640139579773e-06, -2.732500433921814e-06, -2.6384368538856506e-06, -2.5443732738494873e-06, -2.450309693813324e-06, -2.3562461137771606e-06, -2.2621825337409973e-06, -2.168118953704834e-06, -2.0740553736686707e-06, -1.9799917936325073e-06, -1.885928213596344e-06, -1.7918646335601807e-06, -1.6978010535240173e-06, -1.603737473487854e-06, -1.5096738934516907e-06, -1.4156103134155273e-06, -1.321546733379364e-06, -1.2274831533432007e-06, -1.1334195733070374e-06, -1.039355993270874e-06, -9.452924132347107e-07, -8.512288331985474e-07, -7.57165253162384e-07, -6.631016731262207e-07, -5.690380930900574e-07, -4.7497451305389404e-07, -3.809109330177307e-07, -2.868473529815674e-07, -1.9278377294540405e-07, -9.872019290924072e-08, -4.6566128730773926e-09, 8.940696716308594e-08, 1.8347054719924927e-07, 2.775341272354126e-07, 3.7159770727157593e-07, 4.6566128730773926e-07, 5.597248673439026e-07, 6.537884473800659e-07, 7.478520274162292e-07, 8.419156074523926e-07, 9.359791874885559e-07, 1.0300427675247192e-06, 1.1241063475608826e-06, 1.218169927597046e-06, 1.3122335076332092e-06, 1.4062970876693726e-06, 1.5003606677055359e-06, 1.5944242477416992e-06, 1.6884878277778625e-06, 1.7825514078140259e-06, 1.8766149878501892e-06, 1.9706785678863525e-06, 2.064742147922516e-06, 2.158805727958679e-06, 2.2528693079948425e-06, 2.346932888031006e-06, 2.440996468067169e-06, 2.5350600481033325e-06, 2.629123628139496e-06, 2.723187208175659e-06, 2.8172507882118225e-06, 2.911314368247986e-06, 3.005377948284149e-06, 3.0994415283203125e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 10.0, 10.0, 6.0, 8.0, 9.0, 19.0, 10.0, 17.0, 9.0, 16.0, 41.0, 24.0, 29.0, 22.0, 28.0, 76.0, 36.0, 43.0, 35.0, 47.0, 97.0, 45.0, 45.0, 40.0, 34.0, 54.0, 21.0, 13.0, 18.0, 14.0, 32.0, 7.0, 12.0, 15.0, 8.0, 11.0, 5.0, 3.0, 6.0, 1.0, 6.0, 3.0, 7.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0265579223632812e-06, -1.9548460841178894e-06, -1.8831342458724976e-06, -1.8114224076271057e-06, -1.7397105693817139e-06, -1.667998731136322e-06, -1.5962868928909302e-06, -1.5245750546455383e-06, -1.4528632164001465e-06, -1.3811513781547546e-06, -1.3094395399093628e-06, -1.237727701663971e-06, -1.166015863418579e-06, -1.0943040251731873e-06, -1.0225921869277954e-06, -9.508803486824036e-07, -8.791685104370117e-07, -8.074566721916199e-07, -7.35744833946228e-07, -6.640329957008362e-07, -5.923211574554443e-07, -5.206093192100525e-07, -4.4889748096466064e-07, -3.771856427192688e-07, -3.0547380447387695e-07, -2.337619662284851e-07, -1.6205012798309326e-07, -9.033828973770142e-08, -1.862645149230957e-08, 5.3085386753082275e-08, 1.2479722499847412e-07, 1.9650906324386597e-07, 2.682209014892578e-07, 3.3993273973464966e-07, 4.116445779800415e-07, 4.833564162254333e-07, 5.550682544708252e-07, 6.26780092716217e-07, 6.984919309616089e-07, 7.702037692070007e-07, 8.419156074523926e-07, 9.136274456977844e-07, 9.853392839431763e-07, 1.0570511221885681e-06, 1.12876296043396e-06, 1.2004747986793518e-06, 1.2721866369247437e-06, 1.3438984751701355e-06, 1.4156103134155273e-06, 1.4873221516609192e-06, 1.559033989906311e-06, 1.6307458281517029e-06, 1.7024576663970947e-06, 1.7741695046424866e-06, 1.8458813428878784e-06, 1.9175931811332703e-06, 1.989305019378662e-06, 2.061016857624054e-06, 2.132728695869446e-06, 2.2044405341148376e-06, 2.2761523723602295e-06, 2.3478642106056213e-06, 2.419576048851013e-06, 2.491287887096405e-06, 2.562999725341797e-06]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 8.0, 18.0, 9.0, 18.0, 13.0, 29.0, 43.0, 67.0, 87.0, 171.0, 164.0, 93.0, 62.0, 48.0, 26.0, 20.0, 22.0, 15.0, 13.0, 13.0, 5.0, 9.0, 7.0, 7.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001502146915299818, -0.0001433406723663211, -0.00013646665320266038, -0.00012959263403899968, -0.00012271861487533897, -0.00011584459571167827, -0.00010897056927205995, -0.00010209655010839924, -9.522253094473854e-05, -8.834851178107783e-05, -8.147449261741713e-05, -7.460046617779881e-05, -6.77264470141381e-05, -6.0852431488456205e-05, -5.397840868681669e-05, -4.710438952315599e-05, -4.023037035949528e-05, -3.335635119583458e-05, -2.648233021318447e-05, -1.960830923053436e-05, -1.2734290066873655e-05, -5.86027090321295e-06, 1.0137518984265625e-06, 7.887771062087268e-06, 1.4761790225747973e-05, 2.1635809389408678e-05, 2.8509830372058786e-05, 3.5383851354708895e-05, 4.22578705183696e-05, 4.9131889682030305e-05, 5.600591248366982e-05, 6.287993164733052e-05, 6.975396536290646e-05, 7.662798452656716e-05, 8.350200369022787e-05, 9.037602285388857e-05, 9.725004201754928e-05, 0.00010412406118120998, 0.0001109980876208283, 0.000117872106784489, 0.0001247461186721921, 0.0001316201378358528, 0.0001384941569995135, 0.0001453681761631742, 0.00015224219532683492, 0.00015911621449049562, 0.00016599023365415633, 0.00017286426736973226, 0.00017973828653339297, 0.00018661230569705367, 0.00019348632486071438, 0.00020036034402437508, 0.00020723436318803579, 0.0002141083823516965, 0.00022098241606727242, 0.0002278564206790179, 0.00023473045439459383, 0.00024160447355825454, 0.00024847849272191525, 0.0002553525264374912, 0.00026222653104923666, 0.0002691005647648126, 0.00027597456937655807, 0.000282848603092134, 0.0002897226077038795]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 8.0, 7.0, 7.0, 3.0, 9.0, 17.0, 24.0, 27.0, 24.0, 42.0, 35.0, 35.0, 27.0, 30.0, 45.0, 41.0, 41.0, 43.0, 48.0, 45.0, 40.0, 42.0, 37.0, 32.0, 39.0, 33.0, 31.0, 21.0, 28.0, 14.0, 27.0, 15.0, 7.0, 17.0, 8.0, 4.0, 6.0, 8.0, 4.0, 2.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00012201070785522461, -0.00011801440268754959, -0.00011401809751987457, -0.00011002179235219955, -0.00010602548718452454, -0.00010202918201684952, -9.80328768491745e-05, -9.403657168149948e-05, -9.004026651382446e-05, -8.604396134614944e-05, -8.204765617847443e-05, -7.805135101079941e-05, -7.405504584312439e-05, -7.005874067544937e-05, -6.606243550777435e-05, -6.206613034009933e-05, -5.8069825172424316e-05, -5.40735200047493e-05, -5.007721483707428e-05, -4.608090966939926e-05, -4.208460450172424e-05, -3.8088299334049225e-05, -3.4091994166374207e-05, -3.0095688998699188e-05, -2.609938383102417e-05, -2.210307866334915e-05, -1.8106773495674133e-05, -1.4110468327999115e-05, -1.0114163160324097e-05, -6.117857992649078e-06, -2.12155282497406e-06, 1.8747523427009583e-06, 5.8710575103759766e-06, 9.867362678050995e-06, 1.3863667845726013e-05, 1.785997301340103e-05, 2.185627818107605e-05, 2.5852583348751068e-05, 2.9848888516426086e-05, 3.3845193684101105e-05, 3.784149885177612e-05, 4.183780401945114e-05, 4.583410918712616e-05, 4.983041435480118e-05, 5.3826719522476196e-05, 5.7823024690151215e-05, 6.181932985782623e-05, 6.581563502550125e-05, 6.981194019317627e-05, 7.380824536085129e-05, 7.78045505285263e-05, 8.180085569620132e-05, 8.579716086387634e-05, 8.979346603155136e-05, 9.378977119922638e-05, 9.77860763669014e-05, 0.00010178238153457642, 0.00010577868670225143, 0.00010977499186992645, 0.00011377129703760147, 0.00011776760220527649, 0.00012176390737295151, 0.00012576021254062653, 0.00012975651770830154, 0.00013375282287597656]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 14.0, 28.0, 46.0, 80.0, 154.0, 228.0, 393.0, 670.0, 1136.0, 1901.0, 3452.0, 7376.0, 17023.0, 44110.0, 218719.0, 3792744.0, 59652.0, 22776.0, 10689.0, 5420.0, 2940.0, 1692.0, 971.0, 607.0, 378.0, 259.0, 156.0, 147.0, 80.0, 68.0, 52.0, 55.0, 38.0, 26.0, 22.0, 24.0, 24.0, 20.0, 25.0, 21.0, 15.0, 5.0, 6.0, 8.0, 4.0, 10.0, 3.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00011777877807617188, -0.00011130422353744507, -0.00010482966899871826, -9.835511445999146e-05, -9.188055992126465e-05, -8.540600538253784e-05, -7.893145084381104e-05, -7.245689630508423e-05, -6.598234176635742e-05, -5.9507787227630615e-05, -5.303323268890381e-05, -4.6558678150177e-05, -4.0084123611450195e-05, -3.360956907272339e-05, -2.7135014533996582e-05, -2.0660459995269775e-05, -1.4185905456542969e-05, -7.711350917816162e-06, -1.2367963790893555e-06, 5.237758159637451e-06, 1.1712312698364258e-05, 1.8186867237091064e-05, 2.466142177581787e-05, 3.113597631454468e-05, 3.7610530853271484e-05, 4.408508539199829e-05, 5.05596399307251e-05, 5.7034194469451904e-05, 6.350874900817871e-05, 6.998330354690552e-05, 7.645785808563232e-05, 8.293241262435913e-05, 8.940696716308594e-05, 9.588152170181274e-05, 0.00010235607624053955, 0.00010883063077926636, 0.00011530518531799316, 0.00012177973985671997, 0.00012825429439544678, 0.00013472884893417358, 0.0001412034034729004, 0.0001476779580116272, 0.000154152512550354, 0.0001606270670890808, 0.00016710162162780762, 0.00017357617616653442, 0.00018005073070526123, 0.00018652528524398804, 0.00019299983978271484, 0.00019947439432144165, 0.00020594894886016846, 0.00021242350339889526, 0.00021889805793762207, 0.00022537261247634888, 0.00023184716701507568, 0.0002383217215538025, 0.0002447962760925293, 0.0002512708306312561, 0.0002577453851699829, 0.0002642199397087097, 0.0002706944942474365, 0.00027716904878616333, 0.00028364360332489014, 0.00029011815786361694, 0.00029659271240234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 10.0, 11.0, 12.0, 19.0, 46.0, 53.0, 80.0, 95.0, 129.0, 106.0, 111.0, 93.0, 61.0, 43.0, 36.0, 25.0, 18.0, 18.0, 11.0, 9.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.7873942852020264e-05, -1.679360866546631e-05, -1.5713274478912354e-05, -1.4632940292358398e-05, -1.3552606105804443e-05, -1.2472271919250488e-05, -1.1391937732696533e-05, -1.0311603546142578e-05, -9.231269359588623e-06, -8.150935173034668e-06, -7.070600986480713e-06, -5.990266799926758e-06, -4.909932613372803e-06, -3.829598426818848e-06, -2.7492642402648926e-06, -1.6689300537109375e-06, -5.885958671569824e-07, 4.917383193969727e-07, 1.5720725059509277e-06, 2.652406692504883e-06, 3.732740879058838e-06, 4.813075065612793e-06, 5.893409252166748e-06, 6.973743438720703e-06, 8.054077625274658e-06, 9.134411811828613e-06, 1.0214745998382568e-05, 1.1295080184936523e-05, 1.2375414371490479e-05, 1.3455748558044434e-05, 1.4536082744598389e-05, 1.5616416931152344e-05, 1.66967511177063e-05, 1.7777085304260254e-05, 1.885741949081421e-05, 1.9937753677368164e-05, 2.101808786392212e-05, 2.2098422050476074e-05, 2.317875623703003e-05, 2.4259090423583984e-05, 2.533942461013794e-05, 2.6419758796691895e-05, 2.750009298324585e-05, 2.8580427169799805e-05, 2.966076135635376e-05, 3.0741095542907715e-05, 3.182142972946167e-05, 3.2901763916015625e-05, 3.398209810256958e-05, 3.5062432289123535e-05, 3.614276647567749e-05, 3.7223100662231445e-05, 3.83034348487854e-05, 3.9383769035339355e-05, 4.046410322189331e-05, 4.1544437408447266e-05, 4.262477159500122e-05, 4.3705105781555176e-05, 4.478543996810913e-05, 4.5865774154663086e-05, 4.694610834121704e-05, 4.8026442527770996e-05, 4.910677671432495e-05, 5.0187110900878906e-05]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 15.0, 11.0, 19.0, 23.0, 46.0, 55.0, 83.0, 96.0, 144.0, 184.0, 304.0, 496.0, 690.0, 1050.0, 1700.0, 2917.0, 4851.0, 8644.0, 16094.0, 31866.0, 74232.0, 327978.0, 3482912.0, 137180.0, 49218.0, 23522.0, 12468.0, 7019.0, 3957.0, 2335.0, 1461.0, 932.0, 606.0, 362.0, 240.0, 186.0, 114.0, 98.0, 59.0, 34.0, 20.0, 25.0, 15.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010067224502563477, -9.773485362529755e-05, -9.479746222496033e-05, -9.186007082462311e-05, -8.892267942428589e-05, -8.598528802394867e-05, -8.304789662361145e-05, -8.011050522327423e-05, -7.717311382293701e-05, -7.423572242259979e-05, -7.129833102226257e-05, -6.836093962192535e-05, -6.542354822158813e-05, -6.248615682125092e-05, -5.9548765420913696e-05, -5.661137402057648e-05, -5.367398262023926e-05, -5.073659121990204e-05, -4.779919981956482e-05, -4.48618084192276e-05, -4.192441701889038e-05, -3.898702561855316e-05, -3.604963421821594e-05, -3.311224281787872e-05, -3.0174851417541504e-05, -2.7237460017204285e-05, -2.4300068616867065e-05, -2.1362677216529846e-05, -1.8425285816192627e-05, -1.5487894415855408e-05, -1.2550503015518188e-05, -9.61311161518097e-06, -6.67572021484375e-06, -3.7383288145065308e-06, -8.009374141693115e-07, 2.1364539861679077e-06, 5.073845386505127e-06, 8.011236786842346e-06, 1.0948628187179565e-05, 1.3886019587516785e-05, 1.6823410987854004e-05, 1.9760802388191223e-05, 2.2698193788528442e-05, 2.563558518886566e-05, 2.857297658920288e-05, 3.15103679895401e-05, 3.444775938987732e-05, 3.738515079021454e-05, 4.032254219055176e-05, 4.325993359088898e-05, 4.6197324991226196e-05, 4.9134716391563416e-05, 5.2072107791900635e-05, 5.5009499192237854e-05, 5.794689059257507e-05, 6.088428199291229e-05, 6.382167339324951e-05, 6.675906479358673e-05, 6.969645619392395e-05, 7.263384759426117e-05, 7.557123899459839e-05, 7.850863039493561e-05, 8.144602179527283e-05, 8.438341319561005e-05, 8.732080459594727e-05]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 5.0, 12.0, 13.0, 14.0, 11.0, 23.0, 23.0, 35.0, 51.0, 74.0, 132.0, 441.0, 2349.0, 413.0, 114.0, 66.0, 37.0, 38.0, 31.0, 23.0, 21.0, 39.0, 19.0, 16.0, 11.0, 13.0, 14.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.1081180572509766e-05, -4.9350783228874207e-05, -4.762038588523865e-05, -4.588998854160309e-05, -4.415959119796753e-05, -4.242919385433197e-05, -4.069879651069641e-05, -3.896839916706085e-05, -3.723800182342529e-05, -3.5507604479789734e-05, -3.3777207136154175e-05, -3.2046809792518616e-05, -3.0316412448883057e-05, -2.8586015105247498e-05, -2.685561776161194e-05, -2.512522041797638e-05, -2.339482307434082e-05, -2.166442573070526e-05, -1.9934028387069702e-05, -1.8203631043434143e-05, -1.6473233699798584e-05, -1.4742836356163025e-05, -1.3012439012527466e-05, -1.1282041668891907e-05, -9.551644325256348e-06, -7.821246981620789e-06, -6.0908496379852295e-06, -4.36045229434967e-06, -2.6300549507141113e-06, -8.996576070785522e-07, 8.307397365570068e-07, 2.561137080192566e-06, 4.291534423828125e-06, 6.021931767463684e-06, 7.752329111099243e-06, 9.482726454734802e-06, 1.1213123798370361e-05, 1.294352114200592e-05, 1.467391848564148e-05, 1.640431582927704e-05, 1.8134713172912598e-05, 1.9865110516548157e-05, 2.1595507860183716e-05, 2.3325905203819275e-05, 2.5056302547454834e-05, 2.6786699891090393e-05, 2.8517097234725952e-05, 3.024749457836151e-05, 3.197789192199707e-05, 3.370828926563263e-05, 3.543868660926819e-05, 3.716908395290375e-05, 3.889948129653931e-05, 4.0629878640174866e-05, 4.2360275983810425e-05, 4.4090673327445984e-05, 4.582107067108154e-05, 4.75514680147171e-05, 4.928186535835266e-05, 5.101226270198822e-05, 5.274266004562378e-05, 5.447305738925934e-05, 5.62034547328949e-05, 5.7933852076530457e-05, 5.9664249420166016e-05]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 6.0, 6.0, 10.0, 16.0, 15.0, 34.0, 43.0, 58.0, 119.0, 150.0, 139.0, 88.0, 45.0, 52.0, 54.0, 25.0, 29.0, 23.0, 18.0, 19.0, 7.0, 11.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0003272637550253421, -0.00031575027969665825, -0.0003042368043679744, -0.00029272332903929055, -0.00028120982460677624, -0.0002696963492780924, -0.00025818287394940853, -0.0002466693986207247, -0.00023515592329204082, -0.00022364244796335697, -0.00021212897263467312, -0.00020061548275407404, -0.00018910200742539018, -0.00017758853209670633, -0.00016607504221610725, -0.0001545615668874234, -0.00014304809155873954, -0.0001315346162300557, -0.00012002113362541422, -0.00010850765102077276, -9.69941756920889e-05, -8.548070036340505e-05, -7.396721775876358e-05, -6.245373515412211e-05, -5.094025982543826e-05, -3.94267808587756e-05, -2.791330189211294e-05, -1.639982292545028e-05, -4.88634395878762e-06, 6.62713500787504e-06, 1.81406139745377e-05, 2.9654096579179168e-05, 4.116760101169348e-05, 5.268107997835614e-05, 6.41945589450188e-05, 7.570804154966027e-05, 8.722151687834412e-05, 9.873499220702797e-05, 0.00011024847481166944, 0.0001217619574163109, 0.00013327543274499476, 0.0001447889080736786, 0.00015630238340236247, 0.00016781587328296155, 0.0001793293486116454, 0.00019084282394032925, 0.00020235631382092834, 0.0002138697891496122, 0.00022538326447829604, 0.0002368967398069799, 0.00024841021513566375, 0.0002599236904643476, 0.00027143716579303145, 0.00028295067022554576, 0.0002944641455542296, 0.00030597762088291347, 0.0003174910962115973, 0.0003290045715402812, 0.00034051804686896503, 0.0003520315221976489, 0.0003635450266301632, 0.00037505850195884705, 0.0003865719772875309, 0.00039808545261621475, 0.0004095989279448986]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 4.0, 5.0, 10.0, 16.0, 16.0, 16.0, 17.0, 19.0, 23.0, 31.0, 19.0, 27.0, 37.0, 25.0, 36.0, 35.0, 39.0, 34.0, 42.0, 44.0, 31.0, 37.0, 36.0, 34.0, 44.0, 31.0, 22.0, 32.0, 28.0, 35.0, 27.0, 19.0, 26.0, 25.0, 10.0, 12.0, 12.0, 11.0, 6.0, 9.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00019925832748413086, -0.0001932792365550995, -0.00018730014562606812, -0.00018132105469703674, -0.00017534196376800537, -0.000169362872838974, -0.00016338378190994263, -0.00015740469098091125, -0.00015142560005187988, -0.0001454465091228485, -0.00013946741819381714, -0.00013348832726478577, -0.0001275092363357544, -0.00012153014540672302, -0.00011555105447769165, -0.00010957196354866028, -0.0001035928726196289, -9.761378169059753e-05, -9.163469076156616e-05, -8.565559983253479e-05, -7.967650890350342e-05, -7.369741797447205e-05, -6.771832704544067e-05, -6.17392361164093e-05, -5.576014518737793e-05, -4.978105425834656e-05, -4.3801963329315186e-05, -3.7822872400283813e-05, -3.184378147125244e-05, -2.586469054222107e-05, -1.9885599613189697e-05, -1.3906508684158325e-05, -7.927417755126953e-06, -1.948326826095581e-06, 4.030764102935791e-06, 1.0009855031967163e-05, 1.5988945960998535e-05, 2.1968036890029907e-05, 2.794712781906128e-05, 3.392621874809265e-05, 3.9905309677124023e-05, 4.5884400606155396e-05, 5.186349153518677e-05, 5.784258246421814e-05, 6.382167339324951e-05, 6.980076432228088e-05, 7.577985525131226e-05, 8.175894618034363e-05, 8.7738037109375e-05, 9.371712803840637e-05, 9.969621896743774e-05, 0.00010567530989646912, 0.00011165440082550049, 0.00011763349175453186, 0.00012361258268356323, 0.0001295916736125946, 0.00013557076454162598, 0.00014154985547065735, 0.00014752894639968872, 0.0001535080373287201, 0.00015948712825775146, 0.00016546621918678284, 0.0001714453101158142, 0.00017742440104484558, 0.00018340349197387695]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 7.0, 6.0, 9.0, 14.0, 19.0, 28.0, 49.0, 61.0, 86.0, 128.0, 158.0, 229.0, 366.0, 551.0, 796.0, 1325.0, 1970.0, 3158.0, 5602.0, 10619.0, 23002.0, 56968.0, 203430.0, 554739.0, 110294.0, 38721.0, 16129.0, 8178.0, 4450.0, 2625.0, 1659.0, 1044.0, 649.0, 474.0, 289.0, 220.0, 152.0, 102.0, 75.0, 44.0, 39.0, 30.0, 13.0, 10.0, 6.0, 6.0, 4.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001289844512939453, -0.00012472644448280334, -0.00012046843767166138, -0.00011621043086051941, -0.00011195242404937744, -0.00010769441723823547, -0.0001034364104270935, -9.917840361595154e-05, -9.492039680480957e-05, -9.06623899936676e-05, -8.640438318252563e-05, -8.214637637138367e-05, -7.78883695602417e-05, -7.363036274909973e-05, -6.937235593795776e-05, -6.51143491268158e-05, -6.085634231567383e-05, -5.659833550453186e-05, -5.234032869338989e-05, -4.8082321882247925e-05, -4.382431507110596e-05, -3.956630825996399e-05, -3.530830144882202e-05, -3.1050294637680054e-05, -2.6792287826538086e-05, -2.2534281015396118e-05, -1.827627420425415e-05, -1.4018267393112183e-05, -9.760260581970215e-06, -5.502253770828247e-06, -1.2442469596862793e-06, 3.0137598514556885e-06, 7.271766662597656e-06, 1.1529773473739624e-05, 1.5787780284881592e-05, 2.004578709602356e-05, 2.4303793907165527e-05, 2.8561800718307495e-05, 3.281980752944946e-05, 3.707781434059143e-05, 4.13358211517334e-05, 4.5593827962875366e-05, 4.9851834774017334e-05, 5.41098415851593e-05, 5.836784839630127e-05, 6.262585520744324e-05, 6.68838620185852e-05, 7.114186882972717e-05, 7.539987564086914e-05, 7.965788245201111e-05, 8.391588926315308e-05, 8.817389607429504e-05, 9.243190288543701e-05, 9.668990969657898e-05, 0.00010094791650772095, 0.00010520592331886292, 0.00010946393013000488, 0.00011372193694114685, 0.00011797994375228882, 0.00012223795056343079, 0.00012649595737457275, 0.00013075396418571472, 0.0001350119709968567, 0.00013926997780799866, 0.00014352798461914062]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 9.0, 9.0, 15.0, 15.0, 17.0, 29.0, 43.0, 46.0, 68.0, 69.0, 107.0, 104.0, 94.0, 76.0, 79.0, 52.0, 32.0, 30.0, 32.0, 17.0, 5.0, 5.0, 10.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.0449981093406677e-05, -1.96211040019989e-05, -1.8792226910591125e-05, -1.796334981918335e-05, -1.7134472727775574e-05, -1.6305595636367798e-05, -1.5476718544960022e-05, -1.4647841453552246e-05, -1.381896436214447e-05, -1.2990087270736694e-05, -1.2161210179328918e-05, -1.1332333087921143e-05, -1.0503455996513367e-05, -9.67457890510559e-06, -8.845701813697815e-06, -8.016824722290039e-06, -7.187947630882263e-06, -6.359070539474487e-06, -5.5301934480667114e-06, -4.7013163566589355e-06, -3.87243926525116e-06, -3.043562173843384e-06, -2.214685082435608e-06, -1.385807991027832e-06, -5.569308996200562e-07, 2.7194619178771973e-07, 1.1008232831954956e-06, 1.9297003746032715e-06, 2.7585774660110474e-06, 3.5874545574188232e-06, 4.416331648826599e-06, 5.245208740234375e-06, 6.074085831642151e-06, 6.902962923049927e-06, 7.731840014457703e-06, 8.560717105865479e-06, 9.389594197273254e-06, 1.021847128868103e-05, 1.1047348380088806e-05, 1.1876225471496582e-05, 1.2705102562904358e-05, 1.3533979654312134e-05, 1.436285674571991e-05, 1.5191733837127686e-05, 1.602061092853546e-05, 1.6849488019943237e-05, 1.7678365111351013e-05, 1.850724220275879e-05, 1.9336119294166565e-05, 2.016499638557434e-05, 2.0993873476982117e-05, 2.1822750568389893e-05, 2.265162765979767e-05, 2.3480504751205444e-05, 2.430938184261322e-05, 2.5138258934020996e-05, 2.5967136025428772e-05, 2.6796013116836548e-05, 2.7624890208244324e-05, 2.84537672996521e-05, 2.9282644391059875e-05, 3.011152148246765e-05, 3.094039857387543e-05, 3.17692756652832e-05]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 11.0, 12.0, 16.0, 42.0, 48.0, 66.0, 80.0, 156.0, 223.0, 307.0, 494.0, 749.0, 1258.0, 1743.0, 2885.0, 4393.0, 6725.0, 10162.0, 16355.0, 25783.0, 42043.0, 70239.0, 142322.0, 369400.0, 153645.0, 79497.0, 44525.0, 27131.0, 16764.0, 11290.0, 7123.0, 4602.0, 2849.0, 1906.0, 1315.0, 837.0, 526.0, 347.0, 273.0, 140.0, 109.0, 53.0, 49.0, 20.0, 12.0, 20.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.9948692321777344e-05, -4.841480404138565e-05, -4.688091576099396e-05, -4.5347027480602264e-05, -4.381313920021057e-05, -4.227925091981888e-05, -4.0745362639427185e-05, -3.921147435903549e-05, -3.76775860786438e-05, -3.6143697798252106e-05, -3.460980951786041e-05, -3.307592123746872e-05, -3.1542032957077026e-05, -3.0008144676685333e-05, -2.847425639629364e-05, -2.6940368115901947e-05, -2.5406479835510254e-05, -2.387259155511856e-05, -2.2338703274726868e-05, -2.0804814994335175e-05, -1.927092671394348e-05, -1.773703843355179e-05, -1.6203150153160095e-05, -1.4669261872768402e-05, -1.3135373592376709e-05, -1.1601485311985016e-05, -1.0067597031593323e-05, -8.53370875120163e-06, -6.9998204708099365e-06, -5.465932190418243e-06, -3.93204391002655e-06, -2.398155629634857e-06, -8.642673492431641e-07, 6.69620931148529e-07, 2.203509211540222e-06, 3.7373974919319153e-06, 5.271285772323608e-06, 6.8051740527153015e-06, 8.339062333106995e-06, 9.872950613498688e-06, 1.1406838893890381e-05, 1.2940727174282074e-05, 1.4474615454673767e-05, 1.600850373506546e-05, 1.7542392015457153e-05, 1.9076280295848846e-05, 2.061016857624054e-05, 2.2144056856632233e-05, 2.3677945137023926e-05, 2.521183341741562e-05, 2.6745721697807312e-05, 2.8279609978199005e-05, 2.9813498258590698e-05, 3.134738653898239e-05, 3.2881274819374084e-05, 3.441516309976578e-05, 3.594905138015747e-05, 3.7482939660549164e-05, 3.901682794094086e-05, 4.055071622133255e-05, 4.208460450172424e-05, 4.3618492782115936e-05, 4.515238106250763e-05, 4.668626934289932e-05, 4.8220157623291016e-05]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 6.0, 11.0, 10.0, 14.0, 9.0, 16.0, 22.0, 16.0, 15.0, 25.0, 28.0, 20.0, 38.0, 42.0, 41.0, 45.0, 43.0, 38.0, 45.0, 54.0, 37.0, 45.0, 29.0, 37.0, 42.0, 35.0, 28.0, 22.0, 19.0, 31.0, 15.0, 20.0, 20.0, 18.0, 8.0, 13.0, 14.0, 7.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.886222839355469e-05, -3.7534162402153015e-05, -3.620609641075134e-05, -3.487803041934967e-05, -3.3549964427948e-05, -3.2221898436546326e-05, -3.089383244514465e-05, -2.956576645374298e-05, -2.823770046234131e-05, -2.6909634470939636e-05, -2.5581568479537964e-05, -2.425350248813629e-05, -2.292543649673462e-05, -2.1597370505332947e-05, -2.0269304513931274e-05, -1.8941238522529602e-05, -1.761317253112793e-05, -1.6285106539726257e-05, -1.4957040548324585e-05, -1.3628974556922913e-05, -1.230090856552124e-05, -1.0972842574119568e-05, -9.644776582717896e-06, -8.316710591316223e-06, -6.988644599914551e-06, -5.660578608512878e-06, -4.332512617111206e-06, -3.0044466257095337e-06, -1.6763806343078613e-06, -3.4831464290618896e-07, 9.797513484954834e-07, 2.3078173398971558e-06, 3.635883331298828e-06, 4.9639493227005005e-06, 6.292015314102173e-06, 7.620081305503845e-06, 8.948147296905518e-06, 1.027621328830719e-05, 1.1604279279708862e-05, 1.2932345271110535e-05, 1.4260411262512207e-05, 1.558847725391388e-05, 1.6916543245315552e-05, 1.8244609236717224e-05, 1.9572675228118896e-05, 2.090074121952057e-05, 2.222880721092224e-05, 2.3556873202323914e-05, 2.4884939193725586e-05, 2.6213005185127258e-05, 2.754107117652893e-05, 2.8869137167930603e-05, 3.0197203159332275e-05, 3.152526915073395e-05, 3.285333514213562e-05, 3.418140113353729e-05, 3.5509467124938965e-05, 3.683753311634064e-05, 3.816559910774231e-05, 3.949366509914398e-05, 4.0821731090545654e-05, 4.214979708194733e-05, 4.3477863073349e-05, 4.480592906475067e-05, 4.6133995056152344e-05]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 12.0, 8.0, 29.0, 33.0, 66.0, 71.0, 140.0, 153.0, 336.0, 507.0, 1347.0, 2221.0, 6674.0, 14183.0, 41920.0, 243983.0, 515209.0, 169627.0, 31247.0, 12721.0, 3712.0, 2214.0, 872.0, 536.0, 227.0, 191.0, 109.0, 91.0, 39.0, 24.0, 22.0, 7.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881092071533203e-06, -8.614733815193176e-06, -8.34837555885315e-06, -8.082017302513123e-06, -7.815659046173096e-06, -7.549300789833069e-06, -7.282942533493042e-06, -7.016584277153015e-06, -6.750226020812988e-06, -6.4838677644729614e-06, -6.2175095081329346e-06, -5.951151251792908e-06, -5.684792995452881e-06, -5.418434739112854e-06, -5.152076482772827e-06, -4.8857182264328e-06, -4.6193599700927734e-06, -4.353001713752747e-06, -4.08664345741272e-06, -3.820285201072693e-06, -3.553926944732666e-06, -3.287568688392639e-06, -3.0212104320526123e-06, -2.7548521757125854e-06, -2.4884939193725586e-06, -2.2221356630325317e-06, -1.955777406692505e-06, -1.689419150352478e-06, -1.4230608940124512e-06, -1.1567026376724243e-06, -8.903443813323975e-07, -6.239861249923706e-07, -3.5762786865234375e-07, -9.12696123123169e-08, 1.7508864402770996e-07, 4.414469003677368e-07, 7.078051567077637e-07, 9.741634130477905e-07, 1.2405216693878174e-06, 1.5068799257278442e-06, 1.773238182067871e-06, 2.039596438407898e-06, 2.305954694747925e-06, 2.5723129510879517e-06, 2.8386712074279785e-06, 3.1050294637680054e-06, 3.3713877201080322e-06, 3.637745976448059e-06, 3.904104232788086e-06, 4.170462489128113e-06, 4.43682074546814e-06, 4.7031790018081665e-06, 4.969537258148193e-06, 5.23589551448822e-06, 5.502253770828247e-06, 5.768612027168274e-06, 6.034970283508301e-06, 6.301328539848328e-06, 6.5676867961883545e-06, 6.834045052528381e-06, 7.100403308868408e-06, 7.366761565208435e-06, 7.633119821548462e-06, 7.899478077888489e-06, 8.165836334228516e-06]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 6.0, 7.0, 11.0, 13.0, 9.0, 16.0, 33.0, 28.0, 72.0, 33.0, 37.0, 76.0, 47.0, 45.0, 77.0, 36.0, 48.0, 88.0, 32.0, 74.0, 27.0, 31.0, 57.0, 17.0, 15.0, 25.0, 4.0, 5.0, 17.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7418136596679688e-06, -2.660788595676422e-06, -2.5797635316848755e-06, -2.498738467693329e-06, -2.4177134037017822e-06, -2.3366883397102356e-06, -2.255663275718689e-06, -2.1746382117271423e-06, -2.0936131477355957e-06, -2.012588083744049e-06, -1.9315630197525024e-06, -1.8505379557609558e-06, -1.7695128917694092e-06, -1.6884878277778625e-06, -1.607462763786316e-06, -1.5264376997947693e-06, -1.4454126358032227e-06, -1.364387571811676e-06, -1.2833625078201294e-06, -1.2023374438285828e-06, -1.1213123798370361e-06, -1.0402873158454895e-06, -9.592622518539429e-07, -8.782371878623962e-07, -7.972121238708496e-07, -7.16187059879303e-07, -6.351619958877563e-07, -5.541369318962097e-07, -4.731118679046631e-07, -3.9208680391311646e-07, -3.110617399215698e-07, -2.300366759300232e-07, -1.4901161193847656e-07, -6.798654794692993e-08, 1.30385160446167e-08, 9.406358003616333e-08, 1.7508864402770996e-07, 2.561137080192566e-07, 3.371387720108032e-07, 4.1816383600234985e-07, 4.991888999938965e-07, 5.802139639854431e-07, 6.612390279769897e-07, 7.422640919685364e-07, 8.23289155960083e-07, 9.043142199516296e-07, 9.853392839431763e-07, 1.066364347934723e-06, 1.1473894119262695e-06, 1.2284144759178162e-06, 1.3094395399093628e-06, 1.3904646039009094e-06, 1.471489667892456e-06, 1.5525147318840027e-06, 1.6335397958755493e-06, 1.714564859867096e-06, 1.7955899238586426e-06, 1.8766149878501892e-06, 1.957640051841736e-06, 2.0386651158332825e-06, 2.119690179824829e-06, 2.2007152438163757e-06, 2.2817403078079224e-06, 2.362765371799469e-06, 2.4437904357910156e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 6.0, 27.0, 18.0, 26.0, 19.0, 60.0, 89.0, 129.0, 148.0, 111.0, 292.0, 430.0, 685.0, 483.0, 1407.0, 2130.0, 3458.0, 2593.0, 7741.0, 13741.0, 26157.0, 21850.0, 80981.0, 240218.0, 399757.0, 133025.0, 31889.0, 36501.0, 18867.0, 10288.0, 3276.0, 4428.0, 2702.0, 1775.0, 595.0, 879.0, 619.0, 374.0, 143.0, 205.0, 146.0, 90.0, 62.0, 24.0, 29.0, 26.0, 20.0, 5.0, 13.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.3974647521972656e-06, -3.2922253012657166e-06, -3.1869858503341675e-06, -3.0817463994026184e-06, -2.9765069484710693e-06, -2.8712674975395203e-06, -2.766028046607971e-06, -2.660788595676422e-06, -2.555549144744873e-06, -2.450309693813324e-06, -2.345070242881775e-06, -2.239830791950226e-06, -2.1345913410186768e-06, -2.0293518900871277e-06, -1.9241124391555786e-06, -1.8188729882240295e-06, -1.7136335372924805e-06, -1.6083940863609314e-06, -1.5031546354293823e-06, -1.3979151844978333e-06, -1.2926757335662842e-06, -1.1874362826347351e-06, -1.082196831703186e-06, -9.76957380771637e-07, -8.717179298400879e-07, -7.664784789085388e-07, -6.612390279769897e-07, -5.559995770454407e-07, -4.507601261138916e-07, -3.4552067518234253e-07, -2.4028122425079346e-07, -1.3504177331924438e-07, -2.9802322387695312e-08, 7.543712854385376e-08, 1.8067657947540283e-07, 2.859160304069519e-07, 3.91155481338501e-07, 4.9639493227005e-07, 6.016343832015991e-07, 7.068738341331482e-07, 8.121132850646973e-07, 9.173527359962463e-07, 1.0225921869277954e-06, 1.1278316378593445e-06, 1.2330710887908936e-06, 1.3383105397224426e-06, 1.4435499906539917e-06, 1.5487894415855408e-06, 1.6540288925170898e-06, 1.759268343448639e-06, 1.864507794380188e-06, 1.969747245311737e-06, 2.074986696243286e-06, 2.180226147174835e-06, 2.2854655981063843e-06, 2.3907050490379333e-06, 2.4959444999694824e-06, 2.6011839509010315e-06, 2.7064234018325806e-06, 2.8116628527641296e-06, 2.9169023036956787e-06, 3.0221417546272278e-06, 3.127381205558777e-06, 3.232620656490326e-06, 3.337860107421875e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 8.0, 2.0, 4.0, 5.0, 9.0, 8.0, 20.0, 24.0, 18.0, 35.0, 20.0, 65.0, 28.0, 58.0, 37.0, 102.0, 39.0, 68.0, 80.0, 47.0, 71.0, 25.0, 39.0, 19.0, 36.0, 9.0, 29.0, 10.0, 26.0, 14.0, 8.0, 10.0, 1.0, 8.0, 5.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.7688220143318176e-06, -2.6766210794448853e-06, -2.584420144557953e-06, -2.4922192096710205e-06, -2.400018274784088e-06, -2.3078173398971558e-06, -2.2156164050102234e-06, -2.123415470123291e-06, -2.0312145352363586e-06, -1.9390136003494263e-06, -1.846812665462494e-06, -1.7546117305755615e-06, -1.6624107956886292e-06, -1.5702098608016968e-06, -1.4780089259147644e-06, -1.385807991027832e-06, -1.2936070561408997e-06, -1.2014061212539673e-06, -1.109205186367035e-06, -1.0170042514801025e-06, -9.248033165931702e-07, -8.326023817062378e-07, -7.404014468193054e-07, -6.48200511932373e-07, -5.559995770454407e-07, -4.637986421585083e-07, -3.7159770727157593e-07, -2.7939677238464355e-07, -1.8719583749771118e-07, -9.499490261077881e-08, -2.7939677238464355e-09, 8.940696716308594e-08, 1.816079020500183e-07, 2.738088369369507e-07, 3.6600977182388306e-07, 4.5821070671081543e-07, 5.504116415977478e-07, 6.426125764846802e-07, 7.348135113716125e-07, 8.270144462585449e-07, 9.192153811454773e-07, 1.0114163160324097e-06, 1.103617250919342e-06, 1.1958181858062744e-06, 1.2880191206932068e-06, 1.3802200555801392e-06, 1.4724209904670715e-06, 1.564621925354004e-06, 1.6568228602409363e-06, 1.7490237951278687e-06, 1.841224730014801e-06, 1.9334256649017334e-06, 2.0256265997886658e-06, 2.117827534675598e-06, 2.2100284695625305e-06, 2.302229404449463e-06, 2.3944303393363953e-06, 2.4866312742233276e-06, 2.57883220911026e-06, 2.6710331439971924e-06, 2.7632340788841248e-06, 2.855435013771057e-06, 2.9476359486579895e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 5.0, 8.0, 9.0, 22.0, 14.0, 45.0, 90.0, 169.0, 196.0, 92.0, 86.0, 48.0, 35.0, 36.0, 35.0, 23.0, 15.0, 9.0, 8.0, 10.0, 13.0, 4.0, 6.0, 5.0, 5.0, 7.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011795697355410084, -0.00011018435179721564, -0.00010241173731628805, -9.463912283536047e-05, -8.686650107847527e-05, -7.909387932159007e-05, -7.132126484066248e-05, -6.354865035973489e-05, -5.577602860284969e-05, -4.80034104839433e-05, -4.0230792365036905e-05, -3.245817424613051e-05, -2.4685556127224118e-05, -1.6912938008317724e-05, -9.14031988941133e-06, -1.3677017705049366e-06, 6.404916348401457e-06, 1.417753446730785e-05, 2.1950152586214244e-05, 2.9722770705120638e-05, 3.749538882402703e-05, 4.5268006942933425e-05, 5.304062506183982e-05, 6.081324318074621e-05, 6.85858612996526e-05, 7.635848305653781e-05, 8.41310975374654e-05, 9.190371201839298e-05, 9.967633377527818e-05, 0.00010744895553216338, 0.00011522157001309097, 0.00012299418449401855, 0.0001307668280787766, 0.00013853944255970418, 0.00014631205704063177, 0.00015408468607347459, 0.00016185730055440217, 0.00016962991503532976, 0.00017740254406817257, 0.00018517515854910016, 0.00019294777303002775, 0.00020072038751095533, 0.00020849300199188292, 0.00021626563102472574, 0.00022403824550565332, 0.0002318108599865809, 0.00023958348901942372, 0.0002473561035003513, 0.0002551287179812789, 0.0002629013324622065, 0.00027067394694313407, 0.00027844656142406166, 0.00028621917590498924, 0.0002939918194897473, 0.00030176443397067487, 0.00030953704845160246, 0.00031730966293253005, 0.00032508227741345763, 0.0003328548918943852, 0.0003406275063753128, 0.00034840014996007085, 0.00035617276444099844, 0.000363945378921926, 0.0003717179934028536, 0.0003794906078837812]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 3.0, 14.0, 5.0, 9.0, 10.0, 11.0, 22.0, 25.0, 26.0, 24.0, 30.0, 31.0, 37.0, 46.0, 31.0, 56.0, 47.0, 52.0, 36.0, 42.0, 38.0, 38.0, 39.0, 37.0, 29.0, 30.0, 45.0, 25.0, 25.0, 18.0, 19.0, 13.0, 14.0, 18.0, 14.0, 6.0, 7.0, 5.0, 2.0, 10.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011593103408813477, -0.0001118360087275505, -0.00010774098336696625, -0.00010364595800638199, -9.955093264579773e-05, -9.545590728521347e-05, -9.136088192462921e-05, -8.726585656404495e-05, -8.31708312034607e-05, -7.907580584287643e-05, -7.498078048229218e-05, -7.088575512170792e-05, -6.679072976112366e-05, -6.26957044005394e-05, -5.860067903995514e-05, -5.450565367937088e-05, -5.041062831878662e-05, -4.631560295820236e-05, -4.22205775976181e-05, -3.8125552237033844e-05, -3.4030526876449585e-05, -2.9935501515865326e-05, -2.5840476155281067e-05, -2.1745450794696808e-05, -1.765042543411255e-05, -1.355540007352829e-05, -9.46037471294403e-06, -5.365349352359772e-06, -1.2703239917755127e-06, 2.8247013688087463e-06, 6.919726729393005e-06, 1.1014752089977264e-05, 1.5109777450561523e-05, 1.9204802811145782e-05, 2.329982817173004e-05, 2.73948535323143e-05, 3.148987889289856e-05, 3.558490425348282e-05, 3.967992961406708e-05, 4.377495497465134e-05, 4.7869980335235596e-05, 5.1965005695819855e-05, 5.6060031056404114e-05, 6.015505641698837e-05, 6.425008177757263e-05, 6.834510713815689e-05, 7.244013249874115e-05, 7.653515785932541e-05, 8.063018321990967e-05, 8.472520858049393e-05, 8.882023394107819e-05, 9.291525930166245e-05, 9.70102846622467e-05, 0.00010110531002283096, 0.00010520033538341522, 0.00010929536074399948, 0.00011339038610458374, 0.000117485411465168, 0.00012158043682575226, 0.00012567546218633652, 0.00012977048754692078, 0.00013386551290750504, 0.0001379605382680893, 0.00014205556362867355, 0.0001461505889892578]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 10.0, 20.0, 35.0, 49.0, 73.0, 122.0, 175.0, 268.0, 407.0, 668.0, 1197.0, 2071.0, 3947.0, 8085.0, 18327.0, 57531.0, 3943660.0, 111704.0, 25417.0, 10269.0, 4500.0, 2214.0, 1253.0, 722.0, 487.0, 289.0, 202.0, 143.0, 97.0, 68.0, 44.0, 33.0, 34.0, 24.0, 19.0, 21.0, 24.0, 15.0, 11.0, 6.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012755393981933594, -0.00012216530740261078, -0.00011677667498588562, -0.00011138804256916046, -0.0001059994101524353, -0.00010061077773571014, -9.522214531898499e-05, -8.983351290225983e-05, -8.444488048553467e-05, -7.905624806880951e-05, -7.366761565208435e-05, -6.827898323535919e-05, -6.289035081863403e-05, -5.7501718401908875e-05, -5.2113085985183716e-05, -4.672445356845856e-05, -4.13358211517334e-05, -3.594718873500824e-05, -3.055855631828308e-05, -2.5169923901557922e-05, -1.9781291484832764e-05, -1.4392659068107605e-05, -9.004026651382446e-06, -3.6153942346572876e-06, 1.773238182067871e-06, 7.16187059879303e-06, 1.2550503015518188e-05, 1.7939135432243347e-05, 2.3327767848968506e-05, 2.8716400265693665e-05, 3.410503268241882e-05, 3.949366509914398e-05, 4.488229751586914e-05, 5.02709299325943e-05, 5.565956234931946e-05, 6.104819476604462e-05, 6.643682718276978e-05, 7.182545959949493e-05, 7.721409201622009e-05, 8.260272443294525e-05, 8.799135684967041e-05, 9.337998926639557e-05, 9.876862168312073e-05, 0.00010415725409984589, 0.00010954588651657104, 0.0001149345189332962, 0.00012032315135002136, 0.00012571178376674652, 0.00013110041618347168, 0.00013648904860019684, 0.000141877681016922, 0.00014726631343364716, 0.00015265494585037231, 0.00015804357826709747, 0.00016343221068382263, 0.0001688208431005478, 0.00017420947551727295, 0.0001795981079339981, 0.00018498674035072327, 0.00019037537276744843, 0.00019576400518417358, 0.00020115263760089874, 0.0002065412700176239, 0.00021192990243434906, 0.00021731853485107422]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 1.0, 3.0, 12.0, 10.0, 17.0, 24.0, 31.0, 45.0, 52.0, 90.0, 83.0, 118.0, 113.0, 108.0, 63.0, 70.0, 52.0, 38.0, 18.0, 9.0, 12.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4080276489257812e-05, -2.308003604412079e-05, -2.2079795598983765e-05, -2.107955515384674e-05, -2.0079314708709717e-05, -1.9079074263572693e-05, -1.807883381843567e-05, -1.7078593373298645e-05, -1.607835292816162e-05, -1.5078112483024597e-05, -1.4077872037887573e-05, -1.307763159275055e-05, -1.2077391147613525e-05, -1.1077150702476501e-05, -1.0076910257339478e-05, -9.076669812202454e-06, -8.07642936706543e-06, -7.076188921928406e-06, -6.075948476791382e-06, -5.075708031654358e-06, -4.075467586517334e-06, -3.07522714138031e-06, -2.074986696243286e-06, -1.0747462511062622e-06, -7.450580596923828e-08, 9.257346391677856e-07, 1.9259750843048096e-06, 2.9262155294418335e-06, 3.926455974578857e-06, 4.926696419715881e-06, 5.926936864852905e-06, 6.927177309989929e-06, 7.927417755126953e-06, 8.927658200263977e-06, 9.927898645401001e-06, 1.0928139090538025e-05, 1.1928379535675049e-05, 1.2928619980812073e-05, 1.3928860425949097e-05, 1.492910087108612e-05, 1.5929341316223145e-05, 1.692958176136017e-05, 1.7929822206497192e-05, 1.8930062651634216e-05, 1.993030309677124e-05, 2.0930543541908264e-05, 2.1930783987045288e-05, 2.2931024432182312e-05, 2.3931264877319336e-05, 2.493150532245636e-05, 2.5931745767593384e-05, 2.6931986212730408e-05, 2.793222665786743e-05, 2.8932467103004456e-05, 2.993270754814148e-05, 3.0932947993278503e-05, 3.193318843841553e-05, 3.293342888355255e-05, 3.3933669328689575e-05, 3.49339097738266e-05, 3.593415021896362e-05, 3.693439066410065e-05, 3.793463110923767e-05, 3.8934871554374695e-05, 3.993511199951172e-05]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 3.0, 8.0, 12.0, 12.0, 33.0, 35.0, 56.0, 79.0, 127.0, 203.0, 281.0, 495.0, 807.0, 1159.0, 1801.0, 3070.0, 5113.0, 8690.0, 15840.0, 31066.0, 72553.0, 596058.0, 3271612.0, 103391.0, 37743.0, 18801.0, 10072.0, 5711.0, 3586.0, 2198.0, 1282.0, 875.0, 521.0, 348.0, 226.0, 141.0, 99.0, 60.0, 42.0, 27.0, 11.0, 8.0, 12.0, 10.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.4849853515625e-05, -6.289221346378326e-05, -6.093457341194153e-05, -5.897693336009979e-05, -5.701929330825806e-05, -5.506165325641632e-05, -5.3104013204574585e-05, -5.114637315273285e-05, -4.918873310089111e-05, -4.723109304904938e-05, -4.527345299720764e-05, -4.3315812945365906e-05, -4.135817289352417e-05, -3.9400532841682434e-05, -3.74428927898407e-05, -3.548525273799896e-05, -3.3527612686157227e-05, -3.156997263431549e-05, -2.9612332582473755e-05, -2.765469253063202e-05, -2.5697052478790283e-05, -2.3739412426948547e-05, -2.178177237510681e-05, -1.9824132323265076e-05, -1.786649227142334e-05, -1.5908852219581604e-05, -1.3951212167739868e-05, -1.1993572115898132e-05, -1.0035932064056396e-05, -8.07829201221466e-06, -6.120651960372925e-06, -4.163011908531189e-06, -2.205371856689453e-06, -2.477318048477173e-07, 1.7099082469940186e-06, 3.6675482988357544e-06, 5.62518835067749e-06, 7.582828402519226e-06, 9.540468454360962e-06, 1.1498108506202698e-05, 1.3455748558044434e-05, 1.541338860988617e-05, 1.7371028661727905e-05, 1.932866871356964e-05, 2.1286308765411377e-05, 2.3243948817253113e-05, 2.520158886909485e-05, 2.7159228920936584e-05, 2.911686897277832e-05, 3.1074509024620056e-05, 3.303214907646179e-05, 3.498978912830353e-05, 3.6947429180145264e-05, 3.8905069231987e-05, 4.0862709283828735e-05, 4.282034933567047e-05, 4.477798938751221e-05, 4.673562943935394e-05, 4.869326949119568e-05, 5.0650909543037415e-05, 5.260854959487915e-05, 5.4566189646720886e-05, 5.652382969856262e-05, 5.848146975040436e-05, 6.0439109802246094e-05]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 3.0, 3.0, 3.0, 8.0, 12.0, 15.0, 9.0, 17.0, 20.0, 28.0, 26.0, 45.0, 118.0, 303.0, 1118.0, 1690.0, 269.0, 90.0, 51.0, 45.0, 17.0, 24.0, 20.0, 24.0, 18.0, 14.0, 16.0, 9.0, 8.0, 7.0, 7.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.737211227416992e-05, -3.603845834732056e-05, -3.470480442047119e-05, -3.3371150493621826e-05, -3.203749656677246e-05, -3.0703842639923096e-05, -2.937018871307373e-05, -2.8036534786224365e-05, -2.6702880859375e-05, -2.5369226932525635e-05, -2.403557300567627e-05, -2.2701919078826904e-05, -2.136826515197754e-05, -2.0034611225128174e-05, -1.870095729827881e-05, -1.7367303371429443e-05, -1.6033649444580078e-05, -1.4699995517730713e-05, -1.3366341590881348e-05, -1.2032687664031982e-05, -1.0699033737182617e-05, -9.365379810333252e-06, -8.031725883483887e-06, -6.6980719566345215e-06, -5.364418029785156e-06, -4.030764102935791e-06, -2.6971101760864258e-06, -1.3634562492370605e-06, -2.9802322387695312e-08, 1.30385160446167e-06, 2.637505531311035e-06, 3.9711594581604e-06, 5.304813385009766e-06, 6.638467311859131e-06, 7.972121238708496e-06, 9.305775165557861e-06, 1.0639429092407227e-05, 1.1973083019256592e-05, 1.3306736946105957e-05, 1.4640390872955322e-05, 1.5974044799804688e-05, 1.7307698726654053e-05, 1.8641352653503418e-05, 1.9975006580352783e-05, 2.130866050720215e-05, 2.2642314434051514e-05, 2.397596836090088e-05, 2.5309622287750244e-05, 2.664327621459961e-05, 2.7976930141448975e-05, 2.931058406829834e-05, 3.0644237995147705e-05, 3.197789192199707e-05, 3.3311545848846436e-05, 3.46451997756958e-05, 3.5978853702545166e-05, 3.731250762939453e-05, 3.8646161556243896e-05, 3.997981548309326e-05, 4.131346940994263e-05, 4.264712333679199e-05, 4.398077726364136e-05, 4.531443119049072e-05, 4.664808511734009e-05, 4.798173904418945e-05]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 11.0, 17.0, 13.0, 21.0, 29.0, 49.0, 53.0, 77.0, 106.0, 114.0, 95.0, 87.0, 59.0, 41.0, 29.0, 29.0, 19.0, 27.0, 20.0, 21.0, 18.0, 12.0, 7.0, 4.0, 6.0, 6.0, 10.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012354517821222544, -0.00011799007188528776, -0.0001124349728343077, -0.00010687987378332764, -0.00010132476745638996, -9.576966112945229e-05, -9.021456207847223e-05, -8.465946302749217e-05, -7.910435670055449e-05, -7.354925037361681e-05, -6.799415132263675e-05, -6.243905227165669e-05, -5.6883945944719017e-05, -5.132884325576015e-05, -4.577374056680128e-05, -4.021863787784241e-05, -3.466353518888354e-05, -2.9108432499924675e-05, -2.3553329810965806e-05, -1.7998227122006938e-05, -1.244312443304807e-05, -6.888021744089201e-06, -1.3329190551303327e-06, 4.222183633828536e-06, 9.777286322787404e-06, 1.5332389011746272e-05, 2.088749170070514e-05, 2.644259438966401e-05, 3.199769707862288e-05, 3.7552799767581746e-05, 4.3107902456540614e-05, 4.866300514549948e-05, 5.421809328254312e-05, 5.977319597150199e-05, 6.532829866046086e-05, 7.088339771144092e-05, 7.64385040383786e-05, 8.199361036531627e-05, 8.754870941629633e-05, 9.31038084672764e-05, 9.865891479421407e-05, 0.00010421402112115175, 0.0001097691201721318, 0.00011532421922311187, 0.00012087932555004954, 0.00012643443187698722, 0.0001319895382039249, 0.00013754462997894734, 0.00014309973630588502, 0.0001486548426328227, 0.00015420993440784514, 0.00015976504073478281, 0.0001653201470617205, 0.00017087525338865817, 0.00017643035971559584, 0.0001819854514906183, 0.00018754055781755596, 0.00019309566414449364, 0.0001986507559195161, 0.00020420586224645376, 0.00020976096857339144, 0.0002153160749003291, 0.0002208711812272668, 0.00022642627300228924, 0.0002319813793292269]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 10.0, 13.0, 10.0, 23.0, 15.0, 19.0, 23.0, 27.0, 17.0, 24.0, 18.0, 22.0, 41.0, 30.0, 35.0, 38.0, 33.0, 29.0, 36.0, 41.0, 40.0, 40.0, 38.0, 28.0, 43.0, 35.0, 27.0, 26.0, 29.0, 23.0, 21.0, 22.0, 23.0, 14.0, 16.0, 10.0, 14.0, 8.0, 10.0, 7.0, 8.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00010341405868530273, -0.00010017026215791702, -9.692646563053131e-05, -9.36826691031456e-05, -9.043887257575989e-05, -8.719507604837418e-05, -8.395127952098846e-05, -8.070748299360275e-05, -7.746368646621704e-05, -7.421988993883133e-05, -7.097609341144562e-05, -6.77322968840599e-05, -6.44885003566742e-05, -6.124470382928848e-05, -5.800090730190277e-05, -5.475711077451706e-05, -5.151331424713135e-05, -4.8269517719745636e-05, -4.5025721192359924e-05, -4.178192466497421e-05, -3.85381281375885e-05, -3.529433161020279e-05, -3.205053508281708e-05, -2.8806738555431366e-05, -2.5562942028045654e-05, -2.2319145500659943e-05, -1.907534897327423e-05, -1.583155244588852e-05, -1.2587755918502808e-05, -9.343959391117096e-06, -6.100162863731384e-06, -2.8563663363456726e-06, 3.8743019104003906e-07, 3.6312267184257507e-06, 6.875023245811462e-06, 1.0118819773197174e-05, 1.3362616300582886e-05, 1.6606412827968597e-05, 1.985020935535431e-05, 2.309400588274002e-05, 2.6337802410125732e-05, 2.9581598937511444e-05, 3.2825395464897156e-05, 3.606919199228287e-05, 3.931298851966858e-05, 4.255678504705429e-05, 4.580058157444e-05, 4.9044378101825714e-05, 5.2288174629211426e-05, 5.553197115659714e-05, 5.877576768398285e-05, 6.201956421136856e-05, 6.526336073875427e-05, 6.850715726613998e-05, 7.17509537935257e-05, 7.499475032091141e-05, 7.823854684829712e-05, 8.148234337568283e-05, 8.472613990306854e-05, 8.796993643045425e-05, 9.121373295783997e-05, 9.445752948522568e-05, 9.770132601261139e-05, 0.0001009451225399971, 0.00010418891906738281]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 6.0, 6.0, 9.0, 12.0, 12.0, 21.0, 26.0, 27.0, 38.0, 61.0, 110.0, 178.0, 297.0, 535.0, 976.0, 1836.0, 3873.0, 8733.0, 22523.0, 68426.0, 405870.0, 425745.0, 69792.0, 22508.0, 8676.0, 4035.0, 1866.0, 953.0, 555.0, 314.0, 176.0, 120.0, 63.0, 48.0, 37.0, 18.0, 21.0, 17.0, 8.0, 5.0, 5.0, 3.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018846988677978516, -0.00018292665481567383, -0.0001773834228515625, -0.00017184019088745117, -0.00016629695892333984, -0.00016075372695922852, -0.0001552104949951172, -0.00014966726303100586, -0.00014412403106689453, -0.0001385807991027832, -0.00013303756713867188, -0.00012749433517456055, -0.00012195110321044922, -0.00011640787124633789, -0.00011086463928222656, -0.00010532140731811523, -9.97781753540039e-05, -9.423494338989258e-05, -8.869171142578125e-05, -8.314847946166992e-05, -7.76052474975586e-05, -7.206201553344727e-05, -6.651878356933594e-05, -6.097555160522461e-05, -5.543231964111328e-05, -4.988908767700195e-05, -4.4345855712890625e-05, -3.88026237487793e-05, -3.325939178466797e-05, -2.771615982055664e-05, -2.2172927856445312e-05, -1.6629695892333984e-05, -1.1086463928222656e-05, -5.543231964111328e-06, 0.0, 5.543231964111328e-06, 1.1086463928222656e-05, 1.6629695892333984e-05, 2.2172927856445312e-05, 2.771615982055664e-05, 3.325939178466797e-05, 3.88026237487793e-05, 4.4345855712890625e-05, 4.988908767700195e-05, 5.543231964111328e-05, 6.097555160522461e-05, 6.651878356933594e-05, 7.206201553344727e-05, 7.76052474975586e-05, 8.314847946166992e-05, 8.869171142578125e-05, 9.423494338989258e-05, 9.97781753540039e-05, 0.00010532140731811523, 0.00011086463928222656, 0.00011640787124633789, 0.00012195110321044922, 0.00012749433517456055, 0.00013303756713867188, 0.0001385807991027832, 0.00014412403106689453, 0.00014966726303100586, 0.0001552104949951172, 0.00016075372695922852, 0.00016629695892333984]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 3.0, 7.0, 7.0, 9.0, 22.0, 28.0, 23.0, 41.0, 41.0, 58.0, 83.0, 86.0, 101.0, 94.0, 106.0, 68.0, 59.0, 44.0, 36.0, 23.0, 14.0, 12.0, 14.0, 2.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.811981201171875e-05, -1.7253682017326355e-05, -1.638755202293396e-05, -1.5521422028541565e-05, -1.465529203414917e-05, -1.3789162039756775e-05, -1.292303204536438e-05, -1.2056902050971985e-05, -1.119077205657959e-05, -1.0324642062187195e-05, -9.4585120677948e-06, -8.592382073402405e-06, -7.72625207901001e-06, -6.860122084617615e-06, -5.99399209022522e-06, -5.127862095832825e-06, -4.26173210144043e-06, -3.3956021070480347e-06, -2.5294721126556396e-06, -1.6633421182632446e-06, -7.972121238708496e-07, 6.891787052154541e-08, 9.350478649139404e-07, 1.8011778593063354e-06, 2.6673078536987305e-06, 3.5334378480911255e-06, 4.3995678424835205e-06, 5.2656978368759155e-06, 6.1318278312683105e-06, 6.9979578256607056e-06, 7.8640878200531e-06, 8.730217814445496e-06, 9.59634780883789e-06, 1.0462477803230286e-05, 1.132860779762268e-05, 1.2194737792015076e-05, 1.306086778640747e-05, 1.3926997780799866e-05, 1.479312777519226e-05, 1.5659257769584656e-05, 1.652538776397705e-05, 1.7391517758369446e-05, 1.825764775276184e-05, 1.9123777747154236e-05, 1.998990774154663e-05, 2.0856037735939026e-05, 2.172216773033142e-05, 2.2588297724723816e-05, 2.345442771911621e-05, 2.4320557713508606e-05, 2.5186687707901e-05, 2.6052817702293396e-05, 2.691894769668579e-05, 2.7785077691078186e-05, 2.865120768547058e-05, 2.9517337679862976e-05, 3.038346767425537e-05, 3.1249597668647766e-05, 3.211572766304016e-05, 3.2981857657432556e-05, 3.384798765182495e-05, 3.4714117646217346e-05, 3.558024764060974e-05, 3.6446377635002136e-05, 3.731250762939453e-05]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 8.0, 2.0, 8.0, 8.0, 17.0, 19.0, 30.0, 40.0, 48.0, 88.0, 158.0, 200.0, 257.0, 421.0, 605.0, 931.0, 1460.0, 2349.0, 3432.0, 5744.0, 9276.0, 15487.0, 25735.0, 43946.0, 83223.0, 179639.0, 382955.0, 135998.0, 64886.0, 36071.0, 21364.0, 12824.0, 7627.0, 4935.0, 3056.0, 1946.0, 1279.0, 861.0, 541.0, 321.0, 240.0, 158.0, 105.0, 88.0, 61.0, 40.0, 19.0, 15.0, 12.0, 10.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.869699478149414e-05, -4.703644663095474e-05, -4.5375898480415344e-05, -4.3715350329875946e-05, -4.205480217933655e-05, -4.039425402879715e-05, -3.873370587825775e-05, -3.707315772771835e-05, -3.5412609577178955e-05, -3.375206142663956e-05, -3.209151327610016e-05, -3.043096512556076e-05, -2.8770416975021362e-05, -2.7109868824481964e-05, -2.5449320673942566e-05, -2.3788772523403168e-05, -2.212822437286377e-05, -2.046767622232437e-05, -1.8807128071784973e-05, -1.7146579921245575e-05, -1.5486031770706177e-05, -1.3825483620166779e-05, -1.216493546962738e-05, -1.0504387319087982e-05, -8.843839168548584e-06, -7.183291018009186e-06, -5.522742867469788e-06, -3.862194716930389e-06, -2.201646566390991e-06, -5.41098415851593e-07, 1.1194497346878052e-06, 2.7799978852272034e-06, 4.4405460357666016e-06, 6.101094186306e-06, 7.761642336845398e-06, 9.422190487384796e-06, 1.1082738637924194e-05, 1.2743286788463593e-05, 1.440383493900299e-05, 1.606438308954239e-05, 1.7724931240081787e-05, 1.9385479390621185e-05, 2.1046027541160583e-05, 2.270657569169998e-05, 2.436712384223938e-05, 2.6027671992778778e-05, 2.7688220143318176e-05, 2.9348768293857574e-05, 3.100931644439697e-05, 3.266986459493637e-05, 3.433041274547577e-05, 3.599096089601517e-05, 3.7651509046554565e-05, 3.9312057197093964e-05, 4.097260534763336e-05, 4.263315349817276e-05, 4.429370164871216e-05, 4.5954249799251556e-05, 4.7614797949790955e-05, 4.927534610033035e-05, 5.093589425086975e-05, 5.259644240140915e-05, 5.425699055194855e-05, 5.5917538702487946e-05, 5.7578086853027344e-05]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 6.0, 12.0, 12.0, 9.0, 12.0, 25.0, 19.0, 24.0, 20.0, 22.0, 33.0, 38.0, 37.0, 28.0, 45.0, 42.0, 37.0, 41.0, 45.0, 47.0, 36.0, 45.0, 50.0, 34.0, 22.0, 23.0, 29.0, 34.0, 26.0, 22.0, 20.0, 16.0, 13.0, 16.0, 12.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-4.786252975463867e-05, -4.6479515731334686e-05, -4.50965017080307e-05, -4.3713487684726715e-05, -4.233047366142273e-05, -4.0947459638118744e-05, -3.956444561481476e-05, -3.818143159151077e-05, -3.679841756820679e-05, -3.54154035449028e-05, -3.4032389521598816e-05, -3.264937549829483e-05, -3.1266361474990845e-05, -2.988334745168686e-05, -2.8500333428382874e-05, -2.7117319405078888e-05, -2.5734305381774902e-05, -2.4351291358470917e-05, -2.296827733516693e-05, -2.1585263311862946e-05, -2.020224928855896e-05, -1.8819235265254974e-05, -1.743622124195099e-05, -1.6053207218647003e-05, -1.4670193195343018e-05, -1.3287179172039032e-05, -1.1904165148735046e-05, -1.052115112543106e-05, -9.138137102127075e-06, -7.75512307882309e-06, -6.372109055519104e-06, -4.989095032215118e-06, -3.606081008911133e-06, -2.2230669856071472e-06, -8.400529623031616e-07, 5.42961061000824e-07, 1.9259750843048096e-06, 3.308989107608795e-06, 4.692003130912781e-06, 6.075017154216766e-06, 7.458031177520752e-06, 8.841045200824738e-06, 1.0224059224128723e-05, 1.1607073247432709e-05, 1.2990087270736694e-05, 1.437310129404068e-05, 1.5756115317344666e-05, 1.713912934064865e-05, 1.8522143363952637e-05, 1.9905157387256622e-05, 2.1288171410560608e-05, 2.2671185433864594e-05, 2.405419945716858e-05, 2.5437213480472565e-05, 2.682022750377655e-05, 2.8203241527080536e-05, 2.958625555038452e-05, 3.096926957368851e-05, 3.235228359699249e-05, 3.373529762029648e-05, 3.5118311643600464e-05, 3.650132566690445e-05, 3.7884339690208435e-05, 3.926735371351242e-05, 4.0650367736816406e-05]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 7.0, 8.0, 8.0, 11.0, 10.0, 46.0, 42.0, 38.0, 86.0, 107.0, 161.0, 197.0, 311.0, 485.0, 761.0, 1178.0, 1844.0, 3032.0, 9512.0, 13470.0, 27403.0, 60271.0, 148512.0, 360999.0, 244627.0, 92713.0, 39940.0, 19107.0, 9885.0, 5374.0, 3174.0, 2505.0, 859.0, 615.0, 396.0, 244.0, 188.0, 116.0, 94.0, 81.0, 38.0, 25.0, 22.0, 17.0, 12.0, 9.0, 4.0, 8.0, 2.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.814697265625e-06, -3.6908313632011414e-06, -3.5669654607772827e-06, -3.443099558353424e-06, -3.3192336559295654e-06, -3.1953677535057068e-06, -3.071501851081848e-06, -2.9476359486579895e-06, -2.823770046234131e-06, -2.6999041438102722e-06, -2.5760382413864136e-06, -2.452172338962555e-06, -2.3283064365386963e-06, -2.2044405341148376e-06, -2.080574631690979e-06, -1.9567087292671204e-06, -1.8328428268432617e-06, -1.708976924419403e-06, -1.5851110219955444e-06, -1.4612451195716858e-06, -1.3373792171478271e-06, -1.2135133147239685e-06, -1.0896474123001099e-06, -9.657815098762512e-07, -8.419156074523926e-07, -7.180497050285339e-07, -5.941838026046753e-07, -4.7031790018081665e-07, -3.46451997756958e-07, -2.2258609533309937e-07, -9.872019290924072e-08, 2.514570951461792e-08, 1.4901161193847656e-07, 2.728775143623352e-07, 3.9674341678619385e-07, 5.206093192100525e-07, 6.444752216339111e-07, 7.683411240577698e-07, 8.922070264816284e-07, 1.016072928905487e-06, 1.1399388313293457e-06, 1.2638047337532043e-06, 1.387670636177063e-06, 1.5115365386009216e-06, 1.6354024410247803e-06, 1.759268343448639e-06, 1.8831342458724976e-06, 2.007000148296356e-06, 2.130866050720215e-06, 2.2547319531440735e-06, 2.378597855567932e-06, 2.5024637579917908e-06, 2.6263296604156494e-06, 2.750195562839508e-06, 2.8740614652633667e-06, 2.9979273676872253e-06, 3.121793270111084e-06, 3.2456591725349426e-06, 3.3695250749588013e-06, 3.49339097738266e-06, 3.6172568798065186e-06, 3.741122782230377e-06, 3.864988684654236e-06, 3.9888545870780945e-06, 4.112720489501953e-06]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 6.0, 3.0, 4.0, 15.0, 6.0, 5.0, 11.0, 32.0, 16.0, 25.0, 22.0, 79.0, 38.0, 38.0, 38.0, 93.0, 35.0, 55.0, 92.0, 49.0, 42.0, 39.0, 54.0, 29.0, 26.0, 12.0, 40.0, 14.0, 12.0, 8.0, 27.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.368353307247162e-06, -2.292916178703308e-06, -2.2174790501594543e-06, -2.1420419216156006e-06, -2.066604793071747e-06, -1.991167664527893e-06, -1.9157305359840393e-06, -1.8402934074401855e-06, -1.7648562788963318e-06, -1.689419150352478e-06, -1.6139820218086243e-06, -1.5385448932647705e-06, -1.4631077647209167e-06, -1.387670636177063e-06, -1.3122335076332092e-06, -1.2367963790893555e-06, -1.1613592505455017e-06, -1.085922122001648e-06, -1.0104849934577942e-06, -9.350478649139404e-07, -8.596107363700867e-07, -7.841736078262329e-07, -7.087364792823792e-07, -6.332993507385254e-07, -5.578622221946716e-07, -4.824250936508179e-07, -4.069879651069641e-07, -3.3155083656311035e-07, -2.561137080192566e-07, -1.8067657947540283e-07, -1.0523945093154907e-07, -2.9802322387695312e-08, 4.563480615615845e-08, 1.210719347000122e-07, 1.9650906324386597e-07, 2.7194619178771973e-07, 3.473833203315735e-07, 4.2282044887542725e-07, 4.98257577419281e-07, 5.736947059631348e-07, 6.491318345069885e-07, 7.245689630508423e-07, 8.00006091594696e-07, 8.754432201385498e-07, 9.508803486824036e-07, 1.0263174772262573e-06, 1.101754605770111e-06, 1.1771917343139648e-06, 1.2526288628578186e-06, 1.3280659914016724e-06, 1.4035031199455261e-06, 1.4789402484893799e-06, 1.5543773770332336e-06, 1.6298145055770874e-06, 1.7052516341209412e-06, 1.780688762664795e-06, 1.8561258912086487e-06, 1.9315630197525024e-06, 2.007000148296356e-06, 2.08243727684021e-06, 2.1578744053840637e-06, 2.2333115339279175e-06, 2.3087486624717712e-06, 2.384185791015625e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 10.0, 5.0, 32.0, 29.0, 62.0, 53.0, 100.0, 181.0, 131.0, 340.0, 608.0, 487.0, 1377.0, 2475.0, 4243.0, 3379.0, 11117.0, 22026.0, 19408.0, 76743.0, 245333.0, 435784.0, 82081.0, 76309.0, 32424.0, 9049.0, 11172.0, 5995.0, 1818.0, 2396.0, 1367.0, 775.0, 268.0, 362.0, 253.0, 73.0, 103.0, 63.0, 12.0, 31.0, 22.0, 21.0, 7.0, 12.0, 9.0, 2.0, 3.0, 3.0, 3.0], "bins": [-3.6954879760742188e-06, -3.5939738154411316e-06, -3.4924596548080444e-06, -3.3909454941749573e-06, -3.28943133354187e-06, -3.187917172908783e-06, -3.086403012275696e-06, -2.9848888516426086e-06, -2.8833746910095215e-06, -2.7818605303764343e-06, -2.680346369743347e-06, -2.57883220911026e-06, -2.477318048477173e-06, -2.3758038878440857e-06, -2.2742897272109985e-06, -2.1727755665779114e-06, -2.0712614059448242e-06, -1.969747245311737e-06, -1.86823308467865e-06, -1.7667189240455627e-06, -1.6652047634124756e-06, -1.5636906027793884e-06, -1.4621764421463013e-06, -1.3606622815132141e-06, -1.259148120880127e-06, -1.1576339602470398e-06, -1.0561197996139526e-06, -9.546056389808655e-07, -8.530914783477783e-07, -7.515773177146912e-07, -6.50063157081604e-07, -5.485489964485168e-07, -4.470348358154297e-07, -3.4552067518234253e-07, -2.4400651454925537e-07, -1.424923539161682e-07, -4.0978193283081055e-08, 6.05359673500061e-08, 1.6205012798309326e-07, 2.635642886161804e-07, 3.650784492492676e-07, 4.6659260988235474e-07, 5.681067705154419e-07, 6.69620931148529e-07, 7.711350917816162e-07, 8.726492524147034e-07, 9.741634130477905e-07, 1.0756775736808777e-06, 1.1771917343139648e-06, 1.278705894947052e-06, 1.3802200555801392e-06, 1.4817342162132263e-06, 1.5832483768463135e-06, 1.6847625374794006e-06, 1.7862766981124878e-06, 1.887790858745575e-06, 1.989305019378662e-06, 2.0908191800117493e-06, 2.1923333406448364e-06, 2.2938475012779236e-06, 2.3953616619110107e-06, 2.496875822544098e-06, 2.598389983177185e-06, 2.6999041438102722e-06, 2.8014183044433594e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 2.0, 4.0, 6.0, 8.0, 7.0, 17.0, 10.0, 8.0, 26.0, 11.0, 21.0, 48.0, 28.0, 32.0, 68.0, 36.0, 42.0, 85.0, 48.0, 37.0, 82.0, 35.0, 41.0, 56.0, 29.0, 20.0, 49.0, 14.0, 15.0, 32.0, 11.0, 5.0, 24.0, 4.0, 3.0, 10.0, 2.0, 6.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2649765014648438e-06, -2.185814082622528e-06, -2.1066516637802124e-06, -2.0274892449378967e-06, -1.948326826095581e-06, -1.8691644072532654e-06, -1.7900019884109497e-06, -1.710839569568634e-06, -1.6316771507263184e-06, -1.5525147318840027e-06, -1.473352313041687e-06, -1.3941898941993713e-06, -1.3150274753570557e-06, -1.23586505651474e-06, -1.1567026376724243e-06, -1.0775402188301086e-06, -9.98377799987793e-07, -9.192153811454773e-07, -8.400529623031616e-07, -7.60890543460846e-07, -6.817281246185303e-07, -6.025657057762146e-07, -5.234032869338989e-07, -4.4424086809158325e-07, -3.650784492492676e-07, -2.859160304069519e-07, -2.0675361156463623e-07, -1.2759119272232056e-07, -4.842877388000488e-08, 3.073364496231079e-08, 1.0989606380462646e-07, 1.8905848264694214e-07, 2.682209014892578e-07, 3.473833203315735e-07, 4.2654573917388916e-07, 5.057081580162048e-07, 5.848705768585205e-07, 6.640329957008362e-07, 7.431954145431519e-07, 8.223578333854675e-07, 9.015202522277832e-07, 9.806826710700989e-07, 1.0598450899124146e-06, 1.1390075087547302e-06, 1.218169927597046e-06, 1.2973323464393616e-06, 1.3764947652816772e-06, 1.455657184123993e-06, 1.5348196029663086e-06, 1.6139820218086243e-06, 1.69314444065094e-06, 1.7723068594932556e-06, 1.8514692783355713e-06, 1.930631697177887e-06, 2.0097941160202026e-06, 2.0889565348625183e-06, 2.168118953704834e-06, 2.2472813725471497e-06, 2.3264437913894653e-06, 2.405606210231781e-06, 2.4847686290740967e-06, 2.5639310479164124e-06, 2.643093466758728e-06, 2.7222558856010437e-06, 2.8014183044433594e-06]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 5.0, 7.0, 7.0, 11.0, 32.0, 22.0, 48.0, 111.0, 196.0, 195.0, 100.0, 60.0, 52.0, 24.0, 26.0, 21.0, 21.0, 13.0, 14.0, 9.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015457380504813045, -0.0001453852019039914, -0.00013619661331176758, -0.00012700801016762853, -0.00011781940702348948, -0.00010863080387935042, -9.944220801116899e-05, -9.025361214298755e-05, -8.10650089988485e-05, -7.187640585470945e-05, -6.268780998652801e-05, -5.3499210480367765e-05, -4.431061097420752e-05, -3.5122011468047276e-05, -2.5933411961887032e-05, -1.6744816093705595e-05, -7.556212949566543e-06, 1.6323865565937012e-06, 1.0820986062753946e-05, 2.000958556891419e-05, 2.9198185075074434e-05, 3.838678458123468e-05, 4.757538408739492e-05, 5.676397995557636e-05, 6.595258309971541e-05, 7.514118624385446e-05, 8.43297821120359e-05, 9.351837798021734e-05, 0.00010270698112435639, 0.00011189558426849544, 0.00012108418013667688, 0.00013027277600485831, 0.00013946136459708214, 0.0001486499677412212, 0.00015783857088536024, 0.00016702715947758406, 0.00017621576262172312, 0.00018540436576586217, 0.000194592954358086, 0.00020378155750222504, 0.0002129701606463641, 0.00022215876379050314, 0.0002313473669346422, 0.00024053595552686602, 0.00024972454411908984, 0.0002589131472632289, 0.00026810175040736794, 0.000277290353551507, 0.00028647895669564605, 0.0002956675598397851, 0.00030485616298392415, 0.0003140447661280632, 0.00032323336927220225, 0.00033242194331251085, 0.0003416105464566499, 0.00035079914960078895, 0.000359987752744928, 0.00036917635588906705, 0.0003783649590332061, 0.00038755356217734516, 0.00039674213621765375, 0.0004059307393617928, 0.00041511934250593185, 0.0004243079456500709, 0.00043349654879420996]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 14.0, 13.0, 10.0, 21.0, 19.0, 17.0, 24.0, 27.0, 20.0, 28.0, 35.0, 40.0, 43.0, 40.0, 39.0, 50.0, 39.0, 55.0, 47.0, 39.0, 40.0, 37.0, 39.0, 40.0, 30.0, 26.0, 28.0, 19.0, 16.0, 16.0, 15.0, 13.0, 14.0, 7.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014698505401611328, -0.00014236848801374435, -0.00013775192201137543, -0.0001331353560090065, -0.00012851879000663757, -0.00012390222400426865, -0.00011928565800189972, -0.00011466909199953079, -0.00011005252599716187, -0.00010543595999479294, -0.00010081939399242401, -9.620282799005508e-05, -9.158626198768616e-05, -8.696969598531723e-05, -8.23531299829483e-05, -7.773656398057938e-05, -7.311999797821045e-05, -6.850343197584152e-05, -6.38868659734726e-05, -5.927029997110367e-05, -5.465373396873474e-05, -5.0037167966365814e-05, -4.542060196399689e-05, -4.080403596162796e-05, -3.618746995925903e-05, -3.1570903956890106e-05, -2.695433795452118e-05, -2.2337771952152252e-05, -1.7721205949783325e-05, -1.3104639947414398e-05, -8.488073945045471e-06, -3.871507942676544e-06, 7.450580596923828e-07, 5.36162406206131e-06, 9.978190064430237e-06, 1.4594756066799164e-05, 1.921132206916809e-05, 2.3827888071537018e-05, 2.8444454073905945e-05, 3.306102007627487e-05, 3.76775860786438e-05, 4.2294152081012726e-05, 4.691071808338165e-05, 5.152728408575058e-05, 5.614385008811951e-05, 6.0760416090488434e-05, 6.537698209285736e-05, 6.999354809522629e-05, 7.461011409759521e-05, 7.922668009996414e-05, 8.384324610233307e-05, 8.8459812104702e-05, 9.307637810707092e-05, 9.769294410943985e-05, 0.00010230951011180878, 0.0001069260761141777, 0.00011154264211654663, 0.00011615920811891556, 0.00012077577412128448, 0.0001253923401236534, 0.00013000890612602234, 0.00013462547212839127, 0.0001392420381307602, 0.00014385860413312912, 0.00014847517013549805]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 12.0, 10.0, 13.0, 25.0, 24.0, 42.0, 67.0, 87.0, 176.0, 232.0, 426.0, 594.0, 943.0, 1660.0, 2780.0, 4860.0, 9765.0, 20124.0, 51421.0, 2565571.0, 1442153.0, 51239.0, 21134.0, 9530.0, 4896.0, 2513.0, 1395.0, 883.0, 522.0, 302.0, 214.0, 165.0, 108.0, 84.0, 60.0, 44.0, 41.0, 30.0, 23.0, 16.0, 29.0, 11.0, 11.0, 9.0, 12.0, 5.0, 10.0, 3.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00010138750076293945, -9.748619049787521e-05, -9.358488023281097e-05, -8.968356996774673e-05, -8.57822597026825e-05, -8.188094943761826e-05, -7.797963917255402e-05, -7.407832890748978e-05, -7.017701864242554e-05, -6.62757083773613e-05, -6.237439811229706e-05, -5.847308784723282e-05, -5.457177758216858e-05, -5.067046731710434e-05, -4.67691570520401e-05, -4.286784678697586e-05, -3.896653652191162e-05, -3.506522625684738e-05, -3.116391599178314e-05, -2.7262605726718903e-05, -2.3361295461654663e-05, -1.9459985196590424e-05, -1.5558674931526184e-05, -1.1657364666461945e-05, -7.756054401397705e-06, -3.8547441363334656e-06, 4.6566128730773926e-08, 3.9478763937950134e-06, 7.849186658859253e-06, 1.1750496923923492e-05, 1.5651807188987732e-05, 1.955311745405197e-05, 2.345442771911621e-05, 2.735573798418045e-05, 3.125704824924469e-05, 3.515835851430893e-05, 3.905966877937317e-05, 4.296097904443741e-05, 4.686228930950165e-05, 5.076359957456589e-05, 5.466490983963013e-05, 5.8566220104694366e-05, 6.24675303697586e-05, 6.636884063482285e-05, 7.027015089988708e-05, 7.417146116495132e-05, 7.807277143001556e-05, 8.19740816950798e-05, 8.587539196014404e-05, 8.977670222520828e-05, 9.367801249027252e-05, 9.757932275533676e-05, 0.000101480633020401, 0.00010538194328546524, 0.00010928325355052948, 0.00011318456381559372, 0.00011708587408065796, 0.0001209871843457222, 0.00012488849461078644, 0.00012878980487585068, 0.00013269111514091492, 0.00013659242540597916, 0.0001404937356710434, 0.00014439504593610764, 0.00014829635620117188]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 6.0, 6.0, 9.0, 7.0, 11.0, 23.0, 22.0, 35.0, 46.0, 62.0, 58.0, 79.0, 83.0, 94.0, 91.0, 72.0, 70.0, 60.0, 53.0, 32.0, 26.0, 16.0, 7.0, 12.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2411346435546875e-05, -2.1529383957386017e-05, -2.064742147922516e-05, -1.97654590010643e-05, -1.8883496522903442e-05, -1.8001534044742584e-05, -1.7119571566581726e-05, -1.6237609088420868e-05, -1.535564661026001e-05, -1.4473684132099152e-05, -1.3591721653938293e-05, -1.2709759175777435e-05, -1.1827796697616577e-05, -1.0945834219455719e-05, -1.006387174129486e-05, -9.181909263134003e-06, -8.299946784973145e-06, -7.417984306812286e-06, -6.536021828651428e-06, -5.65405935049057e-06, -4.772096872329712e-06, -3.890134394168854e-06, -3.0081719160079956e-06, -2.1262094378471375e-06, -1.2442469596862793e-06, -3.6228448152542114e-07, 5.19677996635437e-07, 1.4016404747962952e-06, 2.2836029529571533e-06, 3.1655654311180115e-06, 4.04752790927887e-06, 4.929490387439728e-06, 5.811452865600586e-06, 6.693415343761444e-06, 7.575377821922302e-06, 8.45734030008316e-06, 9.339302778244019e-06, 1.0221265256404877e-05, 1.1103227734565735e-05, 1.1985190212726593e-05, 1.2867152690887451e-05, 1.374911516904831e-05, 1.4631077647209167e-05, 1.5513040125370026e-05, 1.6395002603530884e-05, 1.7276965081691742e-05, 1.81589275598526e-05, 1.9040890038013458e-05, 1.9922852516174316e-05, 2.0804814994335175e-05, 2.1686777472496033e-05, 2.256873995065689e-05, 2.345070242881775e-05, 2.4332664906978607e-05, 2.5214627385139465e-05, 2.6096589863300323e-05, 2.697855234146118e-05, 2.786051481962204e-05, 2.8742477297782898e-05, 2.9624439775943756e-05, 3.0506402254104614e-05, 3.138836473226547e-05, 3.227032721042633e-05, 3.315228968858719e-05, 3.403425216674805e-05]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 17.0, 12.0, 13.0, 26.0, 32.0, 46.0, 83.0, 86.0, 160.0, 225.0, 373.0, 544.0, 963.0, 1590.0, 2627.0, 4819.0, 8433.0, 16612.0, 33391.0, 85969.0, 1458321.0, 2415353.0, 93199.0, 34039.0, 16801.0, 8579.0, 4953.0, 2757.0, 1558.0, 971.0, 612.0, 348.0, 253.0, 162.0, 96.0, 82.0, 48.0, 27.0, 22.0, 22.0, 16.0, 10.0, 7.0, 2.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.790327072143555e-05, -7.561314851045609e-05, -7.332302629947662e-05, -7.103290408849716e-05, -6.87427818775177e-05, -6.645265966653824e-05, -6.416253745555878e-05, -6.187241524457932e-05, -5.9582293033599854e-05, -5.729217082262039e-05, -5.500204861164093e-05, -5.271192640066147e-05, -5.042180418968201e-05, -4.8131681978702545e-05, -4.5841559767723083e-05, -4.355143755674362e-05, -4.126131534576416e-05, -3.89711931347847e-05, -3.668107092380524e-05, -3.4390948712825775e-05, -3.2100826501846313e-05, -2.9810704290866852e-05, -2.752058207988739e-05, -2.523045986890793e-05, -2.2940337657928467e-05, -2.0650215446949005e-05, -1.8360093235969543e-05, -1.6069971024990082e-05, -1.377984881401062e-05, -1.1489726603031158e-05, -9.199604392051697e-06, -6.909482181072235e-06, -4.6193599700927734e-06, -2.3292377591133118e-06, -3.91155481338501e-08, 2.2510066628456116e-06, 4.541128873825073e-06, 6.831251084804535e-06, 9.121373295783997e-06, 1.1411495506763458e-05, 1.370161771774292e-05, 1.599173992872238e-05, 1.8281862139701843e-05, 2.0571984350681305e-05, 2.2862106561660767e-05, 2.5152228772640228e-05, 2.744235098361969e-05, 2.973247319459915e-05, 3.202259540557861e-05, 3.4312717616558075e-05, 3.660283982753754e-05, 3.8892962038517e-05, 4.118308424949646e-05, 4.347320646047592e-05, 4.576332867145538e-05, 4.8053450882434845e-05, 5.034357309341431e-05, 5.263369530439377e-05, 5.492381751537323e-05, 5.721393972635269e-05, 5.950406193733215e-05, 6.179418414831161e-05, 6.408430635929108e-05, 6.637442857027054e-05, 6.866455078125e-05]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 3.0, 11.0, 11.0, 8.0, 10.0, 15.0, 12.0, 17.0, 24.0, 25.0, 41.0, 75.0, 133.0, 515.0, 2267.0, 500.0, 128.0, 75.0, 40.0, 28.0, 29.0, 24.0, 22.0, 12.0, 19.0, 6.0, 5.0, 3.0, 4.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.340576171875e-05, -5.159713327884674e-05, -4.978850483894348e-05, -4.797987639904022e-05, -4.617124795913696e-05, -4.4362619519233704e-05, -4.2553991079330444e-05, -4.0745362639427185e-05, -3.8936734199523926e-05, -3.7128105759620667e-05, -3.531947731971741e-05, -3.351084887981415e-05, -3.170222043991089e-05, -2.989359200000763e-05, -2.808496356010437e-05, -2.627633512020111e-05, -2.446770668029785e-05, -2.2659078240394592e-05, -2.0850449800491333e-05, -1.9041821360588074e-05, -1.7233192920684814e-05, -1.5424564480781555e-05, -1.3615936040878296e-05, -1.1807307600975037e-05, -9.998679161071777e-06, -8.190050721168518e-06, -6.381422281265259e-06, -4.5727938413619995e-06, -2.7641654014587402e-06, -9.55536961555481e-07, 8.530914783477783e-07, 2.6617199182510376e-06, 4.470348358154297e-06, 6.278976798057556e-06, 8.087605237960815e-06, 9.896233677864075e-06, 1.1704862117767334e-05, 1.3513490557670593e-05, 1.5322118997573853e-05, 1.7130747437477112e-05, 1.893937587738037e-05, 2.074800431728363e-05, 2.255663275718689e-05, 2.436526119709015e-05, 2.6173889636993408e-05, 2.7982518076896667e-05, 2.9791146516799927e-05, 3.1599774956703186e-05, 3.3408403396606445e-05, 3.5217031836509705e-05, 3.7025660276412964e-05, 3.883428871631622e-05, 4.064291715621948e-05, 4.245154559612274e-05, 4.4260174036026e-05, 4.606880247592926e-05, 4.787743091583252e-05, 4.968605935573578e-05, 5.149468779563904e-05, 5.33033162355423e-05, 5.511194467544556e-05, 5.6920573115348816e-05, 5.8729201555252075e-05, 6.0537829995155334e-05, 6.23464584350586e-05]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 3.0, 9.0, 5.0, 12.0, 16.0, 26.0, 28.0, 28.0, 48.0, 59.0, 101.0, 102.0, 115.0, 94.0, 80.0, 60.0, 32.0, 40.0, 24.0, 23.0, 20.0, 15.0, 13.0, 12.0, 3.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013912879512645304, -0.00013305667380336672, -0.0001269845524802804, -0.00012091243115719408, -0.00011484030255815014, -0.00010876818123506382, -0.0001026960599119775, -9.662393131293356e-05, -9.055180998984724e-05, -8.447968866676092e-05, -7.84075673436746e-05, -7.233544602058828e-05, -6.626331742154434e-05, -6.019119609845802e-05, -5.41190747753717e-05, -4.804694981430657e-05, -4.197483212919906e-05, -3.5902710806112736e-05, -2.9830585845047608e-05, -2.3758464521961287e-05, -1.7686341379885562e-05, -1.1614218237809837e-05, -5.5420969147235155e-06, 5.300280463416129e-07, 6.602149369427934e-06, 1.267427251150366e-05, 1.8746395653579384e-05, 2.4818516976665705e-05, 3.089063829975203e-05, 3.6962763260817155e-05, 4.3034884583903477e-05, 4.9107009544968605e-05, 5.5179130868054926e-05, 6.125125219114125e-05, 6.732337351422757e-05, 7.339549483731389e-05, 7.946762343635783e-05, 8.553974475944415e-05, 9.161186608253047e-05, 9.76839946815744e-05, 0.00010375611600466073, 0.00010982823732774705, 0.00011590035865083337, 0.00012197247997391969, 0.000128044601297006, 0.00013411673717200756, 0.00014018884394317865, 0.0001462609798181802, 0.0001523330865893513, 0.00015840520791243762, 0.00016447732923552394, 0.00017054945055861026, 0.00017662157188169658, 0.00018269370775669813, 0.00018876581452786922, 0.00019483795040287077, 0.0002009100717259571, 0.00020698219304904342, 0.00021305431437212974, 0.00021912643569521606, 0.00022519855701830238, 0.0002312706783413887, 0.00023734281421639025, 0.00024341493553947657, 0.0002494870568625629]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 5.0, 5.0, 5.0, 6.0, 17.0, 13.0, 13.0, 14.0, 23.0, 22.0, 21.0, 20.0, 32.0, 34.0, 24.0, 33.0, 29.0, 23.0, 45.0, 34.0, 44.0, 47.0, 33.0, 32.0, 46.0, 39.0, 33.0, 27.0, 31.0, 20.0, 29.0, 28.0, 25.0, 22.0, 22.0, 16.0, 14.0, 12.0, 13.0, 9.0, 6.0, 8.0, 3.0, 5.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0001137852668762207, -0.00011046510189771652, -0.00010714493691921234, -0.00010382477194070816, -0.00010050460696220398, -9.71844419836998e-05, -9.386427700519562e-05, -9.054411202669144e-05, -8.722394704818726e-05, -8.390378206968307e-05, -8.05836170911789e-05, -7.726345211267471e-05, -7.394328713417053e-05, -7.062312215566635e-05, -6.730295717716217e-05, -6.398279219865799e-05, -6.066262722015381e-05, -5.734246224164963e-05, -5.402229726314545e-05, -5.0702132284641266e-05, -4.7381967306137085e-05, -4.4061802327632904e-05, -4.074163734912872e-05, -3.742147237062454e-05, -3.410130739212036e-05, -3.078114241361618e-05, -2.7460977435112e-05, -2.414081245660782e-05, -2.0820647478103638e-05, -1.7500482499599457e-05, -1.4180317521095276e-05, -1.0860152542591095e-05, -7.539987564086914e-06, -4.219822585582733e-06, -8.996576070785522e-07, 2.4205073714256287e-06, 5.7406723499298096e-06, 9.06083732843399e-06, 1.2381002306938171e-05, 1.5701167285442352e-05, 1.9021332263946533e-05, 2.2341497242450714e-05, 2.5661662220954895e-05, 2.8981827199459076e-05, 3.230199217796326e-05, 3.562215715646744e-05, 3.894232213497162e-05, 4.22624871134758e-05, 4.558265209197998e-05, 4.890281707048416e-05, 5.222298204898834e-05, 5.554314702749252e-05, 5.8863312005996704e-05, 6.218347698450089e-05, 6.550364196300507e-05, 6.882380694150925e-05, 7.214397192001343e-05, 7.546413689851761e-05, 7.878430187702179e-05, 8.210446685552597e-05, 8.542463183403015e-05, 8.874479681253433e-05, 9.206496179103851e-05, 9.53851267695427e-05, 9.870529174804688e-05]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 6.0, 12.0, 15.0, 19.0, 18.0, 24.0, 41.0, 56.0, 96.0, 116.0, 163.0, 310.0, 513.0, 932.0, 1835.0, 3679.0, 8588.0, 22451.0, 69593.0, 382859.0, 443871.0, 73136.0, 22894.0, 9081.0, 3857.0, 1862.0, 963.0, 553.0, 331.0, 200.0, 140.0, 98.0, 57.0, 45.0, 33.0, 24.0, 15.0, 18.0, 13.0, 7.0, 8.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00015366077423095703, -0.00014914385974407196, -0.0001446269452571869, -0.00014011003077030182, -0.00013559311628341675, -0.00013107620179653168, -0.0001265592873096466, -0.00012204237282276154, -0.00011752545833587646, -0.0001130085438489914, -0.00010849162936210632, -0.00010397471487522125, -9.945780038833618e-05, -9.494088590145111e-05, -9.042397141456604e-05, -8.590705692768097e-05, -8.13901424407959e-05, -7.687322795391083e-05, -7.235631346702576e-05, -6.783939898014069e-05, -6.332248449325562e-05, -5.8805570006370544e-05, -5.4288655519485474e-05, -4.97717410326004e-05, -4.525482654571533e-05, -4.073791205883026e-05, -3.622099757194519e-05, -3.170408308506012e-05, -2.718716859817505e-05, -2.2670254111289978e-05, -1.8153339624404907e-05, -1.3636425137519836e-05, -9.119510650634766e-06, -4.602596163749695e-06, -8.568167686462402e-08, 4.431232810020447e-06, 8.948147296905518e-06, 1.3465061783790588e-05, 1.798197627067566e-05, 2.249889075756073e-05, 2.70158052444458e-05, 3.153271973133087e-05, 3.604963421821594e-05, 4.056654870510101e-05, 4.5083463191986084e-05, 4.9600377678871155e-05, 5.4117292165756226e-05, 5.8634206652641296e-05, 6.315112113952637e-05, 6.766803562641144e-05, 7.218495011329651e-05, 7.670186460018158e-05, 8.121877908706665e-05, 8.573569357395172e-05, 9.025260806083679e-05, 9.476952254772186e-05, 9.928643703460693e-05, 0.000103803351521492, 0.00010832026600837708, 0.00011283718049526215, 0.00011735409498214722, 0.00012187100946903229, 0.00012638792395591736, 0.00013090483844280243, 0.0001354217529296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 7.0, 12.0, 14.0, 24.0, 35.0, 49.0, 60.0, 60.0, 97.0, 108.0, 110.0, 97.0, 80.0, 60.0, 45.0, 24.0, 38.0, 21.0, 17.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1219253540039062e-05, -2.0305626094341278e-05, -1.9391998648643494e-05, -1.847837120294571e-05, -1.7564743757247925e-05, -1.665111631155014e-05, -1.5737488865852356e-05, -1.4823861420154572e-05, -1.3910233974456787e-05, -1.2996606528759003e-05, -1.2082979083061218e-05, -1.1169351637363434e-05, -1.025572419166565e-05, -9.342096745967865e-06, -8.42846930027008e-06, -7.514841854572296e-06, -6.601214408874512e-06, -5.687586963176727e-06, -4.773959517478943e-06, -3.8603320717811584e-06, -2.946704626083374e-06, -2.0330771803855896e-06, -1.1194497346878052e-06, -2.0582228899002075e-07, 7.078051567077637e-07, 1.621432602405548e-06, 2.5350600481033325e-06, 3.448687493801117e-06, 4.362314939498901e-06, 5.275942385196686e-06, 6.18956983089447e-06, 7.103197276592255e-06, 8.016824722290039e-06, 8.930452167987823e-06, 9.844079613685608e-06, 1.0757707059383392e-05, 1.1671334505081177e-05, 1.2584961950778961e-05, 1.3498589396476746e-05, 1.441221684217453e-05, 1.5325844287872314e-05, 1.62394717335701e-05, 1.7153099179267883e-05, 1.8066726624965668e-05, 1.8980354070663452e-05, 1.9893981516361237e-05, 2.080760896205902e-05, 2.1721236407756805e-05, 2.263486385345459e-05, 2.3548491299152374e-05, 2.446211874485016e-05, 2.5375746190547943e-05, 2.6289373636245728e-05, 2.7203001081943512e-05, 2.8116628527641296e-05, 2.903025597333908e-05, 2.9943883419036865e-05, 3.085751086473465e-05, 3.1771138310432434e-05, 3.268476575613022e-05, 3.3598393201828e-05, 3.451202064752579e-05, 3.542564809322357e-05, 3.6339275538921356e-05, 3.725290298461914e-05]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 9.0, 10.0, 26.0, 21.0, 33.0, 60.0, 81.0, 127.0, 177.0, 245.0, 397.0, 553.0, 788.0, 1401.0, 1846.0, 3223.0, 4698.0, 7508.0, 12557.0, 19819.0, 34201.0, 56691.0, 108015.0, 333443.0, 235695.0, 97919.0, 50239.0, 30577.0, 17585.0, 10872.0, 7175.0, 4286.0, 2914.0, 1781.0, 1166.0, 845.0, 486.0, 359.0, 234.0, 154.0, 99.0, 80.0, 56.0, 31.0, 25.0, 14.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.589557647705078e-05, -4.4500455260276794e-05, -4.310533404350281e-05, -4.171021282672882e-05, -4.0315091609954834e-05, -3.891997039318085e-05, -3.752484917640686e-05, -3.6129727959632874e-05, -3.473460674285889e-05, -3.33394855260849e-05, -3.194436430931091e-05, -3.0549243092536926e-05, -2.915412187576294e-05, -2.7759000658988953e-05, -2.6363879442214966e-05, -2.496875822544098e-05, -2.3573637008666992e-05, -2.2178515791893005e-05, -2.078339457511902e-05, -1.9388273358345032e-05, -1.7993152141571045e-05, -1.6598030924797058e-05, -1.5202909708023071e-05, -1.3807788491249084e-05, -1.2412667274475098e-05, -1.101754605770111e-05, -9.622424840927124e-06, -8.227303624153137e-06, -6.83218240737915e-06, -5.4370611906051636e-06, -4.041939973831177e-06, -2.64681875705719e-06, -1.2516975402832031e-06, 1.434236764907837e-07, 1.5385448932647705e-06, 2.9336661100387573e-06, 4.328787326812744e-06, 5.723908543586731e-06, 7.119029760360718e-06, 8.514150977134705e-06, 9.909272193908691e-06, 1.1304393410682678e-05, 1.2699514627456665e-05, 1.4094635844230652e-05, 1.548975706100464e-05, 1.6884878277778625e-05, 1.8279999494552612e-05, 1.96751207113266e-05, 2.1070241928100586e-05, 2.2465363144874573e-05, 2.386048436164856e-05, 2.5255605578422546e-05, 2.6650726795196533e-05, 2.804584801197052e-05, 2.9440969228744507e-05, 3.0836090445518494e-05, 3.223121166229248e-05, 3.362633287906647e-05, 3.5021454095840454e-05, 3.641657531261444e-05, 3.781169652938843e-05, 3.9206817746162415e-05, 4.06019389629364e-05, 4.199706017971039e-05, 4.3392181396484375e-05]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 9.0, 10.0, 15.0, 21.0, 17.0, 18.0, 31.0, 25.0, 23.0, 31.0, 36.0, 38.0, 50.0, 46.0, 45.0, 52.0, 62.0, 48.0, 38.0, 36.0, 48.0, 36.0, 38.0, 35.0, 26.0, 26.0, 23.0, 16.0, 16.0, 16.0, 9.0, 9.0, 10.0, 9.0, 6.0, 3.0, 2.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.190206527709961e-05, -4.054047167301178e-05, -3.917887806892395e-05, -3.781728446483612e-05, -3.645569086074829e-05, -3.509409725666046e-05, -3.373250365257263e-05, -3.23709100484848e-05, -3.100931644439697e-05, -2.9647722840309143e-05, -2.8286129236221313e-05, -2.6924535632133484e-05, -2.5562942028045654e-05, -2.4201348423957825e-05, -2.2839754819869995e-05, -2.1478161215782166e-05, -2.0116567611694336e-05, -1.8754974007606506e-05, -1.7393380403518677e-05, -1.6031786799430847e-05, -1.4670193195343018e-05, -1.3308599591255188e-05, -1.1947005987167358e-05, -1.0585412383079529e-05, -9.2238187789917e-06, -7.86222517490387e-06, -6.50063157081604e-06, -5.1390379667282104e-06, -3.777444362640381e-06, -2.4158507585525513e-06, -1.0542571544647217e-06, 3.073364496231079e-07, 1.6689300537109375e-06, 3.030523657798767e-06, 4.392117261886597e-06, 5.753710865974426e-06, 7.115304470062256e-06, 8.476898074150085e-06, 9.838491678237915e-06, 1.1200085282325745e-05, 1.2561678886413574e-05, 1.3923272490501404e-05, 1.5284866094589233e-05, 1.6646459698677063e-05, 1.8008053302764893e-05, 1.9369646906852722e-05, 2.0731240510940552e-05, 2.209283411502838e-05, 2.345442771911621e-05, 2.481602132320404e-05, 2.617761492729187e-05, 2.75392085313797e-05, 2.890080213546753e-05, 3.026239573955536e-05, 3.162398934364319e-05, 3.298558294773102e-05, 3.434717655181885e-05, 3.570877015590668e-05, 3.707036375999451e-05, 3.8431957364082336e-05, 3.9793550968170166e-05, 4.1155144572257996e-05, 4.2516738176345825e-05, 4.3878331780433655e-05, 4.5239925384521484e-05]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 11.0, 17.0, 24.0, 44.0, 60.0, 95.0, 143.0, 456.0, 622.0, 1425.0, 2992.0, 7026.0, 18216.0, 50513.0, 147363.0, 590581.0, 147677.0, 50101.0, 18277.0, 7104.0, 2951.0, 1367.0, 614.0, 508.0, 150.0, 80.0, 36.0, 28.0, 26.0, 15.0, 10.0, 11.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.112720489501953e-06, -3.986060619354248e-06, -3.859400749206543e-06, -3.732740879058838e-06, -3.606081008911133e-06, -3.4794211387634277e-06, -3.3527612686157227e-06, -3.2261013984680176e-06, -3.0994415283203125e-06, -2.9727816581726074e-06, -2.8461217880249023e-06, -2.7194619178771973e-06, -2.592802047729492e-06, -2.466142177581787e-06, -2.339482307434082e-06, -2.212822437286377e-06, -2.086162567138672e-06, -1.959502696990967e-06, -1.8328428268432617e-06, -1.7061829566955566e-06, -1.5795230865478516e-06, -1.4528632164001465e-06, -1.3262033462524414e-06, -1.1995434761047363e-06, -1.0728836059570312e-06, -9.462237358093262e-07, -8.195638656616211e-07, -6.92903995513916e-07, -5.662441253662109e-07, -4.3958425521850586e-07, -3.129243850708008e-07, -1.862645149230957e-07, -5.960464477539063e-08, 6.705522537231445e-08, 1.9371509552001953e-07, 3.203749656677246e-07, 4.470348358154297e-07, 5.736947059631348e-07, 7.003545761108398e-07, 8.270144462585449e-07, 9.5367431640625e-07, 1.080334186553955e-06, 1.2069940567016602e-06, 1.3336539268493652e-06, 1.4603137969970703e-06, 1.5869736671447754e-06, 1.7136335372924805e-06, 1.8402934074401855e-06, 1.9669532775878906e-06, 2.0936131477355957e-06, 2.2202730178833008e-06, 2.346932888031006e-06, 2.473592758178711e-06, 2.600252628326416e-06, 2.726912498474121e-06, 2.853572368621826e-06, 2.9802322387695312e-06, 3.1068921089172363e-06, 3.2335519790649414e-06, 3.3602118492126465e-06, 3.4868717193603516e-06, 3.6135315895080566e-06, 3.7401914596557617e-06, 3.866851329803467e-06, 3.993511199951172e-06]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 0.0, 7.0, 16.0, 13.0, 30.0, 36.0, 28.0, 0.0, 42.0, 43.0, 47.0, 47.0, 71.0, 59.0, 0.0, 65.0, 66.0, 72.0, 36.0, 55.0, 47.0, 0.0, 26.0, 47.0, 31.0, 29.0, 21.0, 12.0, 0.0, 15.0, 11.0, 8.0, 4.0, 6.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8477439880371094e-06, -1.796521246433258e-06, -1.7452985048294067e-06, -1.6940757632255554e-06, -1.642853021621704e-06, -1.5916302800178528e-06, -1.5404075384140015e-06, -1.4891847968101501e-06, -1.4379620552062988e-06, -1.3867393136024475e-06, -1.3355165719985962e-06, -1.2842938303947449e-06, -1.2330710887908936e-06, -1.1818483471870422e-06, -1.130625605583191e-06, -1.0794028639793396e-06, -1.0281801223754883e-06, -9.76957380771637e-07, -9.257346391677856e-07, -8.745118975639343e-07, -8.23289155960083e-07, -7.720664143562317e-07, -7.208436727523804e-07, -6.69620931148529e-07, -6.183981895446777e-07, -5.671754479408264e-07, -5.159527063369751e-07, -4.647299647331238e-07, -4.1350722312927246e-07, -3.6228448152542114e-07, -3.110617399215698e-07, -2.598389983177185e-07, -2.086162567138672e-07, -1.5739351511001587e-07, -1.0617077350616455e-07, -5.494803190231323e-08, -3.725290298461914e-09, 4.7497451305389404e-08, 9.872019290924072e-08, 1.4994293451309204e-07, 2.0116567611694336e-07, 2.523884177207947e-07, 3.03611159324646e-07, 3.548339009284973e-07, 4.0605664253234863e-07, 4.5727938413619995e-07, 5.085021257400513e-07, 5.597248673439026e-07, 6.109476089477539e-07, 6.621703505516052e-07, 7.133930921554565e-07, 7.646158337593079e-07, 8.158385753631592e-07, 8.670613169670105e-07, 9.182840585708618e-07, 9.695068001747131e-07, 1.0207295417785645e-06, 1.0719522833824158e-06, 1.123175024986267e-06, 1.1743977665901184e-06, 1.2256205081939697e-06, 1.276843249797821e-06, 1.3280659914016724e-06, 1.3792887330055237e-06, 1.430511474609375e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 9.0, 41.0, 30.0, 44.0, 47.0, 64.0, 275.0, 209.0, 309.0, 424.0, 1487.0, 1357.0, 2198.0, 3456.0, 15547.0, 17854.0, 35047.0, 74792.0, 554161.0, 188162.0, 74620.0, 34950.0, 17869.0, 15524.0, 3525.0, 2125.0, 1384.0, 1575.0, 406.0, 296.0, 209.0, 274.0, 77.0, 54.0, 36.0, 40.0, 19.0, 5.0, 10.0, 4.0, 10.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.205371856689453e-06, -2.1317973732948303e-06, -2.0582228899002075e-06, -1.9846484065055847e-06, -1.911073923110962e-06, -1.8374994397163391e-06, -1.7639249563217163e-06, -1.6903504729270935e-06, -1.6167759895324707e-06, -1.543201506137848e-06, -1.469627022743225e-06, -1.3960525393486023e-06, -1.3224780559539795e-06, -1.2489035725593567e-06, -1.1753290891647339e-06, -1.101754605770111e-06, -1.0281801223754883e-06, -9.546056389808655e-07, -8.810311555862427e-07, -8.074566721916199e-07, -7.338821887969971e-07, -6.603077054023743e-07, -5.867332220077515e-07, -5.131587386131287e-07, -4.3958425521850586e-07, -3.6600977182388306e-07, -2.9243528842926025e-07, -2.1886080503463745e-07, -1.4528632164001465e-07, -7.171183824539185e-08, 1.862645149230957e-09, 7.543712854385376e-08, 1.4901161193847656e-07, 2.2258609533309937e-07, 2.9616057872772217e-07, 3.6973506212234497e-07, 4.4330954551696777e-07, 5.168840289115906e-07, 5.904585123062134e-07, 6.640329957008362e-07, 7.37607479095459e-07, 8.111819624900818e-07, 8.847564458847046e-07, 9.583309292793274e-07, 1.0319054126739502e-06, 1.105479896068573e-06, 1.1790543794631958e-06, 1.2526288628578186e-06, 1.3262033462524414e-06, 1.3997778296470642e-06, 1.473352313041687e-06, 1.5469267964363098e-06, 1.6205012798309326e-06, 1.6940757632255554e-06, 1.7676502466201782e-06, 1.841224730014801e-06, 1.914799213409424e-06, 1.9883736968040466e-06, 2.0619481801986694e-06, 2.1355226635932922e-06, 2.209097146987915e-06, 2.282671630382538e-06, 2.3562461137771606e-06, 2.4298205971717834e-06, 2.5033950805664062e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 5.0, 9.0, 7.0, 17.0, 23.0, 25.0, 74.0, 40.0, 45.0, 72.0, 60.0, 66.0, 63.0, 67.0, 80.0, 52.0, 104.0, 33.0, 36.0, 26.0, 16.0, 17.0, 11.0, 7.0, 5.0, 6.0, 4.0, 8.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4382025003433228e-06, -2.3730099201202393e-06, -2.3078173398971558e-06, -2.2426247596740723e-06, -2.1774321794509888e-06, -2.1122395992279053e-06, -2.0470470190048218e-06, -1.9818544387817383e-06, -1.9166618585586548e-06, -1.8514692783355713e-06, -1.7862766981124878e-06, -1.7210841178894043e-06, -1.6558915376663208e-06, -1.5906989574432373e-06, -1.5255063772201538e-06, -1.4603137969970703e-06, -1.3951212167739868e-06, -1.3299286365509033e-06, -1.2647360563278198e-06, -1.1995434761047363e-06, -1.1343508958816528e-06, -1.0691583156585693e-06, -1.0039657354354858e-06, -9.387731552124023e-07, -8.735805749893188e-07, -8.083879947662354e-07, -7.431954145431519e-07, -6.780028343200684e-07, -6.128102540969849e-07, -5.476176738739014e-07, -4.824250936508179e-07, -4.172325134277344e-07, -3.520399332046509e-07, -2.868473529815674e-07, -2.2165477275848389e-07, -1.564621925354004e-07, -9.12696123123169e-08, -2.60770320892334e-08, 3.91155481338501e-08, 1.043081283569336e-07, 1.695007085800171e-07, 2.3469328880310059e-07, 2.998858690261841e-07, 3.650784492492676e-07, 4.302710294723511e-07, 4.954636096954346e-07, 5.606561899185181e-07, 6.258487701416016e-07, 6.910413503646851e-07, 7.562339305877686e-07, 8.21426510810852e-07, 8.866190910339355e-07, 9.51811671257019e-07, 1.0170042514801025e-06, 1.082196831703186e-06, 1.1473894119262695e-06, 1.212581992149353e-06, 1.2777745723724365e-06, 1.34296715259552e-06, 1.4081597328186035e-06, 1.473352313041687e-06, 1.5385448932647705e-06, 1.603737473487854e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 5.0, 8.0, 8.0, 3.0, 3.0, 16.0, 16.0, 26.0, 30.0, 44.0, 89.0, 139.0, 171.0, 74.0, 71.0, 54.0, 56.0, 33.0, 23.0, 20.0, 16.0, 11.0, 16.0, 8.0, 15.0, 6.0, 8.0, 9.0, 4.0, 4.0, 6.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.648930088384077e-05, -8.113245712593198e-05, -7.577561336802319e-05, -7.04187696101144e-05, -6.506191857624799e-05, -5.9705078456318006e-05, -5.434823106043041e-05, -4.8991387302521616e-05, -4.3634543544612825e-05, -3.8277699786704034e-05, -3.292085602879524e-05, -2.7564008632907644e-05, -2.2207164874998853e-05, -1.685032111709006e-05, -1.1493473721202463e-05, -6.136629963293672e-06, -7.797862053848803e-07, 4.577058462018613e-06, 9.933903129422106e-06, 1.52907487063203e-05, 2.0647592464229092e-05, 2.6004436222137883e-05, 3.136128361802548e-05, 3.671812737593427e-05, 4.2074971133843064e-05, 4.7431814891751856e-05, 5.278865864966065e-05, 5.8145506045548245e-05, 6.350234616547823e-05, 6.885919719934464e-05, 7.421604095725343e-05, 7.957288471516222e-05, 8.49297211971134e-05, 9.028656495502219e-05, 9.564340871293098e-05, 0.00010100025974679738, 0.00010635709622874856, 0.00011171394726261497, 0.00011707079102052376, 0.00012242763477843255, 0.00012778447126038373, 0.00013314132229425013, 0.0001384981587762013, 0.0001438550098100677, 0.0001492118462920189, 0.0001545686973258853, 0.0001599255483597517, 0.00016528238484170288, 0.00017063923587556928, 0.0001759960869094357, 0.00018135292339138687, 0.00018670977442525327, 0.00019206661090720445, 0.00019742346194107085, 0.00020278029842302203, 0.00020813714945688844, 0.00021349400049075484, 0.00021885085152462125, 0.00022420768800657243, 0.00022956453904043883, 0.00023492137552239, 0.0002402782265562564, 0.0002456350775901228, 0.00025099189952015877, 0.0002563487505540252]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 8.0, 4.0, 9.0, 14.0, 12.0, 13.0, 22.0, 21.0, 20.0, 33.0, 24.0, 32.0, 33.0, 35.0, 37.0, 37.0, 42.0, 30.0, 42.0, 58.0, 35.0, 37.0, 31.0, 41.0, 37.0, 38.0, 33.0, 27.0, 22.0, 21.0, 21.0, 23.0, 23.0, 15.0, 11.0, 13.0, 10.0, 8.0, 10.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00011712312698364258, -0.00011355802416801453, -0.00010999292135238647, -0.00010642781853675842, -0.00010286271572113037, -9.929761290550232e-05, -9.573251008987427e-05, -9.216740727424622e-05, -8.860230445861816e-05, -8.503720164299011e-05, -8.147209882736206e-05, -7.790699601173401e-05, -7.434189319610596e-05, -7.07767903804779e-05, -6.721168756484985e-05, -6.36465847492218e-05, -6.008148193359375e-05, -5.65163791179657e-05, -5.2951276302337646e-05, -4.9386173486709595e-05, -4.582107067108154e-05, -4.225596785545349e-05, -3.869086503982544e-05, -3.512576222419739e-05, -3.1560659408569336e-05, -2.7995556592941284e-05, -2.4430453777313232e-05, -2.086535096168518e-05, -1.730024814605713e-05, -1.3735145330429077e-05, -1.0170042514801025e-05, -6.604939699172974e-06, -3.039836883544922e-06, 5.252659320831299e-07, 4.090368747711182e-06, 7.655471563339233e-06, 1.1220574378967285e-05, 1.4785677194595337e-05, 1.835078001022339e-05, 2.191588282585144e-05, 2.5480985641479492e-05, 2.9046088457107544e-05, 3.2611191272735596e-05, 3.617629408836365e-05, 3.97413969039917e-05, 4.330649971961975e-05, 4.68716025352478e-05, 5.0436705350875854e-05, 5.4001808166503906e-05, 5.756691098213196e-05, 6.113201379776001e-05, 6.469711661338806e-05, 6.826221942901611e-05, 7.182732224464417e-05, 7.539242506027222e-05, 7.895752787590027e-05, 8.252263069152832e-05, 8.608773350715637e-05, 8.965283632278442e-05, 9.321793913841248e-05, 9.678304195404053e-05, 0.00010034814476966858, 0.00010391324758529663, 0.00010747835040092468, 0.00011104345321655273]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 21.0, 19.0, 37.0, 68.0, 102.0, 165.0, 294.0, 526.0, 1011.0, 1987.0, 4285.0, 10209.0, 29917.0, 355076.0, 3721430.0, 42972.0, 13670.0, 5581.0, 2722.0, 1577.0, 911.0, 501.0, 387.0, 238.0, 150.0, 98.0, 82.0, 52.0, 47.0, 32.0, 19.0, 15.0, 12.0, 15.0, 11.0, 11.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010776519775390625, -0.00010289810597896576, -9.803101420402527e-05, -9.316392242908478e-05, -8.829683065414429e-05, -8.34297388792038e-05, -7.85626471042633e-05, -7.369555532932281e-05, -6.882846355438232e-05, -6.396137177944183e-05, -5.909428000450134e-05, -5.422718822956085e-05, -4.936009645462036e-05, -4.449300467967987e-05, -3.962591290473938e-05, -3.475882112979889e-05, -2.98917293548584e-05, -2.5024637579917908e-05, -2.0157545804977417e-05, -1.5290454030036926e-05, -1.0423362255096436e-05, -5.556270480155945e-06, -6.891787052154541e-07, 4.177913069725037e-06, 9.045004844665527e-06, 1.3912096619606018e-05, 1.877918839454651e-05, 2.3646280169487e-05, 2.851337194442749e-05, 3.338046371936798e-05, 3.824755549430847e-05, 4.311464726924896e-05, 4.798173904418945e-05, 5.2848830819129944e-05, 5.7715922594070435e-05, 6.258301436901093e-05, 6.745010614395142e-05, 7.23171979188919e-05, 7.71842896938324e-05, 8.205138146877289e-05, 8.691847324371338e-05, 9.178556501865387e-05, 9.665265679359436e-05, 0.00010151974856853485, 0.00010638684034347534, 0.00011125393211841583, 0.00011612102389335632, 0.00012098811566829681, 0.0001258552074432373, 0.0001307222992181778, 0.00013558939099311829, 0.00014045648276805878, 0.00014532357454299927, 0.00015019066631793976, 0.00015505775809288025, 0.00015992484986782074, 0.00016479194164276123, 0.00016965903341770172, 0.0001745261251926422, 0.0001793932169675827, 0.0001842603087425232, 0.00018912740051746368, 0.00019399449229240417, 0.00019886158406734467, 0.00020372867584228516]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 14.0, 14.0, 25.0, 45.0, 58.0, 53.0, 71.0, 84.0, 113.0, 106.0, 84.0, 76.0, 59.0, 50.0, 30.0, 25.0, 14.0, 16.0, 4.0, 9.0, 8.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.8263235688209534e-05, -1.7393380403518677e-05, -1.652352511882782e-05, -1.5653669834136963e-05, -1.4783814549446106e-05, -1.3913959264755249e-05, -1.3044103980064392e-05, -1.2174248695373535e-05, -1.1304393410682678e-05, -1.0434538125991821e-05, -9.564682841300964e-06, -8.694827556610107e-06, -7.82497227191925e-06, -6.9551169872283936e-06, -6.085261702537537e-06, -5.21540641784668e-06, -4.345551133155823e-06, -3.475695848464966e-06, -2.605840563774109e-06, -1.735985279083252e-06, -8.66129994392395e-07, 3.725290298461914e-09, 8.735805749893188e-07, 1.7434358596801758e-06, 2.6132911443710327e-06, 3.4831464290618896e-06, 4.353001713752747e-06, 5.2228569984436035e-06, 6.0927122831344604e-06, 6.962567567825317e-06, 7.832422852516174e-06, 8.702278137207031e-06, 9.572133421897888e-06, 1.0441988706588745e-05, 1.1311843991279602e-05, 1.2181699275970459e-05, 1.3051554560661316e-05, 1.3921409845352173e-05, 1.479126513004303e-05, 1.5661120414733887e-05, 1.6530975699424744e-05, 1.74008309841156e-05, 1.8270686268806458e-05, 1.9140541553497314e-05, 2.001039683818817e-05, 2.088025212287903e-05, 2.1750107407569885e-05, 2.2619962692260742e-05, 2.34898179769516e-05, 2.4359673261642456e-05, 2.5229528546333313e-05, 2.609938383102417e-05, 2.6969239115715027e-05, 2.7839094400405884e-05, 2.870894968509674e-05, 2.9578804969787598e-05, 3.0448660254478455e-05, 3.131851553916931e-05, 3.218837082386017e-05, 3.3058226108551025e-05, 3.392808139324188e-05, 3.479793667793274e-05, 3.5667791962623596e-05, 3.653764724731445e-05]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 6.0, 2.0, 8.0, 6.0, 9.0, 14.0, 36.0, 34.0, 56.0, 72.0, 120.0, 145.0, 228.0, 316.0, 443.0, 650.0, 956.0, 1324.0, 2024.0, 3162.0, 5193.0, 8321.0, 14004.0, 25436.0, 51961.0, 150882.0, 3249576.0, 508406.0, 85156.0, 36949.0, 19082.0, 10950.0, 6625.0, 4020.0, 2743.0, 1707.0, 1064.0, 799.0, 555.0, 406.0, 265.0, 176.0, 128.0, 91.0, 56.0, 39.0, 32.0, 18.0, 14.0, 6.0, 12.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.125999450683594e-05, -4.9593858420848846e-05, -4.7927722334861755e-05, -4.6261586248874664e-05, -4.459545016288757e-05, -4.292931407690048e-05, -4.126317799091339e-05, -3.95970419049263e-05, -3.793090581893921e-05, -3.626476973295212e-05, -3.459863364696503e-05, -3.2932497560977936e-05, -3.1266361474990845e-05, -2.9600225389003754e-05, -2.7934089303016663e-05, -2.626795321702957e-05, -2.460181713104248e-05, -2.293568104505539e-05, -2.12695449590683e-05, -1.9603408873081207e-05, -1.7937272787094116e-05, -1.6271136701107025e-05, -1.4605000615119934e-05, -1.2938864529132843e-05, -1.1272728443145752e-05, -9.606592357158661e-06, -7.94045627117157e-06, -6.274320185184479e-06, -4.608184099197388e-06, -2.9420480132102966e-06, -1.2759119272232056e-06, 3.902241587638855e-07, 2.0563602447509766e-06, 3.7224963307380676e-06, 5.388632416725159e-06, 7.05476850271225e-06, 8.72090458869934e-06, 1.0387040674686432e-05, 1.2053176760673523e-05, 1.3719312846660614e-05, 1.5385448932647705e-05, 1.7051585018634796e-05, 1.8717721104621887e-05, 2.0383857190608978e-05, 2.204999327659607e-05, 2.371612936258316e-05, 2.538226544857025e-05, 2.7048401534557343e-05, 2.8714537620544434e-05, 3.0380673706531525e-05, 3.2046809792518616e-05, 3.371294587850571e-05, 3.53790819644928e-05, 3.704521805047989e-05, 3.871135413646698e-05, 4.037749022245407e-05, 4.204362630844116e-05, 4.370976239442825e-05, 4.5375898480415344e-05, 4.7042034566402435e-05, 4.8708170652389526e-05, 5.037430673837662e-05, 5.204044282436371e-05, 5.37065789103508e-05, 5.537271499633789e-05]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 6.0, 8.0, 6.0, 5.0, 9.0, 11.0, 21.0, 19.0, 23.0, 26.0, 44.0, 34.0, 87.0, 170.0, 535.0, 1910.0, 618.0, 168.0, 102.0, 44.0, 39.0, 31.0, 30.0, 27.0, 15.0, 14.0, 13.0, 6.0, 4.0, 5.0, 4.0, 8.0, 3.0, 9.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07099723815918e-05, -3.933347761631012e-05, -3.795698285102844e-05, -3.6580488085746765e-05, -3.520399332046509e-05, -3.382749855518341e-05, -3.2451003789901733e-05, -3.1074509024620056e-05, -2.969801425933838e-05, -2.83215194940567e-05, -2.6945024728775024e-05, -2.5568529963493347e-05, -2.419203519821167e-05, -2.2815540432929993e-05, -2.1439045667648315e-05, -2.0062550902366638e-05, -1.868605613708496e-05, -1.7309561371803284e-05, -1.5933066606521606e-05, -1.455657184123993e-05, -1.3180077075958252e-05, -1.1803582310676575e-05, -1.0427087545394897e-05, -9.05059278011322e-06, -7.674098014831543e-06, -6.297603249549866e-06, -4.9211084842681885e-06, -3.5446137189865112e-06, -2.168118953704834e-06, -7.916241884231567e-07, 5.848705768585205e-07, 1.9613653421401978e-06, 3.337860107421875e-06, 4.714354872703552e-06, 6.0908496379852295e-06, 7.467344403266907e-06, 8.843839168548584e-06, 1.0220333933830261e-05, 1.1596828699111938e-05, 1.2973323464393616e-05, 1.4349818229675293e-05, 1.572631299495697e-05, 1.7102807760238647e-05, 1.8479302525520325e-05, 1.9855797290802002e-05, 2.123229205608368e-05, 2.2608786821365356e-05, 2.3985281586647034e-05, 2.536177635192871e-05, 2.6738271117210388e-05, 2.8114765882492065e-05, 2.9491260647773743e-05, 3.086775541305542e-05, 3.22442501783371e-05, 3.3620744943618774e-05, 3.499723970890045e-05, 3.637373447418213e-05, 3.7750229239463806e-05, 3.9126724004745483e-05, 4.050321877002716e-05, 4.187971353530884e-05, 4.3256208300590515e-05, 4.463270306587219e-05, 4.600919783115387e-05, 4.738569259643555e-05]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 9.0, 13.0, 11.0, 18.0, 14.0, 20.0, 46.0, 54.0, 70.0, 111.0, 146.0, 90.0, 90.0, 73.0, 39.0, 44.0, 38.0, 28.0, 16.0, 14.0, 15.0, 7.0, 6.0, 4.0, 3.0, 6.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019756786059588194, -0.00019064501975663006, -0.00018372216436546296, -0.00017679932352621108, -0.00016987646813504398, -0.0001629536272957921, -0.000156030771904625, -0.00014910793106537312, -0.00014218507567420602, -0.00013526223483495414, -0.00012833937944378704, -0.00012141653132857755, -0.00011449368321336806, -0.00010757084237411618, -0.00010064798698294908, -9.37251461436972e-05, -8.680229802848771e-05, -7.987944991327822e-05, -7.295660179806873e-05, -6.603375368285924e-05, -5.911090556764975e-05, -5.218806109041907e-05, -4.526521297520958e-05, -3.834236486000009e-05, -3.14195167447906e-05, -2.449666862958111e-05, -1.757382051437162e-05, -1.0650974218151532e-05, -3.728126102942042e-06, 3.1947201932780445e-06, 1.0117568308487535e-05, 1.7040416423697025e-05, 2.3963264538906515e-05, 3.0886112654116005e-05, 3.7808960769325495e-05, 4.4731808884534985e-05, 5.1654656999744475e-05, 5.857750147697516e-05, 6.550035323016346e-05, 7.242319406941533e-05, 7.934604946058244e-05, 8.626889757579193e-05, 9.319174569100142e-05, 0.0001001145938062109, 0.0001070374419214204, 0.00011396028276067227, 0.00012088313815183938, 0.00012780597899109125, 0.00013472881983034313, 0.000141651660669595, 0.0001485745160607621, 0.00015549735690001398, 0.0001624202122911811, 0.00016934305313043296, 0.00017626590852160007, 0.00018318874936085194, 0.00019011160475201905, 0.00019703444559127092, 0.00020395730098243803, 0.0002108801418216899, 0.000217802997212857, 0.00022472583805210888, 0.000231648693443276, 0.00023857153428252786, 0.00024549438967369497]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 14.0, 8.0, 8.0, 9.0, 13.0, 11.0, 17.0, 15.0, 23.0, 28.0, 20.0, 34.0, 30.0, 39.0, 40.0, 33.0, 32.0, 33.0, 34.0, 47.0, 46.0, 35.0, 43.0, 41.0, 37.0, 36.0, 36.0, 33.0, 28.0, 23.0, 16.0, 17.0, 20.0, 19.0, 21.0, 10.0, 18.0, 3.0, 11.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.00013452768325805664, -0.00013100076466798782, -0.000127473846077919, -0.0001239469274878502, -0.00012042000889778137, -0.00011689309030771255, -0.00011336617171764374, -0.00010983925312757492, -0.0001063123345375061, -0.00010278541594743729, -9.925849735736847e-05, -9.573157876729965e-05, -9.220466017723083e-05, -8.867774158716202e-05, -8.51508229970932e-05, -8.162390440702438e-05, -7.809698581695557e-05, -7.457006722688675e-05, -7.104314863681793e-05, -6.751623004674911e-05, -6.39893114566803e-05, -6.046239286661148e-05, -5.6935474276542664e-05, -5.3408555686473846e-05, -4.988163709640503e-05, -4.635471850633621e-05, -4.2827799916267395e-05, -3.930088132619858e-05, -3.577396273612976e-05, -3.2247044146060944e-05, -2.8720125555992126e-05, -2.519320696592331e-05, -2.1666288375854492e-05, -1.8139369785785675e-05, -1.4612451195716858e-05, -1.108553260564804e-05, -7.558614015579224e-06, -4.0316954255104065e-06, -5.047768354415894e-07, 3.0221417546272278e-06, 6.549060344696045e-06, 1.0075978934764862e-05, 1.360289752483368e-05, 1.7129816114902496e-05, 2.0656734704971313e-05, 2.418365329504013e-05, 2.7710571885108948e-05, 3.1237490475177765e-05, 3.476440906524658e-05, 3.82913276553154e-05, 4.1818246245384216e-05, 4.5345164835453033e-05, 4.887208342552185e-05, 5.239900201559067e-05, 5.5925920605659485e-05, 5.94528391957283e-05, 6.297975778579712e-05, 6.650667637586594e-05, 7.003359496593475e-05, 7.356051355600357e-05, 7.708743214607239e-05, 8.06143507361412e-05, 8.414126932621002e-05, 8.766818791627884e-05, 9.119510650634766e-05]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 9.0, 11.0, 13.0, 12.0, 15.0, 24.0, 28.0, 40.0, 55.0, 97.0, 183.0, 391.0, 849.0, 2020.0, 5575.0, 18366.0, 82317.0, 642870.0, 237714.0, 41091.0, 10650.0, 3597.0, 1341.0, 594.0, 286.0, 124.0, 74.0, 50.0, 39.0, 25.0, 16.0, 19.0, 15.0, 5.0, 5.0, 7.0, 4.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00024509429931640625, -0.00023783929646015167, -0.0002305842936038971, -0.00022332929074764252, -0.00021607428789138794, -0.00020881928503513336, -0.00020156428217887878, -0.0001943092793226242, -0.00018705427646636963, -0.00017979927361011505, -0.00017254427075386047, -0.0001652892678976059, -0.00015803426504135132, -0.00015077926218509674, -0.00014352425932884216, -0.00013626925647258759, -0.000129014253616333, -0.00012175925076007843, -0.00011450424790382385, -0.00010724924504756927, -9.99942421913147e-05, -9.273923933506012e-05, -8.548423647880554e-05, -7.822923362255096e-05, -7.097423076629639e-05, -6.371922791004181e-05, -5.646422505378723e-05, -4.9209222197532654e-05, -4.1954219341278076e-05, -3.46992164850235e-05, -2.744421362876892e-05, -2.0189210772514343e-05, -1.2934207916259766e-05, -5.679205060005188e-06, 1.5757977962493896e-06, 8.830800652503967e-06, 1.6085803508758545e-05, 2.3340806365013123e-05, 3.05958092212677e-05, 3.785081207752228e-05, 4.5105814933776855e-05, 5.236081779003143e-05, 5.961582064628601e-05, 6.687082350254059e-05, 7.412582635879517e-05, 8.138082921504974e-05, 8.863583207130432e-05, 9.58908349275589e-05, 0.00010314583778381348, 0.00011040084064006805, 0.00011765584349632263, 0.0001249108463525772, 0.0001321658492088318, 0.00013942085206508636, 0.00014667585492134094, 0.00015393085777759552, 0.0001611858606338501, 0.00016844086349010468, 0.00017569586634635925, 0.00018295086920261383, 0.0001902058720588684, 0.00019746087491512299, 0.00020471587777137756, 0.00021197088062763214, 0.00021922588348388672]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 9.0, 10.0, 13.0, 37.0, 45.0, 61.0, 80.0, 103.0, 97.0, 135.0, 106.0, 71.0, 65.0, 45.0, 49.0, 21.0, 17.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014636993408203e-05, -1.9038096070289612e-05, -1.7929822206497192e-05, -1.6821548342704773e-05, -1.5713274478912354e-05, -1.4605000615119934e-05, -1.3496726751327515e-05, -1.2388452887535095e-05, -1.1280179023742676e-05, -1.0171905159950256e-05, -9.063631296157837e-06, -7.955357432365417e-06, -6.847083568572998e-06, -5.738809704780579e-06, -4.630535840988159e-06, -3.5222619771957397e-06, -2.4139881134033203e-06, -1.3057142496109009e-06, -1.9744038581848145e-07, 9.10833477973938e-07, 2.0191073417663574e-06, 3.127381205558777e-06, 4.235655069351196e-06, 5.343928933143616e-06, 6.452202796936035e-06, 7.560476660728455e-06, 8.668750524520874e-06, 9.777024388313293e-06, 1.0885298252105713e-05, 1.1993572115898132e-05, 1.3101845979690552e-05, 1.4210119843482971e-05, 1.531839370727539e-05, 1.642666757106781e-05, 1.753494143486023e-05, 1.864321529865265e-05, 1.975148916244507e-05, 2.0859763026237488e-05, 2.1968036890029907e-05, 2.3076310753822327e-05, 2.4184584617614746e-05, 2.5292858481407166e-05, 2.6401132345199585e-05, 2.7509406208992004e-05, 2.8617680072784424e-05, 2.9725953936576843e-05, 3.083422780036926e-05, 3.194250166416168e-05, 3.30507755279541e-05, 3.415904939174652e-05, 3.526732325553894e-05, 3.637559711933136e-05, 3.748387098312378e-05, 3.85921448469162e-05, 3.970041871070862e-05, 4.080869257450104e-05, 4.191696643829346e-05, 4.3025240302085876e-05, 4.4133514165878296e-05, 4.5241788029670715e-05, 4.6350061893463135e-05, 4.7458335757255554e-05, 4.8566609621047974e-05, 4.967488348484039e-05, 5.078315734863281e-05]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 8.0, 23.0, 20.0, 31.0, 68.0, 77.0, 111.0, 185.0, 270.0, 405.0, 727.0, 1051.0, 1570.0, 2590.0, 4153.0, 7119.0, 11882.0, 21145.0, 36198.0, 66107.0, 137952.0, 384731.0, 186001.0, 81822.0, 44050.0, 24442.0, 14054.0, 8354.0, 5056.0, 3065.0, 1884.0, 1218.0, 772.0, 478.0, 295.0, 209.0, 142.0, 77.0, 72.0, 53.0, 24.0, 21.0, 13.0, 5.0, 9.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.4776668548583984e-05, -5.309935659170151e-05, -5.142204463481903e-05, -4.9744732677936554e-05, -4.806742072105408e-05, -4.63901087641716e-05, -4.4712796807289124e-05, -4.303548485040665e-05, -4.135817289352417e-05, -3.968086093664169e-05, -3.8003548979759216e-05, -3.632623702287674e-05, -3.464892506599426e-05, -3.2971613109111786e-05, -3.129430115222931e-05, -2.9616989195346832e-05, -2.7939677238464355e-05, -2.626236528158188e-05, -2.4585053324699402e-05, -2.2907741367816925e-05, -2.1230429410934448e-05, -1.955311745405197e-05, -1.7875805497169495e-05, -1.6198493540287018e-05, -1.4521181583404541e-05, -1.2843869626522064e-05, -1.1166557669639587e-05, -9.48924571275711e-06, -7.811933755874634e-06, -6.134621798992157e-06, -4.45730984210968e-06, -2.7799978852272034e-06, -1.1026859283447266e-06, 5.746260285377502e-07, 2.251937985420227e-06, 3.929249942302704e-06, 5.606561899185181e-06, 7.2838738560676575e-06, 8.961185812950134e-06, 1.0638497769832611e-05, 1.2315809726715088e-05, 1.3993121683597565e-05, 1.567043364048004e-05, 1.734774559736252e-05, 1.9025057554244995e-05, 2.0702369511127472e-05, 2.237968146800995e-05, 2.4056993424892426e-05, 2.5734305381774902e-05, 2.741161733865738e-05, 2.9088929295539856e-05, 3.076624125242233e-05, 3.244355320930481e-05, 3.4120865166187286e-05, 3.579817712306976e-05, 3.747548907995224e-05, 3.915280103683472e-05, 4.0830112993717194e-05, 4.250742495059967e-05, 4.418473690748215e-05, 4.5862048864364624e-05, 4.75393608212471e-05, 4.921667277812958e-05, 5.0893984735012054e-05, 5.257129669189453e-05]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 4.0, 12.0, 8.0, 14.0, 14.0, 15.0, 24.0, 27.0, 21.0, 17.0, 26.0, 41.0, 32.0, 41.0, 47.0, 45.0, 56.0, 38.0, 53.0, 41.0, 41.0, 39.0, 37.0, 35.0, 36.0, 33.0, 32.0, 29.0, 22.0, 23.0, 17.0, 16.0, 12.0, 6.0, 9.0, 15.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.70280647277832e-05, -4.557892680168152e-05, -4.4129788875579834e-05, -4.268065094947815e-05, -4.1231513023376465e-05, -3.978237509727478e-05, -3.8333237171173096e-05, -3.688409924507141e-05, -3.5434961318969727e-05, -3.398582339286804e-05, -3.253668546676636e-05, -3.108754754066467e-05, -2.9638409614562988e-05, -2.8189271688461304e-05, -2.674013376235962e-05, -2.5290995836257935e-05, -2.384185791015625e-05, -2.2392719984054565e-05, -2.094358205795288e-05, -1.9494444131851196e-05, -1.8045306205749512e-05, -1.6596168279647827e-05, -1.5147030353546143e-05, -1.3697892427444458e-05, -1.2248754501342773e-05, -1.0799616575241089e-05, -9.350478649139404e-06, -7.90134072303772e-06, -6.452202796936035e-06, -5.003064870834351e-06, -3.553926944732666e-06, -2.1047890186309814e-06, -6.556510925292969e-07, 7.934868335723877e-07, 2.2426247596740723e-06, 3.691762685775757e-06, 5.140900611877441e-06, 6.590038537979126e-06, 8.03917646408081e-06, 9.488314390182495e-06, 1.093745231628418e-05, 1.2386590242385864e-05, 1.3835728168487549e-05, 1.5284866094589233e-05, 1.6734004020690918e-05, 1.8183141946792603e-05, 1.9632279872894287e-05, 2.108141779899597e-05, 2.2530555725097656e-05, 2.397969365119934e-05, 2.5428831577301025e-05, 2.687796950340271e-05, 2.8327107429504395e-05, 2.977624535560608e-05, 3.1225383281707764e-05, 3.267452120780945e-05, 3.412365913391113e-05, 3.557279706001282e-05, 3.70219349861145e-05, 3.8471072912216187e-05, 3.992021083831787e-05, 4.1369348764419556e-05, 4.281848669052124e-05, 4.4267624616622925e-05, 4.571676254272461e-05]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 8.0, 7.0, 14.0, 18.0, 26.0, 51.0, 66.0, 103.0, 152.0, 377.0, 418.0, 658.0, 2132.0, 2824.0, 5055.0, 10234.0, 42557.0, 87182.0, 256258.0, 396045.0, 179577.0, 33860.0, 14723.0, 9355.0, 2821.0, 1518.0, 901.0, 799.0, 288.0, 177.0, 163.0, 57.0, 44.0, 22.0, 24.0, 10.0, 12.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.231929779052734e-06, -4.0959566831588745e-06, -3.959983587265015e-06, -3.824010491371155e-06, -3.688037395477295e-06, -3.552064299583435e-06, -3.416091203689575e-06, -3.2801181077957153e-06, -3.1441450119018555e-06, -3.0081719160079956e-06, -2.8721988201141357e-06, -2.736225724220276e-06, -2.600252628326416e-06, -2.464279532432556e-06, -2.3283064365386963e-06, -2.1923333406448364e-06, -2.0563602447509766e-06, -1.9203871488571167e-06, -1.7844140529632568e-06, -1.648440957069397e-06, -1.5124678611755371e-06, -1.3764947652816772e-06, -1.2405216693878174e-06, -1.1045485734939575e-06, -9.685754776000977e-07, -8.326023817062378e-07, -6.966292858123779e-07, -5.606561899185181e-07, -4.246830940246582e-07, -2.8870999813079834e-07, -1.5273690223693848e-07, -1.6763806343078613e-08, 1.1920928955078125e-07, 2.551823854446411e-07, 3.91155481338501e-07, 5.271285772323608e-07, 6.631016731262207e-07, 7.990747690200806e-07, 9.350478649139404e-07, 1.0710209608078003e-06, 1.2069940567016602e-06, 1.34296715259552e-06, 1.4789402484893799e-06, 1.6149133443832397e-06, 1.7508864402770996e-06, 1.8868595361709595e-06, 2.0228326320648193e-06, 2.158805727958679e-06, 2.294778823852539e-06, 2.430751919746399e-06, 2.566725015640259e-06, 2.7026981115341187e-06, 2.8386712074279785e-06, 2.9746443033218384e-06, 3.1106173992156982e-06, 3.246590495109558e-06, 3.382563591003418e-06, 3.518536686897278e-06, 3.6545097827911377e-06, 3.7904828786849976e-06, 3.926455974578857e-06, 4.062429070472717e-06, 4.198402166366577e-06, 4.334375262260437e-06, 4.470348358154297e-06]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 10.0, 7.0, 21.0, 21.0, 17.0, 28.0, 35.0, 54.0, 49.0, 42.0, 52.0, 55.0, 74.0, 74.0, 51.0, 52.0, 50.0, 35.0, 39.0, 50.0, 39.0, 29.0, 26.0, 14.0, 9.0, 9.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06, 1.9073486328125e-06, 1.9669532775878906e-06, 2.0265579223632812e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 18.0, 8.0, 5.0, 41.0, 22.0, 37.0, 89.0, 66.0, 74.0, 237.0, 197.0, 239.0, 732.0, 608.0, 797.0, 2391.0, 1874.0, 2973.0, 10560.0, 9417.0, 15075.0, 67640.0, 82066.0, 178500.0, 479568.0, 82246.0, 43191.0, 39384.0, 9593.0, 6287.0, 6984.0, 2053.0, 1475.0, 1815.0, 572.0, 422.0, 497.0, 180.0, 139.0, 169.0, 74.0, 54.0, 81.0, 19.0, 18.0, 39.0, 9.0, 3.0, 8.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.543441951274872e-06, -2.464279532432556e-06, -2.3851171135902405e-06, -2.305954694747925e-06, -2.226792275905609e-06, -2.1476298570632935e-06, -2.0684674382209778e-06, -1.989305019378662e-06, -1.9101426005363464e-06, -1.8309801816940308e-06, -1.751817762851715e-06, -1.6726553440093994e-06, -1.5934929251670837e-06, -1.514330506324768e-06, -1.4351680874824524e-06, -1.3560056686401367e-06, -1.276843249797821e-06, -1.1976808309555054e-06, -1.1185184121131897e-06, -1.039355993270874e-06, -9.601935744285583e-07, -8.810311555862427e-07, -8.01868736743927e-07, -7.227063179016113e-07, -6.435438990592957e-07, -5.6438148021698e-07, -4.852190613746643e-07, -4.0605664253234863e-07, -3.2689422369003296e-07, -2.477318048477173e-07, -1.685693860054016e-07, -8.940696716308594e-08, -1.0244548320770264e-08, 6.891787052154541e-08, 1.4808028936386108e-07, 2.2724270820617676e-07, 3.0640512704849243e-07, 3.855675458908081e-07, 4.647299647331238e-07, 5.438923835754395e-07, 6.230548024177551e-07, 7.022172212600708e-07, 7.813796401023865e-07, 8.605420589447021e-07, 9.397044777870178e-07, 1.0188668966293335e-06, 1.0980293154716492e-06, 1.1771917343139648e-06, 1.2563541531562805e-06, 1.3355165719985962e-06, 1.4146789908409119e-06, 1.4938414096832275e-06, 1.5730038285255432e-06, 1.6521662473678589e-06, 1.7313286662101746e-06, 1.8104910850524902e-06, 1.889653503894806e-06, 1.9688159227371216e-06, 2.0479783415794373e-06, 2.127140760421753e-06, 2.2063031792640686e-06, 2.2854655981063843e-06, 2.3646280169487e-06, 2.4437904357910156e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 14.0, 15.0, 7.0, 17.0, 12.0, 15.0, 37.0, 34.0, 42.0, 35.0, 26.0, 42.0, 48.0, 121.0, 47.0, 56.0, 47.0, 57.0, 51.0, 76.0, 27.0, 25.0, 17.0, 23.0, 18.0, 21.0, 4.0, 9.0, 10.0, 7.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.3245811462402344e-06, -2.255663275718689e-06, -2.1867454051971436e-06, -2.117827534675598e-06, -2.0489096641540527e-06, -1.9799917936325073e-06, -1.911073923110962e-06, -1.8421560525894165e-06, -1.773238182067871e-06, -1.7043203115463257e-06, -1.6354024410247803e-06, -1.5664845705032349e-06, -1.4975666999816895e-06, -1.428648829460144e-06, -1.3597309589385986e-06, -1.2908130884170532e-06, -1.2218952178955078e-06, -1.1529773473739624e-06, -1.084059476852417e-06, -1.0151416063308716e-06, -9.462237358093262e-07, -8.773058652877808e-07, -8.083879947662354e-07, -7.394701242446899e-07, -6.705522537231445e-07, -6.016343832015991e-07, -5.327165126800537e-07, -4.637986421585083e-07, -3.948807716369629e-07, -3.259629011154175e-07, -2.5704503059387207e-07, -1.8812716007232666e-07, -1.1920928955078125e-07, -5.029141902923584e-08, 1.862645149230957e-08, 8.754432201385498e-08, 1.564621925354004e-07, 2.253800630569458e-07, 2.942979335784912e-07, 3.632158041000366e-07, 4.3213367462158203e-07, 5.010515451431274e-07, 5.699694156646729e-07, 6.388872861862183e-07, 7.078051567077637e-07, 7.767230272293091e-07, 8.456408977508545e-07, 9.145587682723999e-07, 9.834766387939453e-07, 1.0523945093154907e-06, 1.1213123798370361e-06, 1.1902302503585815e-06, 1.259148120880127e-06, 1.3280659914016724e-06, 1.3969838619232178e-06, 1.4659017324447632e-06, 1.5348196029663086e-06, 1.603737473487854e-06, 1.6726553440093994e-06, 1.7415732145309448e-06, 1.8104910850524902e-06, 1.8794089555740356e-06, 1.948326826095581e-06, 2.0172446966171265e-06, 2.086162567138672e-06]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 4.0, 11.0, 7.0, 25.0, 33.0, 46.0, 63.0, 86.0, 221.0, 129.0, 83.0, 50.0, 45.0, 31.0, 33.0, 23.0, 28.0, 17.0, 9.0, 9.0, 8.0, 6.0, 5.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001194621654576622, -0.00011302295024506748, -0.00010658373503247276, -0.00010014451981987804, -9.370529733132571e-05, -8.726608211873099e-05, -8.082686690613627e-05, -7.438764441758394e-05, -6.794843648094684e-05, -6.150922126835212e-05, -5.5070002417778596e-05, -4.863078720518388e-05, -4.2191568354610354e-05, -3.5752353142015636e-05, -2.9313137929420918e-05, -2.2873919078847393e-05, -1.643470022827387e-05, -9.995483196689747e-06, -3.5562670746003278e-06, 2.8829490474890918e-06, 9.322166079073213e-06, 1.5761383110657334e-05, 2.2200598323252052e-05, 2.8639817173825577e-05, 3.5079032386420295e-05, 4.151824759901501e-05, 4.795746644958854e-05, 5.4396681662183255e-05, 6.083589687477797e-05, 6.72751193633303e-05, 7.371432729996741e-05, 8.015354978851974e-05, 8.659275772515684e-05, 9.303197293775156e-05, 9.947118815034628e-05, 0.00010591041063889861, 0.00011234962585149333, 0.00011878884106408805, 0.00012522804900072515, 0.00013166727148927748, 0.00013810649397782981, 0.00014454571646638215, 0.00015098492440301925, 0.00015742414689157158, 0.00016386335482820868, 0.00017030257731676102, 0.00017674179980531335, 0.00018318100774195045, 0.00018962021567858756, 0.0001960594381671399, 0.000202498646103777, 0.00020893786859232932, 0.00021537707652896643, 0.00022181629901751876, 0.0002282555215060711, 0.0002346947294427082, 0.00024113395193126053, 0.00024757315986789763, 0.00025401238235644996, 0.0002604516048450023, 0.0002668908273335546, 0.0002733300207182765, 0.00027976924320682883, 0.00028620846569538116, 0.0002926476881839335]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 4.0, 7.0, 6.0, 17.0, 12.0, 17.0, 16.0, 14.0, 26.0, 24.0, 31.0, 24.0, 29.0, 35.0, 22.0, 28.0, 37.0, 31.0, 48.0, 47.0, 34.0, 47.0, 33.0, 36.0, 43.0, 37.0, 37.0, 27.0, 33.0, 28.0, 27.0, 23.0, 20.0, 20.0, 17.0, 4.0, 14.0, 13.0, 7.0, 3.0, 5.0, 7.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012439489364624023, -0.00012074410915374756, -0.00011709332466125488, -0.00011344254016876221, -0.00010979175567626953, -0.00010614097118377686, -0.00010249018669128418, -9.88394021987915e-05, -9.518861770629883e-05, -9.153783321380615e-05, -8.788704872131348e-05, -8.42362642288208e-05, -8.058547973632812e-05, -7.693469524383545e-05, -7.328391075134277e-05, -6.96331262588501e-05, -6.598234176635742e-05, -6.233155727386475e-05, -5.868077278137207e-05, -5.5029988288879395e-05, -5.137920379638672e-05, -4.772841930389404e-05, -4.407763481140137e-05, -4.042685031890869e-05, -3.6776065826416016e-05, -3.312528133392334e-05, -2.9474496841430664e-05, -2.5823712348937988e-05, -2.2172927856445312e-05, -1.8522143363952637e-05, -1.4871358871459961e-05, -1.1220574378967285e-05, -7.569789886474609e-06, -3.919005393981934e-06, -2.682209014892578e-07, 3.382563591003418e-06, 7.033348083496094e-06, 1.068413257598877e-05, 1.4334917068481445e-05, 1.798570156097412e-05, 2.1636486053466797e-05, 2.5287270545959473e-05, 2.893805503845215e-05, 3.2588839530944824e-05, 3.62396240234375e-05, 3.9890408515930176e-05, 4.354119300842285e-05, 4.719197750091553e-05, 5.08427619934082e-05, 5.449354648590088e-05, 5.8144330978393555e-05, 6.179511547088623e-05, 6.54458999633789e-05, 6.909668445587158e-05, 7.274746894836426e-05, 7.639825344085693e-05, 8.004903793334961e-05, 8.369982242584229e-05, 8.735060691833496e-05, 9.100139141082764e-05, 9.465217590332031e-05, 9.830296039581299e-05, 0.00010195374488830566, 0.00010560452938079834, 0.00010925531387329102]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 5.0, 7.0, 13.0, 27.0, 32.0, 31.0, 80.0, 94.0, 180.0, 280.0, 434.0, 766.0, 1352.0, 2794.0, 6288.0, 16495.0, 88356.0, 3972089.0, 75706.0, 16540.0, 6225.0, 2759.0, 1512.0, 875.0, 448.0, 288.0, 172.0, 119.0, 86.0, 67.0, 41.0, 27.0, 27.0, 21.0, 13.0, 8.0, 0.0, 7.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011789798736572266, -0.00011360645294189453, -0.0001093149185180664, -0.00010502338409423828, -0.00010073184967041016, -9.644031524658203e-05, -9.21487808227539e-05, -8.785724639892578e-05, -8.356571197509766e-05, -7.927417755126953e-05, -7.49826431274414e-05, -7.069110870361328e-05, -6.639957427978516e-05, -6.210803985595703e-05, -5.7816505432128906e-05, -5.352497100830078e-05, -4.9233436584472656e-05, -4.494190216064453e-05, -4.0650367736816406e-05, -3.635883331298828e-05, -3.2067298889160156e-05, -2.777576446533203e-05, -2.3484230041503906e-05, -1.919269561767578e-05, -1.4901161193847656e-05, -1.0609626770019531e-05, -6.318092346191406e-06, -2.0265579223632812e-06, 2.2649765014648438e-06, 6.556510925292969e-06, 1.0848045349121094e-05, 1.5139579772949219e-05, 1.9431114196777344e-05, 2.372264862060547e-05, 2.8014183044433594e-05, 3.230571746826172e-05, 3.6597251892089844e-05, 4.088878631591797e-05, 4.5180320739746094e-05, 4.947185516357422e-05, 5.3763389587402344e-05, 5.805492401123047e-05, 6.23464584350586e-05, 6.663799285888672e-05, 7.092952728271484e-05, 7.522106170654297e-05, 7.95125961303711e-05, 8.380413055419922e-05, 8.809566497802734e-05, 9.238719940185547e-05, 9.66787338256836e-05, 0.00010097026824951172, 0.00010526180267333984, 0.00010955333709716797, 0.0001138448715209961, 0.00011813640594482422, 0.00012242794036865234, 0.00012671947479248047, 0.0001310110092163086, 0.00013530254364013672, 0.00013959407806396484, 0.00014388561248779297, 0.0001481771469116211, 0.00015246868133544922, 0.00015676021575927734]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 6.0, 9.0, 10.0, 21.0, 20.0, 21.0, 29.0, 54.0, 69.0, 82.0, 105.0, 93.0, 85.0, 88.0, 72.0, 60.0, 47.0, 38.0, 17.0, 17.0, 13.0, 12.0, 5.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5331974029541016e-05, -2.4422071874141693e-05, -2.351216971874237e-05, -2.2602267563343048e-05, -2.1692365407943726e-05, -2.0782463252544403e-05, -1.987256109714508e-05, -1.8962658941745758e-05, -1.8052756786346436e-05, -1.7142854630947113e-05, -1.623295247554779e-05, -1.5323050320148468e-05, -1.4413148164749146e-05, -1.3503246009349823e-05, -1.25933438539505e-05, -1.1683441698551178e-05, -1.0773539543151855e-05, -9.863637387752533e-06, -8.95373523235321e-06, -8.043833076953888e-06, -7.1339309215545654e-06, -6.224028766155243e-06, -5.31412661075592e-06, -4.404224455356598e-06, -3.4943222999572754e-06, -2.584420144557953e-06, -1.6745179891586304e-06, -7.646158337593079e-07, 1.4528632164001465e-07, 1.0551884770393372e-06, 1.9650906324386597e-06, 2.874992787837982e-06, 3.7848949432373047e-06, 4.694797098636627e-06, 5.60469925403595e-06, 6.514601409435272e-06, 7.424503564834595e-06, 8.334405720233917e-06, 9.24430787563324e-06, 1.0154210031032562e-05, 1.1064112186431885e-05, 1.1974014341831207e-05, 1.288391649723053e-05, 1.3793818652629852e-05, 1.4703720808029175e-05, 1.5613622963428497e-05, 1.652352511882782e-05, 1.7433427274227142e-05, 1.8343329429626465e-05, 1.9253231585025787e-05, 2.016313374042511e-05, 2.1073035895824432e-05, 2.1982938051223755e-05, 2.2892840206623077e-05, 2.38027423620224e-05, 2.4712644517421722e-05, 2.5622546672821045e-05, 2.6532448828220367e-05, 2.744235098361969e-05, 2.8352253139019012e-05, 2.9262155294418335e-05, 3.0172057449817657e-05, 3.108195960521698e-05, 3.19918617606163e-05, 3.2901763916015625e-05]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 14.0, 17.0, 23.0, 23.0, 46.0, 50.0, 82.0, 104.0, 132.0, 213.0, 270.0, 378.0, 613.0, 841.0, 1436.0, 2047.0, 3326.0, 5508.0, 9712.0, 18887.0, 37843.0, 96258.0, 836555.0, 2943664.0, 140601.0, 45404.0, 21401.0, 11399.0, 6605.0, 3786.0, 2324.0, 1467.0, 1029.0, 682.0, 480.0, 304.0, 206.0, 155.0, 113.0, 76.0, 66.0, 33.0, 27.0, 21.0, 16.0, 11.0, 7.0, 10.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.863739013671875e-05, -4.707463085651398e-05, -4.5511871576309204e-05, -4.394911229610443e-05, -4.238635301589966e-05, -4.0823593735694885e-05, -3.926083445549011e-05, -3.769807517528534e-05, -3.6135315895080566e-05, -3.4572556614875793e-05, -3.300979733467102e-05, -3.144703805446625e-05, -2.9884278774261475e-05, -2.83215194940567e-05, -2.675876021385193e-05, -2.5196000933647156e-05, -2.3633241653442383e-05, -2.207048237323761e-05, -2.0507723093032837e-05, -1.8944963812828064e-05, -1.738220453262329e-05, -1.5819445252418518e-05, -1.4256685972213745e-05, -1.2693926692008972e-05, -1.11311674118042e-05, -9.568408131599426e-06, -8.005648851394653e-06, -6.44288957118988e-06, -4.880130290985107e-06, -3.3173710107803345e-06, -1.7546117305755615e-06, -1.9185245037078857e-07, 1.3709068298339844e-06, 2.9336661100387573e-06, 4.49642539024353e-06, 6.059184670448303e-06, 7.621943950653076e-06, 9.184703230857849e-06, 1.0747462511062622e-05, 1.2310221791267395e-05, 1.3872981071472168e-05, 1.543574035167694e-05, 1.6998499631881714e-05, 1.8561258912086487e-05, 2.012401819229126e-05, 2.1686777472496033e-05, 2.3249536752700806e-05, 2.481229603290558e-05, 2.637505531311035e-05, 2.7937814593315125e-05, 2.9500573873519897e-05, 3.106333315372467e-05, 3.262609243392944e-05, 3.4188851714134216e-05, 3.575161099433899e-05, 3.731437027454376e-05, 3.8877129554748535e-05, 4.043988883495331e-05, 4.200264811515808e-05, 4.3565407395362854e-05, 4.512816667556763e-05, 4.66909259557724e-05, 4.825368523597717e-05, 4.9816444516181946e-05, 5.137920379638672e-05]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 11.0, 14.0, 21.0, 19.0, 33.0, 28.0, 33.0, 60.0, 88.0, 207.0, 732.0, 1810.0, 557.0, 170.0, 79.0, 42.0, 35.0, 25.0, 12.0, 20.0, 19.0, 14.0, 3.0, 12.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.537271499633789e-05, -5.371309816837311e-05, -5.2053481340408325e-05, -5.039386451244354e-05, -4.873424768447876e-05, -4.707463085651398e-05, -4.5415014028549194e-05, -4.375539720058441e-05, -4.209578037261963e-05, -4.0436163544654846e-05, -3.8776546716690063e-05, -3.711692988872528e-05, -3.54573130607605e-05, -3.3797696232795715e-05, -3.213807940483093e-05, -3.047846257686615e-05, -2.8818845748901367e-05, -2.7159228920936584e-05, -2.5499612092971802e-05, -2.383999526500702e-05, -2.2180378437042236e-05, -2.0520761609077454e-05, -1.886114478111267e-05, -1.7201527953147888e-05, -1.5541911125183105e-05, -1.3882294297218323e-05, -1.222267746925354e-05, -1.0563060641288757e-05, -8.903443813323975e-06, -7.243826985359192e-06, -5.584210157394409e-06, -3.9245933294296265e-06, -2.2649765014648438e-06, -6.05359673500061e-07, 1.0542571544647217e-06, 2.7138739824295044e-06, 4.373490810394287e-06, 6.03310763835907e-06, 7.692724466323853e-06, 9.352341294288635e-06, 1.1011958122253418e-05, 1.26715749502182e-05, 1.4331191778182983e-05, 1.5990808606147766e-05, 1.765042543411255e-05, 1.931004226207733e-05, 2.0969659090042114e-05, 2.2629275918006897e-05, 2.428889274597168e-05, 2.5948509573936462e-05, 2.7608126401901245e-05, 2.9267743229866028e-05, 3.092736005783081e-05, 3.258697688579559e-05, 3.4246593713760376e-05, 3.590621054172516e-05, 3.756582736968994e-05, 3.9225444197654724e-05, 4.088506102561951e-05, 4.254467785358429e-05, 4.420429468154907e-05, 4.5863911509513855e-05, 4.752352833747864e-05, 4.918314516544342e-05, 5.08427619934082e-05]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 8.0, 9.0, 7.0, 12.0, 14.0, 15.0, 23.0, 25.0, 35.0, 35.0, 40.0, 77.0, 77.0, 116.0, 80.0, 79.0, 49.0, 36.0, 39.0, 31.0, 18.0, 23.0, 19.0, 24.0, 15.0, 14.0, 11.0, 8.0, 10.0, 11.0, 5.0, 6.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.00016491103451699018, -0.00016014021821320057, -0.00015536940190941095, -0.00015059858560562134, -0.00014582776930183172, -0.0001410569529980421, -0.0001362861366942525, -0.00013151532039046288, -0.00012674450408667326, -0.00012197368778288364, -0.00011720287147909403, -0.00011243205517530441, -0.0001076612388715148, -0.00010289042256772518, -9.811961353989318e-05, -9.334879723610356e-05, -8.857798820827156e-05, -8.380717190448195e-05, -7.903635560069233e-05, -7.426553929690272e-05, -6.94947229931131e-05, -6.472390668932348e-05, -5.9953097661491483e-05, -5.518228135770187e-05, -5.041146505391225e-05, -4.5640648750122637e-05, -4.086983244633302e-05, -3.609901978052221e-05, -3.13282034767326e-05, -2.655738717294298e-05, -2.178657268814277e-05, -1.7015758203342557e-05, -1.224495645146817e-05, -7.474141057173256e-06, -2.703325662878342e-06, 2.067489731416572e-06, 6.838305125711486e-06, 1.1609121429501101e-05, 1.6379935914301313e-05, 2.1150750399101526e-05, 2.592156670289114e-05, 3.069238300668076e-05, 3.546319931047037e-05, 4.023401197628118e-05, 4.5004828280070797e-05, 4.977564458386041e-05, 5.454645724967122e-05, 5.9317273553460836e-05, 6.408808985725045e-05, 6.885890616104007e-05, 7.362972246482968e-05, 7.84005387686193e-05, 8.317135507240891e-05, 8.794217137619853e-05, 9.271298040403053e-05, 9.748379670782015e-05, 0.00010225461301160976, 0.00010702542931539938, 0.000111796245619189, 0.00011656706192297861, 0.00012133787095081061, 0.00012610868725460023, 0.00013087950355838984, 0.00013565031986217946, 0.00014042113616596907]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 2.0, 4.0, 1.0, 7.0, 12.0, 19.0, 8.0, 14.0, 16.0, 15.0, 20.0, 27.0, 24.0, 34.0, 25.0, 26.0, 36.0, 35.0, 33.0, 49.0, 31.0, 40.0, 42.0, 39.0, 36.0, 44.0, 33.0, 33.0, 33.0, 25.0, 35.0, 20.0, 35.0, 20.0, 20.0, 18.0, 23.0, 20.0, 16.0, 2.0, 8.0, 6.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010854005813598633, -0.00010499265044927597, -0.00010144524276256561, -9.789783507585526e-05, -9.43504273891449e-05, -9.080301970243454e-05, -8.725561201572418e-05, -8.370820432901382e-05, -8.016079664230347e-05, -7.661338895559311e-05, -7.306598126888275e-05, -6.95185735821724e-05, -6.597116589546204e-05, -6.242375820875168e-05, -5.887635052204132e-05, -5.532894283533096e-05, -5.1781535148620605e-05, -4.823412746191025e-05, -4.468671977519989e-05, -4.113931208848953e-05, -3.7591904401779175e-05, -3.404449671506882e-05, -3.049708902835846e-05, -2.6949681341648102e-05, -2.3402273654937744e-05, -1.9854865968227386e-05, -1.630745828151703e-05, -1.2760050594806671e-05, -9.212642908096313e-06, -5.665235221385956e-06, -2.117827534675598e-06, 1.4295801520347595e-06, 4.976987838745117e-06, 8.524395525455475e-06, 1.2071803212165833e-05, 1.561921089887619e-05, 1.9166618585586548e-05, 2.2714026272296906e-05, 2.6261433959007263e-05, 2.980884164571762e-05, 3.335624933242798e-05, 3.6903657019138336e-05, 4.0451064705848694e-05, 4.399847239255905e-05, 4.754588007926941e-05, 5.109328776597977e-05, 5.4640695452690125e-05, 5.818810313940048e-05, 6.173551082611084e-05, 6.52829185128212e-05, 6.883032619953156e-05, 7.237773388624191e-05, 7.592514157295227e-05, 7.947254925966263e-05, 8.301995694637299e-05, 8.656736463308334e-05, 9.01147723197937e-05, 9.366218000650406e-05, 9.720958769321442e-05, 0.00010075699537992477, 0.00010430440306663513, 0.00010785181075334549, 0.00011139921844005585, 0.0001149466261267662, 0.00011849403381347656]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 8.0, 8.0, 12.0, 13.0, 28.0, 35.0, 51.0, 70.0, 105.0, 144.0, 226.0, 396.0, 666.0, 1088.0, 2097.0, 3958.0, 8490.0, 19429.0, 50533.0, 163761.0, 571717.0, 145015.0, 45768.0, 18258.0, 7889.0, 3940.0, 1967.0, 1102.0, 649.0, 385.0, 245.0, 156.0, 96.0, 78.0, 43.0, 33.0, 26.0, 20.0, 12.0, 7.0, 12.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012373924255371094, -0.00011953897774219513, -0.00011533871293067932, -0.00011113844811916351, -0.0001069381833076477, -0.0001027379184961319, -9.853765368461609e-05, -9.433738887310028e-05, -9.013712406158447e-05, -8.593685925006866e-05, -8.173659443855286e-05, -7.753632962703705e-05, -7.333606481552124e-05, -6.913580000400543e-05, -6.493553519248962e-05, -6.0735270380973816e-05, -5.653500556945801e-05, -5.23347407579422e-05, -4.813447594642639e-05, -4.3934211134910583e-05, -3.9733946323394775e-05, -3.553368151187897e-05, -3.133341670036316e-05, -2.713315188884735e-05, -2.2932887077331543e-05, -1.8732622265815735e-05, -1.4532357454299927e-05, -1.0332092642784119e-05, -6.1318278312683105e-06, -1.9315630197525024e-06, 2.2687017917633057e-06, 6.468966603279114e-06, 1.0669231414794922e-05, 1.486949622631073e-05, 1.9069761037826538e-05, 2.3270025849342346e-05, 2.7470290660858154e-05, 3.167055547237396e-05, 3.587082028388977e-05, 4.007108509540558e-05, 4.427134990692139e-05, 4.8471614718437195e-05, 5.2671879529953e-05, 5.687214434146881e-05, 6.107240915298462e-05, 6.527267396450043e-05, 6.947293877601624e-05, 7.367320358753204e-05, 7.787346839904785e-05, 8.207373321056366e-05, 8.627399802207947e-05, 9.047426283359528e-05, 9.467452764511108e-05, 9.887479245662689e-05, 0.0001030750572681427, 0.00010727532207965851, 0.00011147558689117432, 0.00011567585170269012, 0.00011987611651420593, 0.00012407638132572174, 0.00012827664613723755, 0.00013247691094875336, 0.00013667717576026917, 0.00014087744057178497, 0.00014507770538330078]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 15.0, 14.0, 26.0, 29.0, 33.0, 46.0, 66.0, 72.0, 99.0, 86.0, 85.0, 97.0, 61.0, 57.0, 46.0, 37.0, 25.0, 29.0, 12.0, 16.0, 5.0, 10.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0444393157958984e-05, -1.9591301679611206e-05, -1.8738210201263428e-05, -1.788511872291565e-05, -1.703202724456787e-05, -1.6178935766220093e-05, -1.5325844287872314e-05, -1.4472752809524536e-05, -1.3619661331176758e-05, -1.276656985282898e-05, -1.1913478374481201e-05, -1.1060386896133423e-05, -1.0207295417785645e-05, -9.354203939437866e-06, -8.501112461090088e-06, -7.64802098274231e-06, -6.794929504394531e-06, -5.941838026046753e-06, -5.088746547698975e-06, -4.235655069351196e-06, -3.382563591003418e-06, -2.5294721126556396e-06, -1.6763806343078613e-06, -8.23289155960083e-07, 2.9802322387695312e-08, 8.828938007354736e-07, 1.735985279083252e-06, 2.5890767574310303e-06, 3.4421682357788086e-06, 4.295259714126587e-06, 5.148351192474365e-06, 6.0014426708221436e-06, 6.854534149169922e-06, 7.7076256275177e-06, 8.560717105865479e-06, 9.413808584213257e-06, 1.0266900062561035e-05, 1.1119991540908813e-05, 1.1973083019256592e-05, 1.282617449760437e-05, 1.3679265975952148e-05, 1.4532357454299927e-05, 1.5385448932647705e-05, 1.6238540410995483e-05, 1.7091631889343262e-05, 1.794472336769104e-05, 1.879781484603882e-05, 1.9650906324386597e-05, 2.0503997802734375e-05, 2.1357089281082153e-05, 2.221018075942993e-05, 2.306327223777771e-05, 2.3916363716125488e-05, 2.4769455194473267e-05, 2.5622546672821045e-05, 2.6475638151168823e-05, 2.73287296295166e-05, 2.818182110786438e-05, 2.9034912586212158e-05, 2.9888004064559937e-05, 3.0741095542907715e-05, 3.159418702125549e-05, 3.244727849960327e-05, 3.330036997795105e-05, 3.415346145629883e-05]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 5.0, 4.0, 23.0, 34.0, 49.0, 59.0, 96.0, 172.0, 197.0, 295.0, 484.0, 752.0, 1004.0, 1585.0, 2402.0, 3536.0, 5877.0, 9376.0, 14848.0, 26636.0, 43576.0, 82418.0, 176652.0, 363942.0, 144081.0, 71530.0, 38618.0, 23430.0, 13616.0, 8136.0, 5442.0, 3320.0, 2013.0, 1452.0, 952.0, 647.0, 446.0, 280.0, 167.0, 112.0, 84.0, 71.0, 42.0, 29.0, 20.0, 18.0, 13.0, 9.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-4.64320182800293e-05, -4.508160054683685e-05, -4.373118281364441e-05, -4.2380765080451965e-05, -4.103034734725952e-05, -3.967992961406708e-05, -3.8329511880874634e-05, -3.697909414768219e-05, -3.5628676414489746e-05, -3.42782586812973e-05, -3.292784094810486e-05, -3.1577423214912415e-05, -3.022700548171997e-05, -2.8876587748527527e-05, -2.7526170015335083e-05, -2.617575228214264e-05, -2.4825334548950195e-05, -2.347491681575775e-05, -2.2124499082565308e-05, -2.0774081349372864e-05, -1.942366361618042e-05, -1.8073245882987976e-05, -1.6722828149795532e-05, -1.537241041660309e-05, -1.4021992683410645e-05, -1.26715749502182e-05, -1.1321157217025757e-05, -9.970739483833313e-06, -8.620321750640869e-06, -7.269904017448425e-06, -5.9194862842559814e-06, -4.569068551063538e-06, -3.2186508178710938e-06, -1.86823308467865e-06, -5.178153514862061e-07, 8.326023817062378e-07, 2.1830201148986816e-06, 3.5334378480911255e-06, 4.883855581283569e-06, 6.234273314476013e-06, 7.584691047668457e-06, 8.935108780860901e-06, 1.0285526514053345e-05, 1.1635944247245789e-05, 1.2986361980438232e-05, 1.4336779713630676e-05, 1.568719744682312e-05, 1.7037615180015564e-05, 1.8388032913208008e-05, 1.973845064640045e-05, 2.1088868379592896e-05, 2.243928611278534e-05, 2.3789703845977783e-05, 2.5140121579170227e-05, 2.649053931236267e-05, 2.7840957045555115e-05, 2.919137477874756e-05, 3.054179251194e-05, 3.1892210245132446e-05, 3.324262797832489e-05, 3.4593045711517334e-05, 3.594346344470978e-05, 3.729388117790222e-05, 3.8644298911094666e-05, 3.999471664428711e-05]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 5.0, 4.0, 11.0, 13.0, 4.0, 13.0, 12.0, 13.0, 17.0, 24.0, 15.0, 33.0, 32.0, 29.0, 32.0, 30.0, 34.0, 38.0, 39.0, 39.0, 30.0, 30.0, 52.0, 45.0, 31.0, 35.0, 29.0, 30.0, 30.0, 30.0, 30.0, 29.0, 24.0, 23.0, 14.0, 14.0, 15.0, 11.0, 11.0, 8.0, 17.0, 3.0, 9.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.838539123535156e-05, -3.727339208126068e-05, -3.61613929271698e-05, -3.504939377307892e-05, -3.393739461898804e-05, -3.2825395464897156e-05, -3.1713396310806274e-05, -3.060139715671539e-05, -2.9489398002624512e-05, -2.837739884853363e-05, -2.726539969444275e-05, -2.6153400540351868e-05, -2.5041401386260986e-05, -2.3929402232170105e-05, -2.2817403078079224e-05, -2.1705403923988342e-05, -2.059340476989746e-05, -1.948140561580658e-05, -1.8369406461715698e-05, -1.7257407307624817e-05, -1.6145408153533936e-05, -1.5033408999443054e-05, -1.3921409845352173e-05, -1.2809410691261292e-05, -1.169741153717041e-05, -1.0585412383079529e-05, -9.473413228988647e-06, -8.361414074897766e-06, -7.249414920806885e-06, -6.137415766716003e-06, -5.025416612625122e-06, -3.913417458534241e-06, -2.8014183044433594e-06, -1.689419150352478e-06, -5.774199962615967e-07, 5.345791578292847e-07, 1.646578311920166e-06, 2.7585774660110474e-06, 3.870576620101929e-06, 4.98257577419281e-06, 6.094574928283691e-06, 7.206574082374573e-06, 8.318573236465454e-06, 9.430572390556335e-06, 1.0542571544647217e-05, 1.1654570698738098e-05, 1.276656985282898e-05, 1.387856900691986e-05, 1.4990568161010742e-05, 1.6102567315101624e-05, 1.7214566469192505e-05, 1.8326565623283386e-05, 1.9438564777374268e-05, 2.055056393146515e-05, 2.166256308555603e-05, 2.277456223964691e-05, 2.3886561393737793e-05, 2.4998560547828674e-05, 2.6110559701919556e-05, 2.7222558856010437e-05, 2.833455801010132e-05, 2.94465571641922e-05, 3.055855631828308e-05, 3.167055547237396e-05, 3.2782554626464844e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 9.0, 10.0, 10.0, 21.0, 17.0, 11.0, 33.0, 51.0, 71.0, 96.0, 115.0, 62.0, 207.0, 328.0, 476.0, 780.0, 1200.0, 891.0, 2697.0, 4878.0, 9598.0, 21267.0, 19633.0, 85639.0, 257672.0, 402511.0, 145741.0, 51543.0, 12612.0, 14235.0, 6740.0, 3610.0, 2130.0, 1308.0, 442.0, 672.0, 389.0, 256.0, 207.0, 130.0, 51.0, 66.0, 39.0, 36.0, 19.0, 17.0, 5.0, 9.0, 6.0, 3.0, 1.0, 3.0], "bins": [-4.0531158447265625e-06, -3.9441511034965515e-06, -3.8351863622665405e-06, -3.7262216210365295e-06, -3.6172568798065186e-06, -3.5082921385765076e-06, -3.3993273973464966e-06, -3.2903626561164856e-06, -3.1813979148864746e-06, -3.0724331736564636e-06, -2.9634684324264526e-06, -2.8545036911964417e-06, -2.7455389499664307e-06, -2.6365742087364197e-06, -2.5276094675064087e-06, -2.4186447262763977e-06, -2.3096799850463867e-06, -2.2007152438163757e-06, -2.0917505025863647e-06, -1.9827857613563538e-06, -1.8738210201263428e-06, -1.7648562788963318e-06, -1.6558915376663208e-06, -1.5469267964363098e-06, -1.4379620552062988e-06, -1.3289973139762878e-06, -1.2200325727462769e-06, -1.1110678315162659e-06, -1.0021030902862549e-06, -8.931383490562439e-07, -7.841736078262329e-07, -6.752088665962219e-07, -5.662441253662109e-07, -4.5727938413619995e-07, -3.4831464290618896e-07, -2.39349901676178e-07, -1.30385160446167e-07, -2.1420419216156006e-08, 8.754432201385498e-08, 1.9650906324386597e-07, 3.0547380447387695e-07, 4.1443854570388794e-07, 5.234032869338989e-07, 6.323680281639099e-07, 7.413327693939209e-07, 8.502975106239319e-07, 9.592622518539429e-07, 1.0682269930839539e-06, 1.1771917343139648e-06, 1.2861564755439758e-06, 1.3951212167739868e-06, 1.5040859580039978e-06, 1.6130506992340088e-06, 1.7220154404640198e-06, 1.8309801816940308e-06, 1.9399449229240417e-06, 2.0489096641540527e-06, 2.1578744053840637e-06, 2.2668391466140747e-06, 2.3758038878440857e-06, 2.4847686290740967e-06, 2.5937333703041077e-06, 2.7026981115341187e-06, 2.8116628527641296e-06, 2.9206275939941406e-06]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 12.0, 12.0, 19.0, 17.0, 0.0, 30.0, 24.0, 45.0, 26.0, 50.0, 0.0, 62.0, 73.0, 66.0, 88.0, 71.0, 0.0, 78.0, 50.0, 48.0, 52.0, 41.0, 25.0, 0.0, 39.0, 18.0, 22.0, 12.0, 10.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4398247003555298e-06, -1.389533281326294e-06, -1.339241862297058e-06, -1.2889504432678223e-06, -1.2386590242385864e-06, -1.1883676052093506e-06, -1.1380761861801147e-06, -1.087784767150879e-06, -1.037493348121643e-06, -9.872019290924072e-07, -9.369105100631714e-07, -8.866190910339355e-07, -8.363276720046997e-07, -7.860362529754639e-07, -7.35744833946228e-07, -6.854534149169922e-07, -6.351619958877563e-07, -5.848705768585205e-07, -5.345791578292847e-07, -4.842877388000488e-07, -4.33996319770813e-07, -3.8370490074157715e-07, -3.334134817123413e-07, -2.8312206268310547e-07, -2.3283064365386963e-07, -1.825392246246338e-07, -1.3224780559539795e-07, -8.195638656616211e-08, -3.166496753692627e-08, 1.862645149230957e-08, 6.891787052154541e-08, 1.1920928955078125e-07, 1.695007085800171e-07, 2.1979212760925293e-07, 2.7008354663848877e-07, 3.203749656677246e-07, 3.7066638469696045e-07, 4.209578037261963e-07, 4.7124922275543213e-07, 5.21540641784668e-07, 5.718320608139038e-07, 6.221234798431396e-07, 6.724148988723755e-07, 7.227063179016113e-07, 7.729977369308472e-07, 8.23289155960083e-07, 8.735805749893188e-07, 9.238719940185547e-07, 9.741634130477905e-07, 1.0244548320770264e-06, 1.0747462511062622e-06, 1.125037670135498e-06, 1.1753290891647339e-06, 1.2256205081939697e-06, 1.2759119272232056e-06, 1.3262033462524414e-06, 1.3764947652816772e-06, 1.426786184310913e-06, 1.477077603340149e-06, 1.5273690223693848e-06, 1.5776604413986206e-06, 1.6279518604278564e-06, 1.6782432794570923e-06, 1.7285346984863281e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 18.0, 13.0, 24.0, 14.0, 48.0, 36.0, 37.0, 119.0, 87.0, 226.0, 163.0, 469.0, 358.0, 1125.0, 854.0, 2848.0, 2430.0, 8586.0, 7918.0, 33532.0, 38569.0, 78099.0, 513890.0, 183738.0, 116426.0, 20973.0, 20296.0, 5287.0, 5816.0, 1668.0, 2118.0, 597.0, 888.0, 269.0, 363.0, 133.0, 181.0, 59.0, 50.0, 76.0, 19.0, 34.0, 18.0, 27.0, 9.0, 13.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.773478627204895e-06, -2.68593430519104e-06, -2.598389983177185e-06, -2.51084566116333e-06, -2.423301339149475e-06, -2.33575701713562e-06, -2.248212695121765e-06, -2.16066837310791e-06, -2.073124051094055e-06, -1.9855797290802e-06, -1.8980354070663452e-06, -1.8104910850524902e-06, -1.7229467630386353e-06, -1.6354024410247803e-06, -1.5478581190109253e-06, -1.4603137969970703e-06, -1.3727694749832153e-06, -1.2852251529693604e-06, -1.1976808309555054e-06, -1.1101365089416504e-06, -1.0225921869277954e-06, -9.350478649139404e-07, -8.475035429000854e-07, -7.599592208862305e-07, -6.724148988723755e-07, -5.848705768585205e-07, -4.973262548446655e-07, -4.0978193283081055e-07, -3.2223761081695557e-07, -2.3469328880310059e-07, -1.471489667892456e-07, -5.960464477539063e-08, 2.7939677238464355e-08, 1.1548399925231934e-07, 2.0302832126617432e-07, 2.905726432800293e-07, 3.781169652938843e-07, 4.6566128730773926e-07, 5.532056093215942e-07, 6.407499313354492e-07, 7.282942533493042e-07, 8.158385753631592e-07, 9.033828973770142e-07, 9.909272193908691e-07, 1.0784715414047241e-06, 1.166015863418579e-06, 1.253560185432434e-06, 1.341104507446289e-06, 1.428648829460144e-06, 1.516193151473999e-06, 1.603737473487854e-06, 1.691281795501709e-06, 1.778826117515564e-06, 1.866370439529419e-06, 1.953914761543274e-06, 2.041459083557129e-06, 2.129003405570984e-06, 2.216547727584839e-06, 2.304092049598694e-06, 2.391636371612549e-06, 2.479180693626404e-06, 2.566725015640259e-06, 2.6542693376541138e-06, 2.7418136596679688e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 10.0, 8.0, 7.0, 23.0, 11.0, 21.0, 32.0, 32.0, 31.0, 96.0, 57.0, 61.0, 112.0, 76.0, 69.0, 93.0, 48.0, 38.0, 39.0, 22.0, 18.0, 24.0, 10.0, 13.0, 16.0, 3.0, 1.0, 7.0, 3.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3646280169487e-06, -2.2854655981063843e-06, -2.2063031792640686e-06, -2.127140760421753e-06, -2.0479783415794373e-06, -1.9688159227371216e-06, -1.889653503894806e-06, -1.8104910850524902e-06, -1.7313286662101746e-06, -1.6521662473678589e-06, -1.5730038285255432e-06, -1.4938414096832275e-06, -1.4146789908409119e-06, -1.3355165719985962e-06, -1.2563541531562805e-06, -1.1771917343139648e-06, -1.0980293154716492e-06, -1.0188668966293335e-06, -9.397044777870178e-07, -8.605420589447021e-07, -7.813796401023865e-07, -7.022172212600708e-07, -6.230548024177551e-07, -5.438923835754395e-07, -4.647299647331238e-07, -3.855675458908081e-07, -3.0640512704849243e-07, -2.2724270820617676e-07, -1.4808028936386108e-07, -6.891787052154541e-08, 1.0244548320770264e-08, 8.940696716308594e-08, 1.685693860054016e-07, 2.477318048477173e-07, 3.2689422369003296e-07, 4.0605664253234863e-07, 4.852190613746643e-07, 5.6438148021698e-07, 6.435438990592957e-07, 7.227063179016113e-07, 8.01868736743927e-07, 8.810311555862427e-07, 9.601935744285583e-07, 1.039355993270874e-06, 1.1185184121131897e-06, 1.1976808309555054e-06, 1.276843249797821e-06, 1.3560056686401367e-06, 1.4351680874824524e-06, 1.514330506324768e-06, 1.5934929251670837e-06, 1.6726553440093994e-06, 1.751817762851715e-06, 1.8309801816940308e-06, 1.9101426005363464e-06, 1.989305019378662e-06, 2.0684674382209778e-06, 2.1476298570632935e-06, 2.226792275905609e-06, 2.305954694747925e-06, 2.3851171135902405e-06, 2.464279532432556e-06, 2.543441951274872e-06, 2.6226043701171875e-06]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 6.0, 7.0, 9.0, 14.0, 18.0, 34.0, 40.0, 79.0, 107.0, 185.0, 119.0, 85.0, 61.0, 43.0, 37.0, 27.0, 19.0, 21.0, 11.0, 13.0, 11.0, 10.0, 3.0, 6.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013186510477680713, -0.00012666518159676343, -0.00012146526569267735, -0.00011626534251263365, -0.00011106541933258995, -0.00010586550342850387, -0.00010066558024846017, -9.546565706841648e-05, -9.026573388837278e-05, -8.506581070832908e-05, -7.9865894804243e-05, -7.46659716241993e-05, -6.94660484441556e-05, -6.426613254006952e-05, -5.906620936002582e-05, -5.3866286179982126e-05, -4.866637027589604e-05, -4.346645073383115e-05, -3.8266527553787455e-05, -3.3066608011722565e-05, -2.786668665066827e-05, -2.2666765289613977e-05, -1.7466845747549087e-05, -1.226692256750539e-05, -7.067003025440499e-06, -1.8670821191335563e-06, 3.3328387871733867e-06, 8.532759238732979e-06, 1.3732680599787273e-05, 1.8932601960841566e-05, 2.4132521502906457e-05, 2.9332444682950154e-05, 3.4532364225015044e-05, 3.9732283767079934e-05, 4.493220694712363e-05, 5.013212648918852e-05, 5.533204966923222e-05, 6.053196921129711e-05, 6.5731888753362e-05, 7.09318119334057e-05, 7.61317351134494e-05, 8.133165829349309e-05, 8.653157419757918e-05, 9.173149737762287e-05, 9.693142055766657e-05, 0.00010213133646175265, 0.00010733125964179635, 0.00011253118282184005, 0.00011773109872592613, 0.00012293101463001221, 0.0001281309378100559, 0.0001333308609900996, 0.0001385307841701433, 0.000143730707350187, 0.00014893061597831547, 0.00015413053915835917, 0.00015933046233840287, 0.00016453038551844656, 0.00016973030869849026, 0.00017493023187853396, 0.00018013014050666243, 0.00018533006368670613, 0.00019052998686674982, 0.00019572991004679352, 0.00020092983322683722]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 9.0, 4.0, 4.0, 14.0, 6.0, 10.0, 10.0, 19.0, 17.0, 16.0, 21.0, 29.0, 22.0, 33.0, 43.0, 38.0, 40.0, 35.0, 35.0, 42.0, 43.0, 45.0, 49.0, 39.0, 35.0, 35.0, 23.0, 41.0, 35.0, 26.0, 20.0, 24.0, 30.0, 19.0, 21.0, 11.0, 9.0, 7.0, 14.0, 5.0, 12.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010758638381958008, -0.00010435003787279129, -0.0001011136919260025, -9.787734597921371e-05, -9.464100003242493e-05, -9.140465408563614e-05, -8.816830813884735e-05, -8.493196219205856e-05, -8.169561624526978e-05, -7.845927029848099e-05, -7.52229243516922e-05, -7.198657840490341e-05, -6.875023245811462e-05, -6.551388651132584e-05, -6.227754056453705e-05, -5.904119461774826e-05, -5.580484867095947e-05, -5.2568502724170685e-05, -4.93321567773819e-05, -4.609581083059311e-05, -4.285946488380432e-05, -3.9623118937015533e-05, -3.6386772990226746e-05, -3.315042704343796e-05, -2.991408109664917e-05, -2.6677735149860382e-05, -2.3441389203071594e-05, -2.0205043256282806e-05, -1.696869730949402e-05, -1.373235136270523e-05, -1.0496005415916443e-05, -7.259659469127655e-06, -4.023313522338867e-06, -7.869675755500793e-07, 2.4493783712387085e-06, 5.685724318027496e-06, 8.922070264816284e-06, 1.2158416211605072e-05, 1.539476215839386e-05, 1.8631108105182648e-05, 2.1867454051971436e-05, 2.5103799998760223e-05, 2.834014594554901e-05, 3.15764918923378e-05, 3.481283783912659e-05, 3.8049183785915375e-05, 4.128552973270416e-05, 4.452187567949295e-05, 4.775822162628174e-05, 5.0994567573070526e-05, 5.4230913519859314e-05, 5.74672594666481e-05, 6.070360541343689e-05, 6.393995136022568e-05, 6.717629730701447e-05, 7.041264325380325e-05, 7.364898920059204e-05, 7.688533514738083e-05, 8.012168109416962e-05, 8.33580270409584e-05, 8.659437298774719e-05, 8.983071893453598e-05, 9.306706488132477e-05, 9.630341082811356e-05, 9.953975677490234e-05]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 9.0, 11.0, 15.0, 31.0, 36.0, 47.0, 70.0, 88.0, 160.0, 180.0, 316.0, 497.0, 775.0, 1347.0, 2224.0, 4248.0, 8686.0, 22946.0, 106259.0, 3911052.0, 96137.0, 20645.0, 8419.0, 4050.0, 2159.0, 1301.0, 735.0, 496.0, 331.0, 256.0, 194.0, 114.0, 96.0, 64.0, 53.0, 32.0, 43.0, 29.0, 22.0, 20.0, 8.0, 13.0, 9.0, 11.0, 6.0, 6.0, 7.0, 6.0, 3.0, 6.0, 8.0, 3.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.285045623779297e-05, -7.916614413261414e-05, -7.54818320274353e-05, -7.179751992225647e-05, -6.811320781707764e-05, -6.44288957118988e-05, -6.074458360671997e-05, -5.706027150154114e-05, -5.3375959396362305e-05, -4.969164729118347e-05, -4.600733518600464e-05, -4.2323023080825806e-05, -3.863871097564697e-05, -3.495439887046814e-05, -3.127008676528931e-05, -2.7585774660110474e-05, -2.390146255493164e-05, -2.0217150449752808e-05, -1.6532838344573975e-05, -1.2848526239395142e-05, -9.164214134216309e-06, -5.479902029037476e-06, -1.7955899238586426e-06, 1.8887221813201904e-06, 5.5730342864990234e-06, 9.257346391677856e-06, 1.294165849685669e-05, 1.6625970602035522e-05, 2.0310282707214355e-05, 2.399459481239319e-05, 2.767890691757202e-05, 3.1363219022750854e-05, 3.504753112792969e-05, 3.873184323310852e-05, 4.2416155338287354e-05, 4.6100467443466187e-05, 4.978477954864502e-05, 5.346909165382385e-05, 5.7153403759002686e-05, 6.083771586418152e-05, 6.452202796936035e-05, 6.820634007453918e-05, 7.189065217971802e-05, 7.557496428489685e-05, 7.925927639007568e-05, 8.294358849525452e-05, 8.662790060043335e-05, 9.031221270561218e-05, 9.399652481079102e-05, 9.768083691596985e-05, 0.00010136514902114868, 0.00010504946112632751, 0.00010873377323150635, 0.00011241808533668518, 0.00011610239744186401, 0.00011978670954704285, 0.00012347102165222168, 0.0001271553337574005, 0.00013083964586257935, 0.00013452395796775818, 0.000138208270072937, 0.00014189258217811584, 0.00014557689428329468, 0.0001492612063884735, 0.00015294551849365234]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 17.0, 20.0, 25.0, 29.0, 59.0, 65.0, 92.0, 118.0, 102.0, 76.0, 98.0, 78.0, 47.0, 54.0, 21.0, 24.0, 12.0, 9.0, 4.0, 7.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.205371856689453e-05, -2.1078623831272125e-05, -2.010352909564972e-05, -1.9128434360027313e-05, -1.8153339624404907e-05, -1.71782448887825e-05, -1.6203150153160095e-05, -1.522805541753769e-05, -1.4252960681915283e-05, -1.3277865946292877e-05, -1.2302771210670471e-05, -1.1327676475048065e-05, -1.035258173942566e-05, -9.377487003803253e-06, -8.402392268180847e-06, -7.427297532558441e-06, -6.452202796936035e-06, -5.477108061313629e-06, -4.502013325691223e-06, -3.526918590068817e-06, -2.551823854446411e-06, -1.5767291188240051e-06, -6.016343832015991e-07, 3.734603524208069e-07, 1.3485550880432129e-06, 2.323649823665619e-06, 3.298744559288025e-06, 4.273839294910431e-06, 5.248934030532837e-06, 6.224028766155243e-06, 7.199123501777649e-06, 8.174218237400055e-06, 9.149312973022461e-06, 1.0124407708644867e-05, 1.1099502444267273e-05, 1.2074597179889679e-05, 1.3049691915512085e-05, 1.4024786651134491e-05, 1.4999881386756897e-05, 1.5974976122379303e-05, 1.695007085800171e-05, 1.7925165593624115e-05, 1.890026032924652e-05, 1.9875355064868927e-05, 2.0850449800491333e-05, 2.182554453611374e-05, 2.2800639271736145e-05, 2.377573400735855e-05, 2.4750828742980957e-05, 2.5725923478603363e-05, 2.670101821422577e-05, 2.7676112949848175e-05, 2.865120768547058e-05, 2.9626302421092987e-05, 3.060139715671539e-05, 3.15764918923378e-05, 3.2551586627960205e-05, 3.352668136358261e-05, 3.450177609920502e-05, 3.547687083482742e-05, 3.645196557044983e-05, 3.7427060306072235e-05, 3.840215504169464e-05, 3.937724977731705e-05, 4.035234451293945e-05]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 13.0, 19.0, 32.0, 48.0, 67.0, 103.0, 129.0, 187.0, 314.0, 465.0, 728.0, 986.0, 1515.0, 2483.0, 3768.0, 7288.0, 13704.0, 28416.0, 65396.0, 314310.0, 3452932.0, 194564.0, 53040.0, 24440.0, 12181.0, 6421.0, 3919.0, 2462.0, 1554.0, 915.0, 634.0, 429.0, 277.0, 180.0, 110.0, 82.0, 54.0, 31.0, 18.0, 20.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 3.0], "bins": [-6.401538848876953e-05, -6.230361759662628e-05, -6.059184670448303e-05, -5.888007581233978e-05, -5.716830492019653e-05, -5.5456534028053284e-05, -5.3744763135910034e-05, -5.2032992243766785e-05, -5.0321221351623535e-05, -4.8609450459480286e-05, -4.6897679567337036e-05, -4.518590867519379e-05, -4.347413778305054e-05, -4.176236689090729e-05, -4.005059599876404e-05, -3.833882510662079e-05, -3.662705421447754e-05, -3.491528332233429e-05, -3.320351243019104e-05, -3.149174153804779e-05, -2.977997064590454e-05, -2.806819975376129e-05, -2.6356428861618042e-05, -2.4644657969474792e-05, -2.2932887077331543e-05, -2.1221116185188293e-05, -1.9509345293045044e-05, -1.7797574400901794e-05, -1.6085803508758545e-05, -1.4374032616615295e-05, -1.2662261724472046e-05, -1.0950490832328796e-05, -9.238719940185547e-06, -7.526949048042297e-06, -5.815178155899048e-06, -4.103407263755798e-06, -2.391636371612549e-06, -6.798654794692993e-07, 1.0319054126739502e-06, 2.7436763048171997e-06, 4.455447196960449e-06, 6.167218089103699e-06, 7.878988981246948e-06, 9.590759873390198e-06, 1.1302530765533447e-05, 1.3014301657676697e-05, 1.4726072549819946e-05, 1.6437843441963196e-05, 1.8149614334106445e-05, 1.9861385226249695e-05, 2.1573156118392944e-05, 2.3284927010536194e-05, 2.4996697902679443e-05, 2.6708468794822693e-05, 2.8420239686965942e-05, 3.0132010579109192e-05, 3.184378147125244e-05, 3.355555236339569e-05, 3.526732325553894e-05, 3.697909414768219e-05, 3.869086503982544e-05, 4.040263593196869e-05, 4.211440682411194e-05, 4.382617771625519e-05, 4.553794860839844e-05]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 12.0, 16.0, 29.0, 30.0, 39.0, 43.0, 72.0, 135.0, 465.0, 1648.0, 911.0, 276.0, 95.0, 56.0, 49.0, 27.0, 25.0, 21.0, 23.0, 16.0, 9.0, 9.0, 5.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.412101745605469e-05, -5.256384611129761e-05, -5.100667476654053e-05, -4.944950342178345e-05, -4.789233207702637e-05, -4.633516073226929e-05, -4.477798938751221e-05, -4.322081804275513e-05, -4.166364669799805e-05, -4.010647535324097e-05, -3.854930400848389e-05, -3.699213266372681e-05, -3.5434961318969727e-05, -3.3877789974212646e-05, -3.2320618629455566e-05, -3.0763447284698486e-05, -2.9206275939941406e-05, -2.7649104595184326e-05, -2.6091933250427246e-05, -2.4534761905670166e-05, -2.2977590560913086e-05, -2.1420419216156006e-05, -1.9863247871398926e-05, -1.8306076526641846e-05, -1.6748905181884766e-05, -1.5191733837127686e-05, -1.3634562492370605e-05, -1.2077391147613525e-05, -1.0520219802856445e-05, -8.963048458099365e-06, -7.405877113342285e-06, -5.848705768585205e-06, -4.291534423828125e-06, -2.734363079071045e-06, -1.1771917343139648e-06, 3.7997961044311523e-07, 1.9371509552001953e-06, 3.4943222999572754e-06, 5.0514936447143555e-06, 6.6086649894714355e-06, 8.165836334228516e-06, 9.723007678985596e-06, 1.1280179023742676e-05, 1.2837350368499756e-05, 1.4394521713256836e-05, 1.5951693058013916e-05, 1.7508864402770996e-05, 1.9066035747528076e-05, 2.0623207092285156e-05, 2.2180378437042236e-05, 2.3737549781799316e-05, 2.5294721126556396e-05, 2.6851892471313477e-05, 2.8409063816070557e-05, 2.9966235160827637e-05, 3.152340650558472e-05, 3.30805778503418e-05, 3.463774919509888e-05, 3.619492053985596e-05, 3.775209188461304e-05, 3.930926322937012e-05, 4.08664345741272e-05, 4.242360591888428e-05, 4.398077726364136e-05, 4.553794860839844e-05]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 18.0, 18.0, 21.0, 33.0, 44.0, 43.0, 74.0, 103.0, 106.0, 125.0, 88.0, 88.0, 44.0, 40.0, 34.0, 17.0, 15.0, 13.0, 15.0, 7.0, 7.0, 2.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00017192374798469245, -0.00016515079187229276, -0.00015837782120797783, -0.00015160486509557813, -0.0001448318944312632, -0.0001380589383188635, -0.00013128598220646381, -0.00012451302609406412, -0.00011774005542974919, -0.00011096709204139188, -0.00010419412865303457, -9.742117254063487e-05, -9.064820915227756e-05, -8.387524576392025e-05, -7.710228965152055e-05, -7.032932626316324e-05, -6.355636287480593e-05, -5.6783399486448616e-05, -5.001043973607011e-05, -4.323747998569161e-05, -3.6464516597334296e-05, -2.9691553208976984e-05, -2.291859345859848e-05, -1.6145633708219975e-05, -9.372670319862664e-06, -2.599708750494756e-06, 4.173252818873152e-06, 1.094621438824106e-05, 1.7719175957608968e-05, 2.449213934596628e-05, 3.1265099096344784e-05, 3.803805884672329e-05, 4.48110222350806e-05, 5.158398562343791e-05, 5.8356945373816416e-05, 6.512990512419492e-05, 7.190286851255223e-05, 7.867583190090954e-05, 8.544878801330924e-05, 9.222175140166655e-05, 9.899471479002386e-05, 0.00010576767817838117, 0.00011254064156673849, 0.00011931359767913818, 0.00012608655379153788, 0.0001328595244558528, 0.0001396324805682525, 0.00014640545123256743, 0.00015317840734496713, 0.00015995136345736682, 0.00016672433412168175, 0.00017349729023408145, 0.00018027026089839637, 0.00018704321701079607, 0.00019381617312319577, 0.00020058912923559546, 0.0002073620998999104, 0.0002141350560123101, 0.000220908026676625, 0.0002276809827890247, 0.0002344539389014244, 0.00024122690956573933, 0.00024799988023005426, 0.00025477283634245396, 0.00026154579245485365]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 6.0, 6.0, 9.0, 8.0, 7.0, 5.0, 11.0, 13.0, 16.0, 16.0, 19.0, 21.0, 24.0, 25.0, 24.0, 23.0, 33.0, 33.0, 34.0, 39.0, 47.0, 39.0, 41.0, 37.0, 44.0, 35.0, 29.0, 42.0, 27.0, 46.0, 32.0, 34.0, 30.0, 22.0, 17.0, 20.0, 13.0, 12.0, 10.0, 13.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011074542999267578, -0.00010712537914514542, -0.00010350532829761505, -9.988527745008469e-05, -9.626522660255432e-05, -9.264517575502396e-05, -8.902512490749359e-05, -8.540507405996323e-05, -8.178502321243286e-05, -7.81649723649025e-05, -7.454492151737213e-05, -7.092487066984177e-05, -6.73048198223114e-05, -6.368476897478104e-05, -6.006471812725067e-05, -5.6444667279720306e-05, -5.282461643218994e-05, -4.9204565584659576e-05, -4.558451473712921e-05, -4.1964463889598846e-05, -3.834441304206848e-05, -3.4724362194538116e-05, -3.110431134700775e-05, -2.7484260499477386e-05, -2.386420965194702e-05, -2.0244158804416656e-05, -1.662410795688629e-05, -1.3004057109355927e-05, -9.384006261825562e-06, -5.7639554142951965e-06, -2.1439045667648315e-06, 1.4761462807655334e-06, 5.0961971282958984e-06, 8.716247975826263e-06, 1.2336298823356628e-05, 1.5956349670886993e-05, 1.957640051841736e-05, 2.3196451365947723e-05, 2.681650221347809e-05, 3.0436553061008453e-05, 3.405660390853882e-05, 3.767665475606918e-05, 4.129670560359955e-05, 4.491675645112991e-05, 4.853680729866028e-05, 5.215685814619064e-05, 5.577690899372101e-05, 5.939695984125137e-05, 6.301701068878174e-05, 6.66370615363121e-05, 7.025711238384247e-05, 7.387716323137283e-05, 7.74972140789032e-05, 8.111726492643356e-05, 8.473731577396393e-05, 8.835736662149429e-05, 9.197741746902466e-05, 9.559746831655502e-05, 9.921751916408539e-05, 0.00010283757001161575, 0.00010645762085914612, 0.00011007767170667648, 0.00011369772255420685, 0.00011731777340173721, 0.00012093782424926758]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 7.0, 9.0, 13.0, 29.0, 29.0, 56.0, 84.0, 134.0, 209.0, 299.0, 571.0, 1064.0, 1899.0, 4350.0, 9785.0, 25350.0, 84959.0, 558977.0, 269566.0, 57691.0, 18764.0, 7560.0, 3324.0, 1636.0, 888.0, 479.0, 292.0, 175.0, 109.0, 65.0, 57.0, 34.0, 28.0, 24.0, 10.0, 5.0, 8.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015020370483398438, -0.00014533475041389465, -0.00014046579599380493, -0.0001355968415737152, -0.0001307278871536255, -0.00012585893273353577, -0.00012098997831344604, -0.00011612102389335632, -0.0001112520694732666, -0.00010638311505317688, -0.00010151416063308716, -9.664520621299744e-05, -9.177625179290771e-05, -8.690729737281799e-05, -8.203834295272827e-05, -7.716938853263855e-05, -7.230043411254883e-05, -6.74314796924591e-05, -6.256252527236938e-05, -5.769357085227966e-05, -5.282461643218994e-05, -4.795566201210022e-05, -4.30867075920105e-05, -3.8217753171920776e-05, -3.3348798751831055e-05, -2.8479844331741333e-05, -2.361088991165161e-05, -1.874193549156189e-05, -1.3872981071472168e-05, -9.004026651382446e-06, -4.135072231292725e-06, 7.338821887969971e-07, 5.602836608886719e-06, 1.047179102897644e-05, 1.5340745449066162e-05, 2.0209699869155884e-05, 2.5078654289245605e-05, 2.9947608709335327e-05, 3.481656312942505e-05, 3.968551754951477e-05, 4.455447196960449e-05, 4.9423426389694214e-05, 5.4292380809783936e-05, 5.916133522987366e-05, 6.403028964996338e-05, 6.88992440700531e-05, 7.376819849014282e-05, 7.863715291023254e-05, 8.350610733032227e-05, 8.837506175041199e-05, 9.324401617050171e-05, 9.811297059059143e-05, 0.00010298192501068115, 0.00010785087943077087, 0.0001127198338508606, 0.00011758878827095032, 0.00012245774269104004, 0.00012732669711112976, 0.00013219565153121948, 0.0001370646059513092, 0.00014193356037139893, 0.00014680251479148865, 0.00015167146921157837, 0.0001565404236316681, 0.0001614093780517578]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 13.0, 20.0, 26.0, 31.0, 46.0, 65.0, 73.0, 104.0, 105.0, 97.0, 95.0, 67.0, 61.0, 55.0, 25.0, 20.0, 24.0, 13.0, 7.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-05, -2.4106353521347046e-05, -2.317875623703003e-05, -2.2251158952713013e-05, -2.1323561668395996e-05, -2.039596438407898e-05, -1.9468367099761963e-05, -1.8540769815444946e-05, -1.761317253112793e-05, -1.6685575246810913e-05, -1.5757977962493896e-05, -1.483038067817688e-05, -1.3902783393859863e-05, -1.2975186109542847e-05, -1.204758882522583e-05, -1.1119991540908813e-05, -1.0192394256591797e-05, -9.26479697227478e-06, -8.337199687957764e-06, -7.409602403640747e-06, -6.4820051193237305e-06, -5.554407835006714e-06, -4.626810550689697e-06, -3.6992132663726807e-06, -2.771615982055664e-06, -1.8440186977386475e-06, -9.164214134216309e-07, 1.1175870895385742e-08, 9.387731552124023e-07, 1.866370439529419e-06, 2.7939677238464355e-06, 3.721565008163452e-06, 4.649162292480469e-06, 5.576759576797485e-06, 6.504356861114502e-06, 7.4319541454315186e-06, 8.359551429748535e-06, 9.287148714065552e-06, 1.0214745998382568e-05, 1.1142343282699585e-05, 1.2069940567016602e-05, 1.2997537851333618e-05, 1.3925135135650635e-05, 1.4852732419967651e-05, 1.5780329704284668e-05, 1.6707926988601685e-05, 1.76355242729187e-05, 1.8563121557235718e-05, 1.9490718841552734e-05, 2.041831612586975e-05, 2.1345913410186768e-05, 2.2273510694503784e-05, 2.32011079788208e-05, 2.4128705263137817e-05, 2.5056302547454834e-05, 2.598389983177185e-05, 2.6911497116088867e-05, 2.7839094400405884e-05, 2.87666916847229e-05, 2.9694288969039917e-05, 3.0621886253356934e-05, 3.154948353767395e-05, 3.247708082199097e-05, 3.3404678106307983e-05, 3.4332275390625e-05]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 18.0, 16.0, 40.0, 58.0, 112.0, 158.0, 252.0, 478.0, 760.0, 1370.0, 2307.0, 4164.0, 7755.0, 13035.0, 24798.0, 46425.0, 101729.0, 286253.0, 345322.0, 107324.0, 48354.0, 26196.0, 13588.0, 7710.0, 4324.0, 2568.0, 1454.0, 814.0, 475.0, 280.0, 136.0, 88.0, 69.0, 41.0, 20.0, 16.0, 10.0, 9.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4717063903808594e-05, -5.295407027006149e-05, -5.119107663631439e-05, -4.942808300256729e-05, -4.766508936882019e-05, -4.590209573507309e-05, -4.413910210132599e-05, -4.237610846757889e-05, -4.061311483383179e-05, -3.8850121200084686e-05, -3.7087127566337585e-05, -3.5324133932590485e-05, -3.3561140298843384e-05, -3.179814666509628e-05, -3.0035153031349182e-05, -2.827215939760208e-05, -2.650916576385498e-05, -2.474617213010788e-05, -2.298317849636078e-05, -2.1220184862613678e-05, -1.9457191228866577e-05, -1.7694197595119476e-05, -1.5931203961372375e-05, -1.4168210327625275e-05, -1.2405216693878174e-05, -1.0642223060131073e-05, -8.879229426383972e-06, -7.116235792636871e-06, -5.3532421588897705e-06, -3.5902485251426697e-06, -1.8272548913955688e-06, -6.426125764846802e-08, 1.6987323760986328e-06, 3.4617260098457336e-06, 5.2247196435928345e-06, 6.987713277339935e-06, 8.750706911087036e-06, 1.0513700544834137e-05, 1.2276694178581238e-05, 1.4039687812328339e-05, 1.580268144607544e-05, 1.756567507982254e-05, 1.932866871356964e-05, 2.1091662347316742e-05, 2.2854655981063843e-05, 2.4617649614810944e-05, 2.6380643248558044e-05, 2.8143636882305145e-05, 2.9906630516052246e-05, 3.166962414979935e-05, 3.343261778354645e-05, 3.519561141729355e-05, 3.695860505104065e-05, 3.872159868478775e-05, 4.048459231853485e-05, 4.224758595228195e-05, 4.401057958602905e-05, 4.5773573219776154e-05, 4.7536566853523254e-05, 4.9299560487270355e-05, 5.1062554121017456e-05, 5.282554775476456e-05, 5.458854138851166e-05, 5.635153502225876e-05, 5.811452865600586e-05]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 12.0, 5.0, 11.0, 14.0, 13.0, 18.0, 19.0, 21.0, 21.0, 24.0, 24.0, 40.0, 34.0, 41.0, 51.0, 51.0, 46.0, 45.0, 40.0, 49.0, 46.0, 36.0, 40.0, 34.0, 33.0, 34.0, 41.0, 22.0, 21.0, 20.0, 14.0, 16.0, 16.0, 10.0, 9.0, 7.0, 7.0, 2.0, 7.0, 2.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410743713378906e-05, -4.268437623977661e-05, -4.126131534576416e-05, -3.983825445175171e-05, -3.841519355773926e-05, -3.699213266372681e-05, -3.5569071769714355e-05, -3.4146010875701904e-05, -3.272294998168945e-05, -3.1299889087677e-05, -2.987682819366455e-05, -2.84537672996521e-05, -2.703070640563965e-05, -2.5607645511627197e-05, -2.4184584617614746e-05, -2.2761523723602295e-05, -2.1338462829589844e-05, -1.9915401935577393e-05, -1.849234104156494e-05, -1.706928014755249e-05, -1.564621925354004e-05, -1.4223158359527588e-05, -1.2800097465515137e-05, -1.1377036571502686e-05, -9.953975677490234e-06, -8.530914783477783e-06, -7.107853889465332e-06, -5.684792995452881e-06, -4.26173210144043e-06, -2.8386712074279785e-06, -1.4156103134155273e-06, 7.450580596923828e-09, 1.430511474609375e-06, 2.853572368621826e-06, 4.276633262634277e-06, 5.6996941566467285e-06, 7.12275505065918e-06, 8.545815944671631e-06, 9.968876838684082e-06, 1.1391937732696533e-05, 1.2814998626708984e-05, 1.4238059520721436e-05, 1.5661120414733887e-05, 1.7084181308746338e-05, 1.850724220275879e-05, 1.993030309677124e-05, 2.135336399078369e-05, 2.2776424884796143e-05, 2.4199485778808594e-05, 2.5622546672821045e-05, 2.7045607566833496e-05, 2.8468668460845947e-05, 2.98917293548584e-05, 3.131479024887085e-05, 3.27378511428833e-05, 3.416091203689575e-05, 3.55839729309082e-05, 3.7007033824920654e-05, 3.8430094718933105e-05, 3.985315561294556e-05, 4.127621650695801e-05, 4.269927740097046e-05, 4.412233829498291e-05, 4.554539918899536e-05, 4.696846008300781e-05]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 12.0, 12.0, 14.0, 18.0, 11.0, 41.0, 29.0, 82.0, 58.0, 174.0, 121.0, 401.0, 745.0, 607.0, 2004.0, 1770.0, 6527.0, 6278.0, 27644.0, 29724.0, 146422.0, 176021.0, 426915.0, 147300.0, 29061.0, 27555.0, 6384.0, 6673.0, 1696.0, 1963.0, 589.0, 693.0, 227.0, 278.0, 178.0, 78.0, 88.0, 29.0, 55.0, 16.0, 20.0, 8.0, 9.0, 5.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.7688220143318176e-06, -2.6766210794448853e-06, -2.584420144557953e-06, -2.4922192096710205e-06, -2.400018274784088e-06, -2.3078173398971558e-06, -2.2156164050102234e-06, -2.123415470123291e-06, -2.0312145352363586e-06, -1.9390136003494263e-06, -1.846812665462494e-06, -1.7546117305755615e-06, -1.6624107956886292e-06, -1.5702098608016968e-06, -1.4780089259147644e-06, -1.385807991027832e-06, -1.2936070561408997e-06, -1.2014061212539673e-06, -1.109205186367035e-06, -1.0170042514801025e-06, -9.248033165931702e-07, -8.326023817062378e-07, -7.404014468193054e-07, -6.48200511932373e-07, -5.559995770454407e-07, -4.637986421585083e-07, -3.7159770727157593e-07, -2.7939677238464355e-07, -1.8719583749771118e-07, -9.499490261077881e-08, -2.7939677238464355e-09, 8.940696716308594e-08, 1.816079020500183e-07, 2.738088369369507e-07, 3.6600977182388306e-07, 4.5821070671081543e-07, 5.504116415977478e-07, 6.426125764846802e-07, 7.348135113716125e-07, 8.270144462585449e-07, 9.192153811454773e-07, 1.0114163160324097e-06, 1.103617250919342e-06, 1.1958181858062744e-06, 1.2880191206932068e-06, 1.3802200555801392e-06, 1.4724209904670715e-06, 1.564621925354004e-06, 1.6568228602409363e-06, 1.7490237951278687e-06, 1.841224730014801e-06, 1.9334256649017334e-06, 2.0256265997886658e-06, 2.117827534675598e-06, 2.2100284695625305e-06, 2.302229404449463e-06, 2.3944303393363953e-06, 2.4866312742233276e-06, 2.57883220911026e-06, 2.6710331439971924e-06, 2.7632340788841248e-06, 2.855435013771057e-06, 2.9476359486579895e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 0.0, 2.0, 9.0, 12.0, 0.0, 11.0, 21.0, 0.0, 26.0, 42.0, 41.0, 0.0, 39.0, 56.0, 55.0, 0.0, 69.0, 73.0, 69.0, 0.0, 73.0, 76.0, 0.0, 75.0, 49.0, 37.0, 0.0, 38.0, 33.0, 26.0, 0.0, 17.0, 20.0, 14.0, 0.0, 4.0, 6.0, 0.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3113021850585938e-06, -1.2675300240516663e-06, -1.2237578630447388e-06, -1.1799857020378113e-06, -1.1362135410308838e-06, -1.0924413800239563e-06, -1.0486692190170288e-06, -1.0048970580101013e-06, -9.611248970031738e-07, -9.173527359962463e-07, -8.735805749893188e-07, -8.298084139823914e-07, -7.860362529754639e-07, -7.422640919685364e-07, -6.984919309616089e-07, -6.547197699546814e-07, -6.109476089477539e-07, -5.671754479408264e-07, -5.234032869338989e-07, -4.796311259269714e-07, -4.3585896492004395e-07, -3.9208680391311646e-07, -3.4831464290618896e-07, -3.045424818992615e-07, -2.60770320892334e-07, -2.169981598854065e-07, -1.73225998878479e-07, -1.2945383787155151e-07, -8.568167686462402e-08, -4.190951585769653e-08, 1.862645149230957e-09, 4.563480615615845e-08, 8.940696716308594e-08, 1.3317912817001343e-07, 1.7695128917694092e-07, 2.207234501838684e-07, 2.644956111907959e-07, 3.082677721977234e-07, 3.520399332046509e-07, 3.9581209421157837e-07, 4.3958425521850586e-07, 4.833564162254333e-07, 5.271285772323608e-07, 5.709007382392883e-07, 6.146728992462158e-07, 6.584450602531433e-07, 7.022172212600708e-07, 7.459893822669983e-07, 7.897615432739258e-07, 8.335337042808533e-07, 8.773058652877808e-07, 9.210780262947083e-07, 9.648501873016357e-07, 1.0086223483085632e-06, 1.0523945093154907e-06, 1.0961666703224182e-06, 1.1399388313293457e-06, 1.1837109923362732e-06, 1.2274831533432007e-06, 1.2712553143501282e-06, 1.3150274753570557e-06, 1.3587996363639832e-06, 1.4025717973709106e-06, 1.4463439583778381e-06, 1.4901161193847656e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 12.0, 9.0, 22.0, 71.0, 56.0, 77.0, 109.0, 157.0, 532.0, 508.0, 766.0, 1176.0, 1938.0, 8879.0, 10379.0, 19301.0, 37277.0, 79994.0, 533869.0, 192002.0, 80118.0, 37650.0, 19147.0, 15832.0, 3311.0, 1885.0, 1177.0, 743.0, 804.0, 219.0, 154.0, 107.0, 79.0, 88.0, 27.0, 23.0, 14.0, 11.0, 17.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0740553736686707e-06, -2.002343535423279e-06, -1.930631697177887e-06, -1.8589198589324951e-06, -1.7872080206871033e-06, -1.7154961824417114e-06, -1.6437843441963196e-06, -1.5720725059509277e-06, -1.5003606677055359e-06, -1.428648829460144e-06, -1.3569369912147522e-06, -1.2852251529693604e-06, -1.2135133147239685e-06, -1.1418014764785767e-06, -1.0700896382331848e-06, -9.98377799987793e-07, -9.266659617424011e-07, -8.549541234970093e-07, -7.832422852516174e-07, -7.115304470062256e-07, -6.398186087608337e-07, -5.681067705154419e-07, -4.9639493227005e-07, -4.246830940246582e-07, -3.5297125577926636e-07, -2.812594175338745e-07, -2.0954757928848267e-07, -1.3783574104309082e-07, -6.612390279769897e-08, 5.587935447692871e-09, 7.729977369308472e-08, 1.4901161193847656e-07, 2.207234501838684e-07, 2.9243528842926025e-07, 3.641471266746521e-07, 4.3585896492004395e-07, 5.075708031654358e-07, 5.792826414108276e-07, 6.509944796562195e-07, 7.227063179016113e-07, 7.944181561470032e-07, 8.66129994392395e-07, 9.378418326377869e-07, 1.0095536708831787e-06, 1.0812655091285706e-06, 1.1529773473739624e-06, 1.2246891856193542e-06, 1.296401023864746e-06, 1.368112862110138e-06, 1.4398247003555298e-06, 1.5115365386009216e-06, 1.5832483768463135e-06, 1.6549602150917053e-06, 1.7266720533370972e-06, 1.798383891582489e-06, 1.8700957298278809e-06, 1.9418075680732727e-06, 2.0135194063186646e-06, 2.0852312445640564e-06, 2.1569430828094482e-06, 2.22865492105484e-06, 2.300366759300232e-06, 2.3720785975456238e-06, 2.4437904357910156e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 12.0, 4.0, 7.0, 14.0, 21.0, 25.0, 30.0, 43.0, 36.0, 46.0, 51.0, 60.0, 58.0, 63.0, 68.0, 57.0, 63.0, 49.0, 49.0, 42.0, 41.0, 32.0, 28.0, 20.0, 19.0, 16.0, 15.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.667998731136322e-06, -1.607462763786316e-06, -1.5469267964363098e-06, -1.4863908290863037e-06, -1.4258548617362976e-06, -1.3653188943862915e-06, -1.3047829270362854e-06, -1.2442469596862793e-06, -1.1837109923362732e-06, -1.123175024986267e-06, -1.062639057636261e-06, -1.0021030902862549e-06, -9.415671229362488e-07, -8.810311555862427e-07, -8.204951882362366e-07, -7.599592208862305e-07, -6.994232535362244e-07, -6.388872861862183e-07, -5.783513188362122e-07, -5.178153514862061e-07, -4.5727938413619995e-07, -3.9674341678619385e-07, -3.3620744943618774e-07, -2.7567148208618164e-07, -2.1513551473617554e-07, -1.5459954738616943e-07, -9.406358003616333e-08, -3.3527612686157227e-08, 2.7008354663848877e-08, 8.754432201385498e-08, 1.4808028936386108e-07, 2.086162567138672e-07, 2.691522240638733e-07, 3.296881914138794e-07, 3.902241587638855e-07, 4.507601261138916e-07, 5.112960934638977e-07, 5.718320608139038e-07, 6.323680281639099e-07, 6.92903995513916e-07, 7.534399628639221e-07, 8.139759302139282e-07, 8.745118975639343e-07, 9.350478649139404e-07, 9.955838322639465e-07, 1.0561197996139526e-06, 1.1166557669639587e-06, 1.1771917343139648e-06, 1.237727701663971e-06, 1.298263669013977e-06, 1.3587996363639832e-06, 1.4193356037139893e-06, 1.4798715710639954e-06, 1.5404075384140015e-06, 1.6009435057640076e-06, 1.6614794731140137e-06, 1.7220154404640198e-06, 1.7825514078140259e-06, 1.843087375164032e-06, 1.903623342514038e-06, 1.964159309864044e-06, 2.0246952772140503e-06, 2.0852312445640564e-06, 2.1457672119140625e-06]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 10.0, 18.0, 18.0, 30.0, 40.0, 58.0, 127.0, 249.0, 156.0, 86.0, 56.0, 44.0, 25.0, 15.0, 22.0, 10.0, 2.0, 7.0, 5.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001720039581414312, -0.00016356947890017182, -0.00015513499965891242, -0.00014670052041765302, -0.00013826604117639363, -0.00012983157648704946, -0.00012139709724579006, -0.00011296261800453067, -0.00010452813876327127, -9.609365952201188e-05, -8.765918028075248e-05, -7.92247083154507e-05, -7.07902290741913e-05, -6.23557498329319e-05, -5.392127422965132e-05, -4.548679862637073e-05, -3.705231938511133e-05, -2.861784196284134e-05, -2.0183364540571347e-05, -1.1748887118301354e-05, -3.314409696031362e-06, 5.120069545228034e-06, 1.3554545148508623e-05, 2.1989020751789212e-05, 3.0423499993048608e-05, 3.8857979234308004e-05, 4.729245483758859e-05, 5.572693044086918e-05, 6.416140968212858e-05, 7.259588892338797e-05, 8.103036088868976e-05, 8.946484012994915e-05, 9.7899348475039e-05, 0.0001063338277162984, 0.0001147683069575578, 0.0001232027861988172, 0.0001316372654400766, 0.00014007173012942076, 0.00014850620937068015, 0.00015694068861193955, 0.00016537516785319895, 0.00017380964709445834, 0.00018224412633571774, 0.00019067860557697713, 0.0001991130702663213, 0.00020754756405949593, 0.0002159820287488401, 0.0002244165079900995, 0.00023285098723135889, 0.00024128546647261828, 0.0002497199457138777, 0.00025815441040322185, 0.00026658890419639647, 0.00027502336888574064, 0.00028345786267891526, 0.00029189232736825943, 0.0003003267920576036, 0.00030876125674694777, 0.0003171957505401224, 0.00032563021522946656, 0.0003340647090226412, 0.00034249917371198535, 0.00035093366750516, 0.00035936813219450414, 0.00036780262598767877]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 7.0, 11.0, 14.0, 20.0, 15.0, 25.0, 27.0, 20.0, 25.0, 34.0, 31.0, 55.0, 31.0, 33.0, 41.0, 36.0, 33.0, 33.0, 50.0, 43.0, 34.0, 37.0, 27.0, 39.0, 24.0, 31.0, 22.0, 30.0, 24.0, 26.0, 20.0, 13.0, 10.0, 11.0, 1.0, 11.0, 3.0, 5.0, 6.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0], "bins": [-0.00012248754501342773, -0.00011892616748809814, -0.00011536478996276855, -0.00011180341243743896, -0.00010824203491210938, -0.00010468065738677979, -0.0001011192798614502, -9.75579023361206e-05, -9.399652481079102e-05, -9.043514728546143e-05, -8.687376976013184e-05, -8.331239223480225e-05, -7.975101470947266e-05, -7.618963718414307e-05, -7.262825965881348e-05, -6.906688213348389e-05, -6.55055046081543e-05, -6.194412708282471e-05, -5.838274955749512e-05, -5.482137203216553e-05, -5.125999450683594e-05, -4.769861698150635e-05, -4.413723945617676e-05, -4.057586193084717e-05, -3.701448440551758e-05, -3.345310688018799e-05, -2.98917293548584e-05, -2.633035182952881e-05, -2.276897430419922e-05, -1.920759677886963e-05, -1.564621925354004e-05, -1.208484172821045e-05, -8.52346420288086e-06, -4.9620866775512695e-06, -1.4007091522216797e-06, 2.16066837310791e-06, 5.7220458984375e-06, 9.28342342376709e-06, 1.284480094909668e-05, 1.640617847442627e-05, 1.996755599975586e-05, 2.352893352508545e-05, 2.709031105041504e-05, 3.065168857574463e-05, 3.421306610107422e-05, 3.777444362640381e-05, 4.13358211517334e-05, 4.489719867706299e-05, 4.845857620239258e-05, 5.201995372772217e-05, 5.558133125305176e-05, 5.914270877838135e-05, 6.270408630371094e-05, 6.626546382904053e-05, 6.982684135437012e-05, 7.338821887969971e-05, 7.69495964050293e-05, 8.051097393035889e-05, 8.407235145568848e-05, 8.763372898101807e-05, 9.119510650634766e-05, 9.475648403167725e-05, 9.831786155700684e-05, 0.00010187923908233643, 0.00010544061660766602]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 7.0, 10.0, 12.0, 9.0, 14.0, 23.0, 28.0, 49.0, 62.0, 85.0, 118.0, 173.0, 230.0, 349.0, 540.0, 800.0, 1244.0, 2026.0, 3643.0, 7164.0, 15435.0, 48065.0, 953660.0, 3065865.0, 57114.0, 18430.0, 8214.0, 4241.0, 2338.0, 1460.0, 909.0, 585.0, 401.0, 245.0, 186.0, 134.0, 99.0, 59.0, 37.0, 42.0, 28.0, 29.0, 23.0, 15.0, 11.0, 16.0, 5.0, 12.0, 13.0, 7.0, 7.0, 9.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.426738739013672e-05, -7.142126560211182e-05, -6.857514381408691e-05, -6.572902202606201e-05, -6.288290023803711e-05, -6.003677845001221e-05, -5.7190656661987305e-05, -5.43445348739624e-05, -5.14984130859375e-05, -4.86522912979126e-05, -4.5806169509887695e-05, -4.296004772186279e-05, -4.011392593383789e-05, -3.726780414581299e-05, -3.4421682357788086e-05, -3.1575560569763184e-05, -2.872943878173828e-05, -2.588331699371338e-05, -2.3037195205688477e-05, -2.0191073417663574e-05, -1.7344951629638672e-05, -1.449882984161377e-05, -1.1652708053588867e-05, -8.806586265563965e-06, -5.9604644775390625e-06, -3.11434268951416e-06, -2.682209014892578e-07, 2.5779008865356445e-06, 5.424022674560547e-06, 8.27014446258545e-06, 1.1116266250610352e-05, 1.3962388038635254e-05, 1.6808509826660156e-05, 1.965463161468506e-05, 2.250075340270996e-05, 2.5346875190734863e-05, 2.8192996978759766e-05, 3.103911876678467e-05, 3.388524055480957e-05, 3.673136234283447e-05, 3.9577484130859375e-05, 4.242360591888428e-05, 4.526972770690918e-05, 4.811584949493408e-05, 5.0961971282958984e-05, 5.380809307098389e-05, 5.665421485900879e-05, 5.950033664703369e-05, 6.23464584350586e-05, 6.51925802230835e-05, 6.80387020111084e-05, 7.08848237991333e-05, 7.37309455871582e-05, 7.65770673751831e-05, 7.942318916320801e-05, 8.226931095123291e-05, 8.511543273925781e-05, 8.796155452728271e-05, 9.080767631530762e-05, 9.365379810333252e-05, 9.649991989135742e-05, 9.934604167938232e-05, 0.00010219216346740723, 0.00010503828525543213, 0.00010788440704345703]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 3.0, 3.0, 18.0, 8.0, 7.0, 19.0, 28.0, 31.0, 56.0, 71.0, 65.0, 93.0, 106.0, 102.0, 64.0, 64.0, 72.0, 57.0, 27.0, 23.0, 19.0, 18.0, 11.0, 7.0, 4.0, 3.0, 9.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.491474151611328e-05, -2.40253284573555e-05, -2.3135915398597717e-05, -2.2246502339839935e-05, -2.1357089281082153e-05, -2.046767622232437e-05, -1.957826316356659e-05, -1.8688850104808807e-05, -1.7799437046051025e-05, -1.6910023987293243e-05, -1.602061092853546e-05, -1.513119786977768e-05, -1.4241784811019897e-05, -1.3352371752262115e-05, -1.2462958693504333e-05, -1.1573545634746552e-05, -1.068413257598877e-05, -9.794719517230988e-06, -8.905306458473206e-06, -8.015893399715424e-06, -7.126480340957642e-06, -6.23706728219986e-06, -5.347654223442078e-06, -4.458241164684296e-06, -3.5688281059265137e-06, -2.6794150471687317e-06, -1.7900019884109497e-06, -9.005889296531677e-07, -1.1175870895385742e-08, 8.782371878623962e-07, 1.7676502466201782e-06, 2.65706330537796e-06, 3.546476364135742e-06, 4.435889422893524e-06, 5.325302481651306e-06, 6.214715540409088e-06, 7.10412859916687e-06, 7.993541657924652e-06, 8.882954716682434e-06, 9.772367775440216e-06, 1.0661780834197998e-05, 1.155119389295578e-05, 1.2440606951713562e-05, 1.3330020010471344e-05, 1.4219433069229126e-05, 1.5108846127986908e-05, 1.599825918674469e-05, 1.6887672245502472e-05, 1.7777085304260254e-05, 1.8666498363018036e-05, 1.9555911421775818e-05, 2.04453244805336e-05, 2.1334737539291382e-05, 2.2224150598049164e-05, 2.3113563656806946e-05, 2.4002976715564728e-05, 2.489238977432251e-05, 2.5781802833080292e-05, 2.6671215891838074e-05, 2.7560628950595856e-05, 2.8450042009353638e-05, 2.933945506811142e-05, 3.02288681268692e-05, 3.1118281185626984e-05, 3.2007694244384766e-05]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 4.0, 16.0, 9.0, 21.0, 26.0, 58.0, 73.0, 127.0, 200.0, 350.0, 537.0, 931.0, 1630.0, 2852.0, 5302.0, 10331.0, 21163.0, 54681.0, 235738.0, 3506108.0, 252408.0, 55969.0, 22310.0, 10497.0, 5635.0, 3038.0, 1738.0, 1026.0, 571.0, 336.0, 205.0, 132.0, 89.0, 57.0, 38.0, 30.0, 11.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.984306335449219e-05, -5.794409662485123e-05, -5.6045129895210266e-05, -5.4146163165569305e-05, -5.2247196435928345e-05, -5.0348229706287384e-05, -4.844926297664642e-05, -4.655029624700546e-05, -4.46513295173645e-05, -4.275236278772354e-05, -4.085339605808258e-05, -3.895442932844162e-05, -3.705546259880066e-05, -3.51564958691597e-05, -3.325752913951874e-05, -3.135856240987778e-05, -2.9459595680236816e-05, -2.7560628950595856e-05, -2.5661662220954895e-05, -2.3762695491313934e-05, -2.1863728761672974e-05, -1.9964762032032013e-05, -1.8065795302391052e-05, -1.616682857275009e-05, -1.4267861843109131e-05, -1.236889511346817e-05, -1.046992838382721e-05, -8.570961654186249e-06, -6.671994924545288e-06, -4.773028194904327e-06, -2.8740614652633667e-06, -9.75094735622406e-07, 9.238719940185547e-07, 2.8228387236595154e-06, 4.721805453300476e-06, 6.620772182941437e-06, 8.519738912582397e-06, 1.0418705642223358e-05, 1.2317672371864319e-05, 1.421663910150528e-05, 1.611560583114624e-05, 1.80145725607872e-05, 1.991353929042816e-05, 2.1812506020069122e-05, 2.3711472749710083e-05, 2.5610439479351044e-05, 2.7509406208992004e-05, 2.9408372938632965e-05, 3.1307339668273926e-05, 3.3206306397914886e-05, 3.510527312755585e-05, 3.700423985719681e-05, 3.890320658683777e-05, 4.080217331647873e-05, 4.270114004611969e-05, 4.460010677576065e-05, 4.649907350540161e-05, 4.839804023504257e-05, 5.029700696468353e-05, 5.2195973694324493e-05, 5.4094940423965454e-05, 5.5993907153606415e-05, 5.7892873883247375e-05, 5.9791840612888336e-05, 6.16908073425293e-05]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 5.0, 4.0, 12.0, 17.0, 17.0, 20.0, 41.0, 49.0, 57.0, 112.0, 330.0, 1007.0, 1482.0, 456.0, 156.0, 65.0, 55.0, 30.0, 30.0, 24.0, 18.0, 13.0, 12.0, 12.0, 9.0, 6.0, 6.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.684925079345703e-05, -4.52408567070961e-05, -4.363246262073517e-05, -4.202406853437424e-05, -4.0415674448013306e-05, -3.8807280361652374e-05, -3.719888627529144e-05, -3.559049218893051e-05, -3.398209810256958e-05, -3.237370401620865e-05, -3.076530992984772e-05, -2.9156915843486786e-05, -2.7548521757125854e-05, -2.5940127670764923e-05, -2.4331733584403992e-05, -2.272333949804306e-05, -2.111494541168213e-05, -1.9506551325321198e-05, -1.7898157238960266e-05, -1.6289763152599335e-05, -1.4681369066238403e-05, -1.3072974979877472e-05, -1.146458089351654e-05, -9.856186807155609e-06, -8.247792720794678e-06, -6.639398634433746e-06, -5.031004548072815e-06, -3.4226104617118835e-06, -1.8142163753509521e-06, -2.0582228899002075e-07, 1.4025717973709106e-06, 3.010965883731842e-06, 4.6193599700927734e-06, 6.227754056453705e-06, 7.836148142814636e-06, 9.444542229175568e-06, 1.1052936315536499e-05, 1.266133040189743e-05, 1.4269724488258362e-05, 1.5878118574619293e-05, 1.7486512660980225e-05, 1.9094906747341156e-05, 2.0703300833702087e-05, 2.231169492006302e-05, 2.392008900642395e-05, 2.552848309278488e-05, 2.7136877179145813e-05, 2.8745271265506744e-05, 3.0353665351867676e-05, 3.196205943822861e-05, 3.357045352458954e-05, 3.517884761095047e-05, 3.67872416973114e-05, 3.839563578367233e-05, 4.0004029870033264e-05, 4.1612423956394196e-05, 4.322081804275513e-05, 4.482921212911606e-05, 4.643760621547699e-05, 4.804600030183792e-05, 4.965439438819885e-05, 5.1262788474559784e-05, 5.2871182560920715e-05, 5.447957664728165e-05, 5.608797073364258e-05]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 11.0, 11.0, 15.0, 14.0, 21.0, 31.0, 40.0, 51.0, 77.0, 103.0, 107.0, 96.0, 99.0, 66.0, 40.0, 57.0, 23.0, 24.0, 12.0, 19.0, 9.0, 16.0, 8.0, 2.0, 8.0, 4.0, 8.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00017171489889733493, -0.00016608646546956152, -0.0001604580320417881, -0.0001548296131659299, -0.0001492011797381565, -0.00014357274631038308, -0.00013794431288260967, -0.00013231587945483625, -0.00012668746057897806, -0.00012105902715120465, -0.00011543060099938884, -0.00010980216757161543, -0.00010417374141979963, -9.854530799202621e-05, -9.29168745642528e-05, -8.728844113647938e-05, -8.166000770870596e-05, -7.603157428093255e-05, -7.040314812911674e-05, -6.477471470134333e-05, -5.914628491154872e-05, -5.351785512175411e-05, -4.7889421693980694e-05, -4.2260991904186085e-05, -3.6632562114391476e-05, -3.100413232459687e-05, -2.5375700715812854e-05, -1.9747269107028842e-05, -1.4118839317234233e-05, -8.490409527439624e-06, -2.861976099666208e-06, 2.766453690128401e-06, 8.394868928007782e-06, 1.4023299627297092e-05, 1.9651730326586403e-05, 2.5280161935370415e-05, 3.0908591725165024e-05, 3.653702151495963e-05, 4.216545494273305e-05, 4.779388473252766e-05, 5.342231452232227e-05, 5.9050744312116876e-05, 6.467917410191149e-05, 7.03076075296849e-05, 7.593604095745832e-05, 8.156446710927412e-05, 8.719290053704754e-05, 9.282132668886334e-05, 9.844976011663675e-05, 0.00010407819354441017, 0.00010970661969622597, 0.00011533505312399939, 0.00012096347927581519, 0.0001265919127035886, 0.00013222034613136202, 0.00013784877955913544, 0.00014347719843499362, 0.00014910563186276704, 0.00015473406529054046, 0.00016036248416639864, 0.00016599091759417206, 0.00017161935102194548, 0.0001772477844497189, 0.0001828762178774923, 0.00018850465130526572]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 7.0, 14.0, 15.0, 15.0, 30.0, 19.0, 28.0, 19.0, 42.0, 35.0, 39.0, 44.0, 38.0, 49.0, 61.0, 49.0, 44.0, 49.0, 59.0, 46.0, 44.0, 40.0, 35.0, 29.0, 29.0, 20.0, 22.0, 14.0, 13.0, 12.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.00015342235565185547, -0.00014934968203306198, -0.0001452770084142685, -0.000141204334795475, -0.00013713166117668152, -0.00013305898755788803, -0.00012898631393909454, -0.00012491364032030106, -0.00012084096670150757, -0.00011676829308271408, -0.0001126956194639206, -0.0001086229458451271, -0.00010455027222633362, -0.00010047759860754013, -9.640492498874664e-05, -9.233225136995316e-05, -8.825957775115967e-05, -8.418690413236618e-05, -8.011423051357269e-05, -7.60415568947792e-05, -7.196888327598572e-05, -6.789620965719223e-05, -6.382353603839874e-05, -5.9750862419605255e-05, -5.567818880081177e-05, -5.160551518201828e-05, -4.753284156322479e-05, -4.3460167944431305e-05, -3.938749432563782e-05, -3.531482070684433e-05, -3.124214708805084e-05, -2.7169473469257355e-05, -2.3096799850463867e-05, -1.902412623167038e-05, -1.4951452612876892e-05, -1.0878778994083405e-05, -6.806105375289917e-06, -2.7334317564964294e-06, 1.339241862297058e-06, 5.411915481090546e-06, 9.484589099884033e-06, 1.355726271867752e-05, 1.7629936337471008e-05, 2.1702609956264496e-05, 2.5775283575057983e-05, 2.984795719385147e-05, 3.392063081264496e-05, 3.7993304431438446e-05, 4.2065978050231934e-05, 4.613865166902542e-05, 5.021132528781891e-05, 5.4283998906612396e-05, 5.8356672525405884e-05, 6.242934614419937e-05, 6.650201976299286e-05, 7.057469338178635e-05, 7.464736700057983e-05, 7.872004061937332e-05, 8.279271423816681e-05, 8.68653878569603e-05, 9.093806147575378e-05, 9.501073509454727e-05, 9.908340871334076e-05, 0.00010315608233213425, 0.00010722875595092773]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 12.0, 6.0, 11.0, 9.0, 22.0, 24.0, 26.0, 47.0, 53.0, 86.0, 119.0, 166.0, 281.0, 371.0, 585.0, 1020.0, 1670.0, 3034.0, 5436.0, 10331.0, 21246.0, 47953.0, 131087.0, 508135.0, 197182.0, 64099.0, 27115.0, 12989.0, 6483.0, 3565.0, 2107.0, 1219.0, 692.0, 446.0, 270.0, 178.0, 157.0, 97.0, 59.0, 30.0, 33.0, 14.0, 24.0, 12.0, 13.0, 7.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011336803436279297, -0.00010978709906339645, -0.00010620616376399994, -0.00010262522846460342, -9.904429316520691e-05, -9.54633578658104e-05, -9.188242256641388e-05, -8.830148726701736e-05, -8.472055196762085e-05, -8.113961666822433e-05, -7.755868136882782e-05, -7.39777460694313e-05, -7.039681077003479e-05, -6.681587547063828e-05, -6.323494017124176e-05, -5.9654004871845245e-05, -5.607306957244873e-05, -5.2492134273052216e-05, -4.89111989736557e-05, -4.5330263674259186e-05, -4.174932837486267e-05, -3.8168393075466156e-05, -3.458745777606964e-05, -3.1006522476673126e-05, -2.742558717727661e-05, -2.3844651877880096e-05, -2.026371657848358e-05, -1.6682781279087067e-05, -1.3101845979690552e-05, -9.520910680294037e-06, -5.939975380897522e-06, -2.359040081501007e-06, 1.2218952178955078e-06, 4.802830517292023e-06, 8.383765816688538e-06, 1.1964701116085052e-05, 1.5545636415481567e-05, 1.9126571714878082e-05, 2.2707507014274597e-05, 2.6288442313671112e-05, 2.9869377613067627e-05, 3.345031291246414e-05, 3.703124821186066e-05, 4.061218351125717e-05, 4.4193118810653687e-05, 4.77740541100502e-05, 5.1354989409446716e-05, 5.493592470884323e-05, 5.8516860008239746e-05, 6.209779530763626e-05, 6.567873060703278e-05, 6.925966590642929e-05, 7.28406012058258e-05, 7.642153650522232e-05, 8.000247180461884e-05, 8.358340710401535e-05, 8.716434240341187e-05, 9.074527770280838e-05, 9.43262130022049e-05, 9.790714830160141e-05, 0.00010148808360099792, 0.00010506901890039444, 0.00010864995419979095, 0.00011223088949918747, 0.00011581182479858398]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 9.0, 17.0, 26.0, 19.0, 23.0, 35.0, 49.0, 56.0, 52.0, 81.0, 82.0, 81.0, 90.0, 64.0, 65.0, 44.0, 46.0, 29.0, 21.0, 29.0, 12.0, 12.0, 10.0, 6.0, 8.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.728534698486328e-05, -1.6508623957633972e-05, -1.5731900930404663e-05, -1.4955177903175354e-05, -1.4178454875946045e-05, -1.3401731848716736e-05, -1.2625008821487427e-05, -1.1848285794258118e-05, -1.1071562767028809e-05, -1.02948397397995e-05, -9.51811671257019e-06, -8.741393685340881e-06, -7.964670658111572e-06, -7.187947630882263e-06, -6.411224603652954e-06, -5.634501576423645e-06, -4.857778549194336e-06, -4.081055521965027e-06, -3.3043324947357178e-06, -2.5276094675064087e-06, -1.7508864402770996e-06, -9.741634130477905e-07, -1.9744038581848145e-07, 5.792826414108276e-07, 1.3560056686401367e-06, 2.132728695869446e-06, 2.909451723098755e-06, 3.686174750328064e-06, 4.462897777557373e-06, 5.239620804786682e-06, 6.016343832015991e-06, 6.7930668592453e-06, 7.569789886474609e-06, 8.346512913703918e-06, 9.123235940933228e-06, 9.899958968162537e-06, 1.0676681995391846e-05, 1.1453405022621155e-05, 1.2230128049850464e-05, 1.3006851077079773e-05, 1.3783574104309082e-05, 1.4560297131538391e-05, 1.53370201587677e-05, 1.611374318599701e-05, 1.689046621322632e-05, 1.7667189240455627e-05, 1.8443912267684937e-05, 1.9220635294914246e-05, 1.9997358322143555e-05, 2.0774081349372864e-05, 2.1550804376602173e-05, 2.2327527403831482e-05, 2.310425043106079e-05, 2.38809734582901e-05, 2.465769648551941e-05, 2.5434419512748718e-05, 2.6211142539978027e-05, 2.6987865567207336e-05, 2.7764588594436646e-05, 2.8541311621665955e-05, 2.9318034648895264e-05, 3.0094757676124573e-05, 3.087148070335388e-05, 3.164820373058319e-05, 3.24249267578125e-05]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 7.0, 18.0, 15.0, 28.0, 39.0, 52.0, 79.0, 141.0, 240.0, 463.0, 842.0, 1651.0, 3257.0, 6437.0, 13142.0, 27963.0, 62934.0, 159907.0, 454404.0, 185460.0, 71230.0, 30993.0, 14577.0, 7156.0, 3565.0, 1826.0, 922.0, 506.0, 287.0, 141.0, 97.0, 46.0, 29.0, 28.0, 16.0, 13.0, 8.0, 9.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.985664367675781e-05, -6.771180778741837e-05, -6.556697189807892e-05, -6.342213600873947e-05, -6.127730011940002e-05, -5.913246423006058e-05, -5.698762834072113e-05, -5.484279245138168e-05, -5.2697956562042236e-05, -5.055312067270279e-05, -4.840828478336334e-05, -4.6263448894023895e-05, -4.411861300468445e-05, -4.1973777115345e-05, -3.9828941226005554e-05, -3.768410533666611e-05, -3.553926944732666e-05, -3.339443355798721e-05, -3.1249597668647766e-05, -2.910476177930832e-05, -2.6959925889968872e-05, -2.4815090000629425e-05, -2.2670254111289978e-05, -2.052541822195053e-05, -1.8380582332611084e-05, -1.6235746443271637e-05, -1.409091055393219e-05, -1.1946074664592743e-05, -9.801238775253296e-06, -7.656402885913849e-06, -5.511566996574402e-06, -3.366731107234955e-06, -1.2218952178955078e-06, 9.229406714439392e-07, 3.0677765607833862e-06, 5.212612450122833e-06, 7.35744833946228e-06, 9.502284228801727e-06, 1.1647120118141174e-05, 1.3791956007480621e-05, 1.593679189682007e-05, 1.8081627786159515e-05, 2.0226463675498962e-05, 2.237129956483841e-05, 2.4516135454177856e-05, 2.6660971343517303e-05, 2.880580723285675e-05, 3.09506431221962e-05, 3.3095479011535645e-05, 3.524031490087509e-05, 3.738515079021454e-05, 3.9529986679553986e-05, 4.167482256889343e-05, 4.381965845823288e-05, 4.596449434757233e-05, 4.8109330236911774e-05, 5.025416612625122e-05, 5.239900201559067e-05, 5.4543837904930115e-05, 5.668867379426956e-05, 5.883350968360901e-05, 6.0978345572948456e-05, 6.31231814622879e-05, 6.526801735162735e-05, 6.74128532409668e-05]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 13.0, 11.0, 12.0, 17.0, 14.0, 18.0, 24.0, 23.0, 38.0, 29.0, 36.0, 33.0, 38.0, 33.0, 31.0, 52.0, 38.0, 35.0, 48.0, 37.0, 38.0, 33.0, 48.0, 31.0, 40.0, 24.0, 25.0, 33.0, 15.0, 27.0, 18.0, 11.0, 15.0, 12.0, 7.0, 7.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.398822784423828e-05, -4.26415354013443e-05, -4.129484295845032e-05, -3.9948150515556335e-05, -3.8601458072662354e-05, -3.725476562976837e-05, -3.590807318687439e-05, -3.456138074398041e-05, -3.3214688301086426e-05, -3.1867995858192444e-05, -3.052130341529846e-05, -2.917461097240448e-05, -2.7827918529510498e-05, -2.6481226086616516e-05, -2.5134533643722534e-05, -2.3787841200828552e-05, -2.244114875793457e-05, -2.109445631504059e-05, -1.9747763872146606e-05, -1.8401071429252625e-05, -1.7054378986358643e-05, -1.570768654346466e-05, -1.4360994100570679e-05, -1.3014301657676697e-05, -1.1667609214782715e-05, -1.0320916771888733e-05, -8.974224328994751e-06, -7.627531886100769e-06, -6.280839443206787e-06, -4.934147000312805e-06, -3.5874545574188232e-06, -2.2407621145248413e-06, -8.940696716308594e-07, 4.5262277126312256e-07, 1.7993152141571045e-06, 3.1460076570510864e-06, 4.492700099945068e-06, 5.83939254283905e-06, 7.186084985733032e-06, 8.532777428627014e-06, 9.879469871520996e-06, 1.1226162314414978e-05, 1.257285475730896e-05, 1.3919547200202942e-05, 1.5266239643096924e-05, 1.6612932085990906e-05, 1.7959624528884888e-05, 1.930631697177887e-05, 2.065300941467285e-05, 2.1999701857566833e-05, 2.3346394300460815e-05, 2.4693086743354797e-05, 2.603977918624878e-05, 2.738647162914276e-05, 2.8733164072036743e-05, 3.0079856514930725e-05, 3.142654895782471e-05, 3.277324140071869e-05, 3.411993384361267e-05, 3.546662628650665e-05, 3.6813318729400635e-05, 3.816001117229462e-05, 3.95067036151886e-05, 4.085339605808258e-05, 4.220008850097656e-05]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 4.0, 6.0, 8.0, 8.0, 20.0, 28.0, 40.0, 63.0, 126.0, 197.0, 192.0, 517.0, 1107.0, 1229.0, 3914.0, 9801.0, 15552.0, 69007.0, 312387.0, 382002.0, 184299.0, 44506.0, 13908.0, 3863.0, 2959.0, 1255.0, 516.0, 437.0, 240.0, 91.0, 95.0, 66.0, 33.0, 21.0, 16.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.84660267829895e-06, -4.686415195465088e-06, -4.526227712631226e-06, -4.366040229797363e-06, -4.205852746963501e-06, -4.045665264129639e-06, -3.885477781295776e-06, -3.725290298461914e-06, -3.5651028156280518e-06, -3.4049153327941895e-06, -3.244727849960327e-06, -3.084540367126465e-06, -2.9243528842926025e-06, -2.7641654014587402e-06, -2.603977918624878e-06, -2.4437904357910156e-06, -2.2836029529571533e-06, -2.123415470123291e-06, -1.9632279872894287e-06, -1.8030405044555664e-06, -1.642853021621704e-06, -1.4826655387878418e-06, -1.3224780559539795e-06, -1.1622905731201172e-06, -1.0021030902862549e-06, -8.419156074523926e-07, -6.817281246185303e-07, -5.21540641784668e-07, -3.6135315895080566e-07, -2.0116567611694336e-07, -4.0978193283081055e-08, 1.1920928955078125e-07, 2.7939677238464355e-07, 4.3958425521850586e-07, 5.997717380523682e-07, 7.599592208862305e-07, 9.201467037200928e-07, 1.080334186553955e-06, 1.2405216693878174e-06, 1.4007091522216797e-06, 1.560896635055542e-06, 1.7210841178894043e-06, 1.8812716007232666e-06, 2.041459083557129e-06, 2.201646566390991e-06, 2.3618340492248535e-06, 2.522021532058716e-06, 2.682209014892578e-06, 2.8423964977264404e-06, 3.0025839805603027e-06, 3.162771463394165e-06, 3.3229589462280273e-06, 3.4831464290618896e-06, 3.643333911895752e-06, 3.8035213947296143e-06, 3.9637088775634766e-06, 4.123896360397339e-06, 4.284083843231201e-06, 4.4442713260650635e-06, 4.604458808898926e-06, 4.764646291732788e-06, 4.92483377456665e-06, 5.085021257400513e-06, 5.245208740234375e-06]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 8.0, 9.0, 0.0, 11.0, 10.0, 0.0, 13.0, 11.0, 0.0, 36.0, 43.0, 0.0, 36.0, 50.0, 0.0, 56.0, 55.0, 0.0, 60.0, 91.0, 0.0, 88.0, 60.0, 0.0, 60.0, 61.0, 0.0, 52.0, 36.0, 0.0, 35.0, 34.0, 0.0, 29.0, 20.0, 0.0, 21.0, 8.0, 0.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2116506695747375e-06, -1.171603798866272e-06, -1.1315569281578064e-06, -1.0915100574493408e-06, -1.0514631867408752e-06, -1.0114163160324097e-06, -9.71369445323944e-07, -9.313225746154785e-07, -8.912757039070129e-07, -8.512288331985474e-07, -8.111819624900818e-07, -7.711350917816162e-07, -7.310882210731506e-07, -6.910413503646851e-07, -6.509944796562195e-07, -6.109476089477539e-07, -5.709007382392883e-07, -5.308538675308228e-07, -4.908069968223572e-07, -4.507601261138916e-07, -4.10713255405426e-07, -3.7066638469696045e-07, -3.3061951398849487e-07, -2.905726432800293e-07, -2.505257725715637e-07, -2.1047890186309814e-07, -1.7043203115463257e-07, -1.30385160446167e-07, -9.033828973770142e-08, -5.029141902923584e-08, -1.0244548320770264e-08, 2.9802322387695312e-08, 6.984919309616089e-08, 1.0989606380462646e-07, 1.4994293451309204e-07, 1.8998980522155762e-07, 2.300366759300232e-07, 2.7008354663848877e-07, 3.1013041734695435e-07, 3.501772880554199e-07, 3.902241587638855e-07, 4.302710294723511e-07, 4.7031790018081665e-07, 5.103647708892822e-07, 5.504116415977478e-07, 5.904585123062134e-07, 6.30505383014679e-07, 6.705522537231445e-07, 7.105991244316101e-07, 7.506459951400757e-07, 7.906928658485413e-07, 8.307397365570068e-07, 8.707866072654724e-07, 9.10833477973938e-07, 9.508803486824036e-07, 9.909272193908691e-07, 1.0309740900993347e-06, 1.0710209608078003e-06, 1.1110678315162659e-06, 1.1511147022247314e-06, 1.191161572933197e-06, 1.2312084436416626e-06, 1.2712553143501282e-06, 1.3113021850585938e-06]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 12.0, 15.0, 33.0, 33.0, 56.0, 65.0, 186.0, 226.0, 560.0, 695.0, 2101.0, 2791.0, 5493.0, 22022.0, 43429.0, 311721.0, 446946.0, 161258.0, 27158.0, 14574.0, 3903.0, 2816.0, 916.0, 551.0, 478.0, 159.0, 148.0, 52.0, 64.0, 21.0, 27.0, 5.0, 10.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.304813385009766e-06, -5.1585957407951355e-06, -5.012378096580505e-06, -4.866160452365875e-06, -4.719942808151245e-06, -4.573725163936615e-06, -4.427507519721985e-06, -4.281289875507355e-06, -4.135072231292725e-06, -3.9888545870780945e-06, -3.842636942863464e-06, -3.6964192986488342e-06, -3.550201654434204e-06, -3.403984010219574e-06, -3.257766366004944e-06, -3.1115487217903137e-06, -2.9653310775756836e-06, -2.8191134333610535e-06, -2.6728957891464233e-06, -2.5266781449317932e-06, -2.380460500717163e-06, -2.234242856502533e-06, -2.088025212287903e-06, -1.9418075680732727e-06, -1.7955899238586426e-06, -1.6493722796440125e-06, -1.5031546354293823e-06, -1.3569369912147522e-06, -1.210719347000122e-06, -1.064501702785492e-06, -9.182840585708618e-07, -7.720664143562317e-07, -6.258487701416016e-07, -4.796311259269714e-07, -3.334134817123413e-07, -1.8719583749771118e-07, -4.0978193283081055e-08, 1.0523945093154907e-07, 2.514570951461792e-07, 3.976747393608093e-07, 5.438923835754395e-07, 6.901100277900696e-07, 8.363276720046997e-07, 9.825453162193298e-07, 1.12876296043396e-06, 1.27498060464859e-06, 1.4211982488632202e-06, 1.5674158930778503e-06, 1.7136335372924805e-06, 1.8598511815071106e-06, 2.0060688257217407e-06, 2.152286469936371e-06, 2.298504114151001e-06, 2.444721758365631e-06, 2.5909394025802612e-06, 2.7371570467948914e-06, 2.8833746910095215e-06, 3.0295923352241516e-06, 3.1758099794387817e-06, 3.322027623653412e-06, 3.468245267868042e-06, 3.614462912082672e-06, 3.7606805562973022e-06, 3.906898200511932e-06, 4.0531158447265625e-06]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 8.0, 11.0, 2.0, 14.0, 19.0, 12.0, 33.0, 18.0, 50.0, 66.0, 32.0, 93.0, 99.0, 44.0, 98.0, 90.0, 48.0, 58.0, 53.0, 20.0, 45.0, 28.0, 5.0, 14.0, 11.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6954879760742188e-06, -3.596767783164978e-06, -3.4980475902557373e-06, -3.3993273973464966e-06, -3.300607204437256e-06, -3.201887011528015e-06, -3.1031668186187744e-06, -3.0044466257095337e-06, -2.905726432800293e-06, -2.8070062398910522e-06, -2.7082860469818115e-06, -2.609565854072571e-06, -2.51084566116333e-06, -2.4121254682540894e-06, -2.3134052753448486e-06, -2.214685082435608e-06, -2.115964889526367e-06, -2.0172446966171265e-06, -1.9185245037078857e-06, -1.819804310798645e-06, -1.7210841178894043e-06, -1.6223639249801636e-06, -1.5236437320709229e-06, -1.4249235391616821e-06, -1.3262033462524414e-06, -1.2274831533432007e-06, -1.12876296043396e-06, -1.0300427675247192e-06, -9.313225746154785e-07, -8.326023817062378e-07, -7.338821887969971e-07, -6.351619958877563e-07, -5.364418029785156e-07, -4.377216100692749e-07, -3.390014171600342e-07, -2.4028122425079346e-07, -1.4156103134155273e-07, -4.284083843231201e-08, 5.587935447692871e-08, 1.5459954738616943e-07, 2.5331974029541016e-07, 3.520399332046509e-07, 4.507601261138916e-07, 5.494803190231323e-07, 6.48200511932373e-07, 7.469207048416138e-07, 8.456408977508545e-07, 9.443610906600952e-07, 1.043081283569336e-06, 1.1418014764785767e-06, 1.2405216693878174e-06, 1.339241862297058e-06, 1.4379620552062988e-06, 1.5366822481155396e-06, 1.6354024410247803e-06, 1.734122633934021e-06, 1.8328428268432617e-06, 1.9315630197525024e-06, 2.030283212661743e-06, 2.129003405570984e-06, 2.2277235984802246e-06, 2.3264437913894653e-06, 2.425163984298706e-06, 2.5238841772079468e-06, 2.6226043701171875e-06]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 5.0, 10.0, 7.0, 17.0, 36.0, 56.0, 104.0, 210.0, 204.0, 111.0, 72.0, 41.0, 26.0, 30.0, 27.0, 16.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001467356487410143, -0.00013755606778431684, -0.0001283765013795346, -0.00011919692042283714, -0.00011001734674209729, -0.00010083777306135744, -9.165819210465997e-05, -8.247861842392012e-05, -7.329904474318027e-05, -6.411947106244043e-05, -5.493989374372177e-05, -4.576031642500311e-05, -3.658074274426326e-05, -2.7401169063523412e-05, -1.8221591744804755e-05, -9.042014426086098e-06, 1.3755925465375185e-07, 9.317134754383005e-06, 1.849671025411226e-05, 2.7676285753841512e-05, 3.6855861253570765e-05, 4.6035434934310615e-05, 5.521501225302927e-05, 6.439458957174793e-05, 7.357416325248778e-05, 8.275373693322763e-05, 9.193331061396748e-05, 0.00010111289157066494, 0.00011029246525140479, 0.00011947203893214464, 0.0001286516198888421, 0.00013783120084553957, 0.00014701078180223703, 0.0001561903627589345, 0.00016536992916371673, 0.0001745495101204142, 0.00018372907652519643, 0.0001929086574818939, 0.00020208823843859136, 0.00021126781939528883, 0.00022044738580007106, 0.00022962696675676852, 0.00023880653316155076, 0.0002479861141182482, 0.0002571656950749457, 0.00026634527603164315, 0.00027552482788451016, 0.0002847044088412076, 0.0002938839897979051, 0.00030306357075460255, 0.0003122431517113, 0.000321422703564167, 0.0003306022845208645, 0.00033978186547756195, 0.0003489614464342594, 0.0003581410273909569, 0.00036732060834765434, 0.0003765001893043518, 0.00038567977026104927, 0.0003948593221139163, 0.00040403890307061374, 0.0004132184840273112, 0.00042239806498400867, 0.00043157764594070613, 0.00044075719779357314]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 7.0, 7.0, 12.0, 12.0, 18.0, 8.0, 26.0, 16.0, 22.0, 16.0, 26.0, 20.0, 26.0, 42.0, 39.0, 45.0, 37.0, 38.0, 38.0, 48.0, 35.0, 47.0, 44.0, 30.0, 34.0, 23.0, 24.0, 36.0, 22.0, 33.0, 26.0, 19.0, 15.0, 12.0, 15.0, 16.0, 14.0, 9.0, 12.0, 8.0, 4.0, 4.0, 0.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00011485815048217773, -0.00011129491031169891, -0.00010773167014122009, -0.00010416842997074127, -0.00010060518980026245, -9.704194962978363e-05, -9.347870945930481e-05, -8.991546928882599e-05, -8.635222911834717e-05, -8.278898894786835e-05, -7.922574877738953e-05, -7.56625086069107e-05, -7.209926843643188e-05, -6.853602826595306e-05, -6.497278809547424e-05, -6.140954792499542e-05, -5.78463077545166e-05, -5.428306758403778e-05, -5.071982741355896e-05, -4.715658724308014e-05, -4.359334707260132e-05, -4.00301069021225e-05, -3.646686673164368e-05, -3.2903626561164856e-05, -2.9340386390686035e-05, -2.5777146220207214e-05, -2.2213906049728394e-05, -1.8650665879249573e-05, -1.5087425708770752e-05, -1.1524185538291931e-05, -7.96094536781311e-06, -4.3977051973342896e-06, -8.344650268554688e-07, 2.728775143623352e-06, 6.292015314102173e-06, 9.855255484580994e-06, 1.3418495655059814e-05, 1.6981735825538635e-05, 2.0544975996017456e-05, 2.4108216166496277e-05, 2.7671456336975098e-05, 3.123469650745392e-05, 3.479793667793274e-05, 3.836117684841156e-05, 4.192441701889038e-05, 4.54876571893692e-05, 4.905089735984802e-05, 5.261413753032684e-05, 5.6177377700805664e-05, 5.9740617871284485e-05, 6.33038580417633e-05, 6.686709821224213e-05, 7.043033838272095e-05, 7.399357855319977e-05, 7.755681872367859e-05, 8.112005889415741e-05, 8.468329906463623e-05, 8.824653923511505e-05, 9.180977940559387e-05, 9.537301957607269e-05, 9.893625974655151e-05, 0.00010249949991703033, 0.00010606274008750916, 0.00010962598025798798, 0.0001131892204284668]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 3.0, 5.0, 11.0, 10.0, 13.0, 29.0, 39.0, 45.0, 75.0, 86.0, 146.0, 198.0, 340.0, 478.0, 730.0, 1246.0, 1980.0, 3570.0, 6160.0, 12771.0, 30712.0, 185655.0, 3769349.0, 130185.0, 25358.0, 10750.0, 5714.0, 3094.0, 1761.0, 1104.0, 773.0, 521.0, 351.0, 257.0, 167.0, 141.0, 119.0, 72.0, 53.0, 52.0, 35.0, 25.0, 22.0, 15.0, 19.0, 15.0, 8.0, 10.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.502866744995117e-05, -6.247404962778091e-05, -5.991943180561066e-05, -5.73648139834404e-05, -5.481019616127014e-05, -5.2255578339099884e-05, -4.9700960516929626e-05, -4.714634269475937e-05, -4.459172487258911e-05, -4.2037107050418854e-05, -3.9482489228248596e-05, -3.692787140607834e-05, -3.437325358390808e-05, -3.1818635761737823e-05, -2.9264017939567566e-05, -2.670940011739731e-05, -2.415478229522705e-05, -2.1600164473056793e-05, -1.9045546650886536e-05, -1.6490928828716278e-05, -1.393631100654602e-05, -1.1381693184375763e-05, -8.827075362205505e-06, -6.272457540035248e-06, -3.7178397178649902e-06, -1.1632218956947327e-06, 1.391395926475525e-06, 3.9460137486457825e-06, 6.50063157081604e-06, 9.055249392986298e-06, 1.1609867215156555e-05, 1.4164485037326813e-05, 1.671910285949707e-05, 1.9273720681667328e-05, 2.1828338503837585e-05, 2.4382956326007843e-05, 2.69375741481781e-05, 2.9492191970348358e-05, 3.2046809792518616e-05, 3.460142761468887e-05, 3.715604543685913e-05, 3.971066325902939e-05, 4.2265281081199646e-05, 4.4819898903369904e-05, 4.737451672554016e-05, 4.992913454771042e-05, 5.2483752369880676e-05, 5.5038370192050934e-05, 5.759298801422119e-05, 6.014760583639145e-05, 6.27022236585617e-05, 6.525684148073196e-05, 6.781145930290222e-05, 7.036607712507248e-05, 7.292069494724274e-05, 7.5475312769413e-05, 7.802993059158325e-05, 8.058454841375351e-05, 8.313916623592377e-05, 8.569378405809402e-05, 8.824840188026428e-05, 9.080301970243454e-05, 9.33576375246048e-05, 9.591225534677505e-05, 9.846687316894531e-05]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 14.0, 15.0, 23.0, 24.0, 41.0, 38.0, 51.0, 56.0, 43.0, 69.0, 65.0, 73.0, 74.0, 64.0, 45.0, 50.0, 51.0, 43.0, 29.0, 15.0, 16.0, 13.0, 7.0, 7.0, 9.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.6742385923862457e-05, -1.6080215573310852e-05, -1.5418045222759247e-05, -1.4755874872207642e-05, -1.4093704521656036e-05, -1.3431534171104431e-05, -1.2769363820552826e-05, -1.210719347000122e-05, -1.1445023119449615e-05, -1.078285276889801e-05, -1.0120682418346405e-05, -9.4585120677948e-06, -8.796341717243195e-06, -8.13417136669159e-06, -7.472001016139984e-06, -6.809830665588379e-06, -6.147660315036774e-06, -5.4854899644851685e-06, -4.823319613933563e-06, -4.161149263381958e-06, -3.4989789128303528e-06, -2.8368085622787476e-06, -2.1746382117271423e-06, -1.5124678611755371e-06, -8.502975106239319e-07, -1.8812716007232666e-07, 4.7404319047927856e-07, 1.1362135410308838e-06, 1.798383891582489e-06, 2.4605542421340942e-06, 3.1227245926856995e-06, 3.7848949432373047e-06, 4.44706529378891e-06, 5.109235644340515e-06, 5.77140599489212e-06, 6.433576345443726e-06, 7.095746695995331e-06, 7.757917046546936e-06, 8.420087397098541e-06, 9.082257747650146e-06, 9.744428098201752e-06, 1.0406598448753357e-05, 1.1068768799304962e-05, 1.1730939149856567e-05, 1.2393109500408173e-05, 1.3055279850959778e-05, 1.3717450201511383e-05, 1.4379620552062988e-05, 1.5041790902614594e-05, 1.57039612531662e-05, 1.6366131603717804e-05, 1.702830195426941e-05, 1.7690472304821014e-05, 1.835264265537262e-05, 1.9014813005924225e-05, 1.967698335647583e-05, 2.0339153707027435e-05, 2.100132405757904e-05, 2.1663494408130646e-05, 2.232566475868225e-05, 2.2987835109233856e-05, 2.365000545978546e-05, 2.4312175810337067e-05, 2.4974346160888672e-05]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 12.0, 12.0, 17.0, 33.0, 50.0, 87.0, 119.0, 224.0, 355.0, 646.0, 1203.0, 2436.0, 4618.0, 9614.0, 22546.0, 59825.0, 322518.0, 3529214.0, 165056.0, 42950.0, 17104.0, 7515.0, 3706.0, 1963.0, 1015.0, 622.0, 337.0, 183.0, 100.0, 73.0, 33.0, 25.0, 18.0, 11.0, 8.0, 9.0, 2.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.22868537902832e-05, -6.041955202817917e-05, -5.8552250266075134e-05, -5.66849485039711e-05, -5.4817646741867065e-05, -5.295034497976303e-05, -5.1083043217658997e-05, -4.921574145555496e-05, -4.734843969345093e-05, -4.548113793134689e-05, -4.361383616924286e-05, -4.1746534407138824e-05, -3.987923264503479e-05, -3.8011930882930756e-05, -3.614462912082672e-05, -3.427732735872269e-05, -3.241002559661865e-05, -3.054272383451462e-05, -2.8675422072410583e-05, -2.680812031030655e-05, -2.4940818548202515e-05, -2.307351678609848e-05, -2.1206215023994446e-05, -1.933891326189041e-05, -1.7471611499786377e-05, -1.5604309737682343e-05, -1.3737007975578308e-05, -1.1869706213474274e-05, -1.000240445137024e-05, -8.135102689266205e-06, -6.26780092716217e-06, -4.400499165058136e-06, -2.5331974029541016e-06, -6.658956408500671e-07, 1.2014061212539673e-06, 3.0687078833580017e-06, 4.936009645462036e-06, 6.8033114075660706e-06, 8.670613169670105e-06, 1.053791493177414e-05, 1.2405216693878174e-05, 1.4272518455982208e-05, 1.6139820218086243e-05, 1.8007121980190277e-05, 1.987442374229431e-05, 2.1741725504398346e-05, 2.360902726650238e-05, 2.5476329028606415e-05, 2.734363079071045e-05, 2.9210932552814484e-05, 3.107823431491852e-05, 3.294553607702255e-05, 3.481283783912659e-05, 3.668013960123062e-05, 3.8547441363334656e-05, 4.041474312543869e-05, 4.2282044887542725e-05, 4.414934664964676e-05, 4.6016648411750793e-05, 4.788395017385483e-05, 4.975125193595886e-05, 5.16185536980629e-05, 5.348585546016693e-05, 5.5353157222270966e-05, 5.7220458984375e-05]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 7.0, 5.0, 6.0, 12.0, 19.0, 19.0, 19.0, 21.0, 23.0, 45.0, 43.0, 52.0, 107.0, 261.0, 701.0, 1566.0, 579.0, 209.0, 113.0, 66.0, 47.0, 31.0, 24.0, 15.0, 16.0, 9.0, 14.0, 3.0, 6.0, 5.0, 1.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.589557647705078e-05, -4.460196942090988e-05, -4.330836236476898e-05, -4.201475530862808e-05, -4.072114825248718e-05, -3.942754119634628e-05, -3.813393414020538e-05, -3.6840327084064484e-05, -3.5546720027923584e-05, -3.4253112971782684e-05, -3.2959505915641785e-05, -3.1665898859500885e-05, -3.0372291803359985e-05, -2.9078684747219086e-05, -2.7785077691078186e-05, -2.6491470634937286e-05, -2.5197863578796387e-05, -2.3904256522655487e-05, -2.2610649466514587e-05, -2.1317042410373688e-05, -2.0023435354232788e-05, -1.872982829809189e-05, -1.743622124195099e-05, -1.614261418581009e-05, -1.484900712966919e-05, -1.355540007352829e-05, -1.226179301738739e-05, -1.096818596124649e-05, -9.67457890510559e-06, -8.380971848964691e-06, -7.0873647928237915e-06, -5.793757736682892e-06, -4.500150680541992e-06, -3.2065436244010925e-06, -1.912936568260193e-06, -6.193295121192932e-07, 6.742775440216064e-07, 1.967884600162506e-06, 3.2614916563034058e-06, 4.555098712444305e-06, 5.848705768585205e-06, 7.142312824726105e-06, 8.435919880867004e-06, 9.729526937007904e-06, 1.1023133993148804e-05, 1.2316741049289703e-05, 1.3610348105430603e-05, 1.4903955161571503e-05, 1.6197562217712402e-05, 1.7491169273853302e-05, 1.87847763299942e-05, 2.00783833861351e-05, 2.1371990442276e-05, 2.26655974984169e-05, 2.39592045545578e-05, 2.52528116106987e-05, 2.65464186668396e-05, 2.78400257229805e-05, 2.91336327791214e-05, 3.04272398352623e-05, 3.17208468914032e-05, 3.30144539475441e-05, 3.4308061003685e-05, 3.56016680598259e-05, 3.68952751159668e-05]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 5.0, 11.0, 8.0, 9.0, 9.0, 14.0, 9.0, 19.0, 22.0, 36.0, 40.0, 36.0, 57.0, 53.0, 81.0, 84.0, 79.0, 77.0, 62.0, 50.0, 30.0, 29.0, 35.0, 26.0, 25.0, 23.0, 8.0, 9.0, 9.0, 6.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00011356100731063634, -0.00010961868974845856, -0.00010567637218628079, -0.00010173405462410301, -9.779173706192523e-05, -9.384941949974746e-05, -8.990710921352729e-05, -8.596479165134951e-05, -8.202247408917174e-05, -7.808015652699396e-05, -7.413783896481618e-05, -7.01955214026384e-05, -6.625321111641824e-05, -6.231089355424047e-05, -5.836857599206269e-05, -5.442625842988491e-05, -5.048394086770713e-05, -4.6541623305529356e-05, -4.259930574335158e-05, -3.865699181915261e-05, -3.471467425697483e-05, -3.0772356694797054e-05, -2.683004095160868e-05, -2.2887725208420306e-05, -1.894540764624253e-05, -1.5003090993559454e-05, -1.1060774340876378e-05, -7.118457688193303e-06, -3.176141035510227e-06, 7.661765266675502e-07, 4.708492269855924e-06, 8.650808013044298e-06, 1.2593111023306847e-05, 1.6535428585484624e-05, 2.0477744328672998e-05, 2.442006007186137e-05, 2.836237763403915e-05, 3.2304695196216926e-05, 3.6247009120415896e-05, 4.0189326682593673e-05, 4.413164424477145e-05, 4.807396180694923e-05, 5.2016279369127005e-05, 5.5958593293325976e-05, 5.990091085550375e-05, 6.384322477970272e-05, 6.77855423418805e-05, 7.172785990405828e-05, 7.567017746623605e-05, 7.961249502841383e-05, 8.355481259059161e-05, 8.749713015276939e-05, 9.143944771494716e-05, 9.538176527712494e-05, 9.93240755633451e-05, 0.00010326639312552288, 0.00010720871068770066, 0.00011115102824987844, 0.00011509334581205621, 0.00011903566337423399, 0.00012297797366045415, 0.00012692029122263193, 0.0001308626087848097, 0.00013480492634698749, 0.00013874724390916526]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 6.0, 5.0, 7.0, 9.0, 11.0, 11.0, 20.0, 12.0, 19.0, 16.0, 18.0, 22.0, 39.0, 32.0, 28.0, 39.0, 29.0, 35.0, 34.0, 47.0, 39.0, 46.0, 59.0, 44.0, 44.0, 30.0, 42.0, 29.0, 26.0, 25.0, 24.0, 17.0, 27.0, 21.0, 8.0, 9.0, 11.0, 10.0, 12.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.191036224365234e-05, -8.89115035533905e-05, -8.591264486312866e-05, -8.291378617286682e-05, -7.991492748260498e-05, -7.691606879234314e-05, -7.39172101020813e-05, -7.091835141181946e-05, -6.791949272155762e-05, -6.492063403129578e-05, -6.192177534103394e-05, -5.8922916650772095e-05, -5.5924057960510254e-05, -5.292519927024841e-05, -4.992634057998657e-05, -4.692748188972473e-05, -4.392862319946289e-05, -4.092976450920105e-05, -3.793090581893921e-05, -3.493204712867737e-05, -3.193318843841553e-05, -2.8934329748153687e-05, -2.5935471057891846e-05, -2.2936612367630005e-05, -1.9937753677368164e-05, -1.6938894987106323e-05, -1.3940036296844482e-05, -1.0941177606582642e-05, -7.9423189163208e-06, -4.94346022605896e-06, -1.944601535797119e-06, 1.0542571544647217e-06, 4.0531158447265625e-06, 7.051974534988403e-06, 1.0050833225250244e-05, 1.3049691915512085e-05, 1.6048550605773926e-05, 1.9047409296035767e-05, 2.2046267986297607e-05, 2.5045126676559448e-05, 2.804398536682129e-05, 3.104284405708313e-05, 3.404170274734497e-05, 3.704056143760681e-05, 4.003942012786865e-05, 4.303827881813049e-05, 4.6037137508392334e-05, 4.9035996198654175e-05, 5.2034854888916016e-05, 5.5033713579177856e-05, 5.80325722694397e-05, 6.103143095970154e-05, 6.403028964996338e-05, 6.702914834022522e-05, 7.002800703048706e-05, 7.30268657207489e-05, 7.602572441101074e-05, 7.902458310127258e-05, 8.202344179153442e-05, 8.502230048179626e-05, 8.80211591720581e-05, 9.102001786231995e-05, 9.401887655258179e-05, 9.701773524284363e-05, 0.00010001659393310547]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 9.0, 7.0, 10.0, 8.0, 19.0, 19.0, 27.0, 34.0, 48.0, 58.0, 86.0, 137.0, 229.0, 438.0, 767.0, 1583.0, 3195.0, 6648.0, 15262.0, 41419.0, 151782.0, 589932.0, 163452.0, 43538.0, 16099.0, 6942.0, 3242.0, 1637.0, 806.0, 432.0, 239.0, 126.0, 81.0, 59.0, 40.0, 32.0, 27.0, 20.0, 16.0, 13.0, 7.0, 15.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014352798461914062, -0.00013866648077964783, -0.00013380497694015503, -0.00012894347310066223, -0.00012408196926116943, -0.00011922046542167664, -0.00011435896158218384, -0.00010949745774269104, -0.00010463595390319824, -9.977445006370544e-05, -9.491294622421265e-05, -9.005144238471985e-05, -8.518993854522705e-05, -8.032843470573425e-05, -7.546693086624146e-05, -7.060542702674866e-05, -6.574392318725586e-05, -6.088241934776306e-05, -5.6020915508270264e-05, -5.1159411668777466e-05, -4.629790782928467e-05, -4.143640398979187e-05, -3.657490015029907e-05, -3.1713396310806274e-05, -2.6851892471313477e-05, -2.199038863182068e-05, -1.712888479232788e-05, -1.2267380952835083e-05, -7.405877113342285e-06, -2.5443732738494873e-06, 2.3171305656433105e-06, 7.178634405136108e-06, 1.2040138244628906e-05, 1.6901642084121704e-05, 2.1763145923614502e-05, 2.66246497631073e-05, 3.14861536026001e-05, 3.6347657442092896e-05, 4.120916128158569e-05, 4.607066512107849e-05, 5.093216896057129e-05, 5.579367280006409e-05, 6.0655176639556885e-05, 6.551668047904968e-05, 7.037818431854248e-05, 7.523968815803528e-05, 8.010119199752808e-05, 8.496269583702087e-05, 8.982419967651367e-05, 9.468570351600647e-05, 9.954720735549927e-05, 0.00010440871119499207, 0.00010927021503448486, 0.00011413171887397766, 0.00011899322271347046, 0.00012385472655296326, 0.00012871623039245605, 0.00013357773423194885, 0.00013843923807144165, 0.00014330074191093445, 0.00014816224575042725, 0.00015302374958992004, 0.00015788525342941284, 0.00016274675726890564, 0.00016760826110839844]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 7.0, 8.0, 6.0, 12.0, 12.0, 15.0, 26.0, 13.0, 41.0, 63.0, 87.0, 80.0, 91.0, 92.0, 82.0, 90.0, 74.0, 51.0, 49.0, 28.0, 24.0, 10.0, 11.0, 8.0, 10.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8417835235595703e-05, -1.7561018466949463e-05, -1.6704201698303223e-05, -1.5847384929656982e-05, -1.4990568161010742e-05, -1.4133751392364502e-05, -1.3276934623718262e-05, -1.2420117855072021e-05, -1.1563301086425781e-05, -1.0706484317779541e-05, -9.8496675491333e-06, -8.99285078048706e-06, -8.13603401184082e-06, -7.27921724319458e-06, -6.42240047454834e-06, -5.5655837059021e-06, -4.708766937255859e-06, -3.851950168609619e-06, -2.995133399963379e-06, -2.1383166313171387e-06, -1.2814998626708984e-06, -4.246830940246582e-07, 4.3213367462158203e-07, 1.2889504432678223e-06, 2.1457672119140625e-06, 3.0025839805603027e-06, 3.859400749206543e-06, 4.716217517852783e-06, 5.5730342864990234e-06, 6.429851055145264e-06, 7.286667823791504e-06, 8.143484592437744e-06, 9.000301361083984e-06, 9.857118129730225e-06, 1.0713934898376465e-05, 1.1570751667022705e-05, 1.2427568435668945e-05, 1.3284385204315186e-05, 1.4141201972961426e-05, 1.4998018741607666e-05, 1.5854835510253906e-05, 1.6711652278900146e-05, 1.7568469047546387e-05, 1.8425285816192627e-05, 1.9282102584838867e-05, 2.0138919353485107e-05, 2.0995736122131348e-05, 2.1852552890777588e-05, 2.2709369659423828e-05, 2.356618642807007e-05, 2.442300319671631e-05, 2.527981996536255e-05, 2.613663673400879e-05, 2.699345350265503e-05, 2.785027027130127e-05, 2.870708703994751e-05, 2.956390380859375e-05, 3.042072057723999e-05, 3.127753734588623e-05, 3.213435411453247e-05, 3.299117088317871e-05, 3.384798765182495e-05, 3.470480442047119e-05, 3.556162118911743e-05, 3.641843795776367e-05]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 8.0, 7.0, 16.0, 17.0, 21.0, 24.0, 43.0, 71.0, 137.0, 201.0, 306.0, 546.0, 827.0, 1249.0, 2158.0, 3248.0, 5502.0, 8404.0, 15033.0, 23517.0, 43373.0, 78718.0, 196773.0, 380304.0, 138267.0, 62264.0, 35642.0, 19941.0, 12380.0, 7332.0, 4691.0, 2820.0, 1771.0, 1085.0, 698.0, 391.0, 242.0, 183.0, 134.0, 72.0, 38.0, 29.0, 20.0, 14.0, 13.0, 6.0, 3.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0], "bins": [-5.263090133666992e-05, -5.105137825012207e-05, -4.947185516357422e-05, -4.789233207702637e-05, -4.6312808990478516e-05, -4.4733285903930664e-05, -4.315376281738281e-05, -4.157423973083496e-05, -3.999471664428711e-05, -3.841519355773926e-05, -3.6835670471191406e-05, -3.5256147384643555e-05, -3.36766242980957e-05, -3.209710121154785e-05, -3.0517578125e-05, -2.893805503845215e-05, -2.7358531951904297e-05, -2.5779008865356445e-05, -2.4199485778808594e-05, -2.2619962692260742e-05, -2.104043960571289e-05, -1.946091651916504e-05, -1.7881393432617188e-05, -1.6301870346069336e-05, -1.4722347259521484e-05, -1.3142824172973633e-05, -1.1563301086425781e-05, -9.98377799987793e-06, -8.404254913330078e-06, -6.8247318267822266e-06, -5.245208740234375e-06, -3.6656856536865234e-06, -2.086162567138672e-06, -5.066394805908203e-07, 1.0728836059570312e-06, 2.652406692504883e-06, 4.231929779052734e-06, 5.811452865600586e-06, 7.3909759521484375e-06, 8.970499038696289e-06, 1.055002212524414e-05, 1.2129545211791992e-05, 1.3709068298339844e-05, 1.5288591384887695e-05, 1.6868114471435547e-05, 1.84476375579834e-05, 2.002716064453125e-05, 2.16066837310791e-05, 2.3186206817626953e-05, 2.4765729904174805e-05, 2.6345252990722656e-05, 2.7924776077270508e-05, 2.950429916381836e-05, 3.108382225036621e-05, 3.266334533691406e-05, 3.4242868423461914e-05, 3.5822391510009766e-05, 3.740191459655762e-05, 3.898143768310547e-05, 4.056096076965332e-05, 4.214048385620117e-05, 4.3720006942749023e-05, 4.5299530029296875e-05, 4.6879053115844727e-05, 4.845857620239258e-05]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 5.0, 14.0, 7.0, 6.0, 6.0, 11.0, 4.0, 15.0, 13.0, 24.0, 24.0, 24.0, 23.0, 21.0, 26.0, 30.0, 31.0, 33.0, 31.0, 32.0, 48.0, 46.0, 28.0, 38.0, 44.0, 36.0, 36.0, 31.0, 26.0, 34.0, 30.0, 27.0, 24.0, 22.0, 19.0, 13.0, 21.0, 23.0, 15.0, 10.0, 11.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-3.838539123535156e-05, -3.722682595252991e-05, -3.606826066970825e-05, -3.49096953868866e-05, -3.375113010406494e-05, -3.2592564821243286e-05, -3.143399953842163e-05, -3.0275434255599976e-05, -2.911686897277832e-05, -2.7958303689956665e-05, -2.679973840713501e-05, -2.5641173124313354e-05, -2.44826078414917e-05, -2.3324042558670044e-05, -2.216547727584839e-05, -2.1006911993026733e-05, -1.9848346710205078e-05, -1.8689781427383423e-05, -1.7531216144561768e-05, -1.6372650861740112e-05, -1.5214085578918457e-05, -1.4055520296096802e-05, -1.2896955013275146e-05, -1.1738389730453491e-05, -1.0579824447631836e-05, -9.42125916481018e-06, -8.262693881988525e-06, -7.10412859916687e-06, -5.945563316345215e-06, -4.7869980335235596e-06, -3.6284327507019043e-06, -2.469867467880249e-06, -1.3113021850585938e-06, -1.5273690223693848e-07, 1.0058283805847168e-06, 2.164393663406372e-06, 3.3229589462280273e-06, 4.481524229049683e-06, 5.640089511871338e-06, 6.798654794692993e-06, 7.957220077514648e-06, 9.115785360336304e-06, 1.0274350643157959e-05, 1.1432915925979614e-05, 1.259148120880127e-05, 1.3750046491622925e-05, 1.490861177444458e-05, 1.6067177057266235e-05, 1.722574234008789e-05, 1.8384307622909546e-05, 1.95428729057312e-05, 2.0701438188552856e-05, 2.1860003471374512e-05, 2.3018568754196167e-05, 2.4177134037017822e-05, 2.5335699319839478e-05, 2.6494264602661133e-05, 2.7652829885482788e-05, 2.8811395168304443e-05, 2.99699604511261e-05, 3.1128525733947754e-05, 3.228709101676941e-05, 3.3445656299591064e-05, 3.460422158241272e-05, 3.5762786865234375e-05]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 9.0, 8.0, 17.0, 27.0, 31.0, 36.0, 66.0, 118.0, 126.0, 200.0, 343.0, 485.0, 789.0, 1261.0, 2183.0, 3905.0, 7770.0, 16145.0, 36829.0, 92493.0, 255624.0, 371746.0, 153008.0, 57380.0, 23915.0, 11036.0, 5499.0, 2923.0, 1685.0, 1008.0, 663.0, 400.0, 255.0, 158.0, 89.0, 78.0, 73.0, 36.0, 34.0, 21.0, 20.0, 12.0, 3.0, 4.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.5762786865234375e-06, -3.4570693969726562e-06, -3.337860107421875e-06, -3.2186508178710938e-06, -3.0994415283203125e-06, -2.9802322387695312e-06, -2.86102294921875e-06, -2.7418136596679688e-06, -2.6226043701171875e-06, -2.5033950805664062e-06, -2.384185791015625e-06, -2.2649765014648438e-06, -2.1457672119140625e-06, -2.0265579223632812e-06, -1.9073486328125e-06, -1.7881393432617188e-06, -1.6689300537109375e-06, -1.5497207641601562e-06, -1.430511474609375e-06, -1.3113021850585938e-06, -1.1920928955078125e-06, -1.0728836059570312e-06, -9.5367431640625e-07, -8.344650268554688e-07, -7.152557373046875e-07, -5.960464477539062e-07, -4.76837158203125e-07, -3.5762786865234375e-07, -2.384185791015625e-07, -1.1920928955078125e-07, 0.0, 1.1920928955078125e-07, 2.384185791015625e-07, 3.5762786865234375e-07, 4.76837158203125e-07, 5.960464477539062e-07, 7.152557373046875e-07, 8.344650268554688e-07, 9.5367431640625e-07, 1.0728836059570312e-06, 1.1920928955078125e-06, 1.3113021850585938e-06, 1.430511474609375e-06, 1.5497207641601562e-06, 1.6689300537109375e-06, 1.7881393432617188e-06, 1.9073486328125e-06, 2.0265579223632812e-06, 2.1457672119140625e-06, 2.2649765014648438e-06, 2.384185791015625e-06, 2.5033950805664062e-06, 2.6226043701171875e-06, 2.7418136596679688e-06, 2.86102294921875e-06, 2.9802322387695312e-06, 3.0994415283203125e-06, 3.2186508178710938e-06, 3.337860107421875e-06, 3.4570693969726562e-06, 3.5762786865234375e-06, 3.6954879760742188e-06, 3.814697265625e-06, 3.933906555175781e-06]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 11.0, 11.0, 9.0, 0.0, 29.0, 34.0, 37.0, 43.0, 0.0, 59.0, 57.0, 72.0, 80.0, 0.0, 74.0, 71.0, 71.0, 73.0, 59.0, 0.0, 50.0, 46.0, 34.0, 26.0, 0.0, 17.0, 10.0, 8.0, 3.0, 0.0, 9.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5012919902801514e-06, -1.4528632164001465e-06, -1.4044344425201416e-06, -1.3560056686401367e-06, -1.3075768947601318e-06, -1.259148120880127e-06, -1.210719347000122e-06, -1.1622905731201172e-06, -1.1138617992401123e-06, -1.0654330253601074e-06, -1.0170042514801025e-06, -9.685754776000977e-07, -9.201467037200928e-07, -8.717179298400879e-07, -8.23289155960083e-07, -7.748603820800781e-07, -7.264316082000732e-07, -6.780028343200684e-07, -6.295740604400635e-07, -5.811452865600586e-07, -5.327165126800537e-07, -4.842877388000488e-07, -4.3585896492004395e-07, -3.8743019104003906e-07, -3.390014171600342e-07, -2.905726432800293e-07, -2.421438694000244e-07, -1.9371509552001953e-07, -1.4528632164001465e-07, -9.685754776000977e-08, -4.842877388000488e-08, 0.0, 4.842877388000488e-08, 9.685754776000977e-08, 1.4528632164001465e-07, 1.9371509552001953e-07, 2.421438694000244e-07, 2.905726432800293e-07, 3.390014171600342e-07, 3.8743019104003906e-07, 4.3585896492004395e-07, 4.842877388000488e-07, 5.327165126800537e-07, 5.811452865600586e-07, 6.295740604400635e-07, 6.780028343200684e-07, 7.264316082000732e-07, 7.748603820800781e-07, 8.23289155960083e-07, 8.717179298400879e-07, 9.201467037200928e-07, 9.685754776000977e-07, 1.0170042514801025e-06, 1.0654330253601074e-06, 1.1138617992401123e-06, 1.1622905731201172e-06, 1.210719347000122e-06, 1.259148120880127e-06, 1.3075768947601318e-06, 1.3560056686401367e-06, 1.4044344425201416e-06, 1.4528632164001465e-06, 1.5012919902801514e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 14.0, 5.0, 23.0, 23.0, 61.0, 48.0, 135.0, 86.0, 127.0, 412.0, 342.0, 1107.0, 991.0, 3295.0, 2831.0, 10752.0, 9959.0, 41843.0, 45831.0, 266861.0, 278634.0, 267230.0, 45842.0, 26269.0, 25717.0, 6346.0, 7036.0, 1958.0, 2306.0, 688.0, 822.0, 243.0, 302.0, 102.0, 144.0, 40.0, 59.0, 18.0, 25.0, 5.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4158507585525513e-06, -2.3283064365386963e-06, -2.2407621145248413e-06, -2.1532177925109863e-06, -2.0656734704971313e-06, -1.9781291484832764e-06, -1.8905848264694214e-06, -1.8030405044555664e-06, -1.7154961824417114e-06, -1.6279518604278564e-06, -1.5404075384140015e-06, -1.4528632164001465e-06, -1.3653188943862915e-06, -1.2777745723724365e-06, -1.1902302503585815e-06, -1.1026859283447266e-06, -1.0151416063308716e-06, -9.275972843170166e-07, -8.400529623031616e-07, -7.525086402893066e-07, -6.649643182754517e-07, -5.774199962615967e-07, -4.898756742477417e-07, -4.023313522338867e-07, -3.1478703022003174e-07, -2.2724270820617676e-07, -1.3969838619232178e-07, -5.21540641784668e-08, 3.5390257835388184e-08, 1.2293457984924316e-07, 2.1047890186309814e-07, 2.980232238769531e-07, 3.855675458908081e-07, 4.731118679046631e-07, 5.606561899185181e-07, 6.48200511932373e-07, 7.35744833946228e-07, 8.23289155960083e-07, 9.10833477973938e-07, 9.98377799987793e-07, 1.085922122001648e-06, 1.173466444015503e-06, 1.261010766029358e-06, 1.3485550880432129e-06, 1.4360994100570679e-06, 1.5236437320709229e-06, 1.6111880540847778e-06, 1.6987323760986328e-06, 1.7862766981124878e-06, 1.8738210201263428e-06, 1.9613653421401978e-06, 2.0489096641540527e-06, 2.1364539861679077e-06, 2.2239983081817627e-06, 2.3115426301956177e-06, 2.3990869522094727e-06, 2.4866312742233276e-06, 2.5741755962371826e-06, 2.6617199182510376e-06, 2.7492642402648926e-06, 2.8368085622787476e-06, 2.9243528842926025e-06, 3.0118972063064575e-06, 3.0994415283203125e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 8.0, 4.0, 10.0, 5.0, 12.0, 8.0, 13.0, 40.0, 21.0, 25.0, 32.0, 26.0, 28.0, 95.0, 50.0, 45.0, 45.0, 52.0, 57.0, 53.0, 98.0, 43.0, 40.0, 34.0, 30.0, 20.0, 37.0, 12.0, 15.0, 4.0, 9.0, 8.0, 13.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.957640051841736e-06, -1.8887221813201904e-06, -1.819804310798645e-06, -1.7508864402770996e-06, -1.6819685697555542e-06, -1.6130506992340088e-06, -1.5441328287124634e-06, -1.475214958190918e-06, -1.4062970876693726e-06, -1.3373792171478271e-06, -1.2684613466262817e-06, -1.1995434761047363e-06, -1.130625605583191e-06, -1.0617077350616455e-06, -9.927898645401e-07, -9.238719940185547e-07, -8.549541234970093e-07, -7.860362529754639e-07, -7.171183824539185e-07, -6.48200511932373e-07, -5.792826414108276e-07, -5.103647708892822e-07, -4.414469003677368e-07, -3.725290298461914e-07, -3.03611159324646e-07, -2.3469328880310059e-07, -1.6577541828155518e-07, -9.685754776000977e-08, -2.7939677238464355e-08, 4.0978193283081055e-08, 1.0989606380462646e-07, 1.7881393432617188e-07, 2.477318048477173e-07, 3.166496753692627e-07, 3.855675458908081e-07, 4.544854164123535e-07, 5.234032869338989e-07, 5.923211574554443e-07, 6.612390279769897e-07, 7.301568984985352e-07, 7.990747690200806e-07, 8.67992639541626e-07, 9.369105100631714e-07, 1.0058283805847168e-06, 1.0747462511062622e-06, 1.1436641216278076e-06, 1.212581992149353e-06, 1.2814998626708984e-06, 1.3504177331924438e-06, 1.4193356037139893e-06, 1.4882534742355347e-06, 1.55717134475708e-06, 1.6260892152786255e-06, 1.695007085800171e-06, 1.7639249563217163e-06, 1.8328428268432617e-06, 1.9017606973648071e-06, 1.9706785678863525e-06, 2.039596438407898e-06, 2.1085143089294434e-06, 2.1774321794509888e-06, 2.246350049972534e-06, 2.3152679204940796e-06, 2.384185791015625e-06]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 9.0, 9.0, 7.0, 12.0, 13.0, 18.0, 29.0, 29.0, 63.0, 77.0, 141.0, 204.0, 129.0, 53.0, 55.0, 38.0, 25.0, 23.0, 16.0, 10.0, 9.0, 1.0, 2.0, 6.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020673137623816729, -0.00020037242211401463, -0.00019401346798986197, -0.00018765452841762453, -0.00018129557429347187, -0.0001749366201693192, -0.00016857768059708178, -0.00016221872647292912, -0.00015585977234877646, -0.0001495008182246238, -0.00014314186410047114, -0.0001367829245282337, -0.00013042397040408105, -0.00012406501627992839, -0.00011770606943173334, -0.0001113471225835383, -0.00010498816845938563, -9.862921433523297e-05, -9.227026748703793e-05, -8.591132063884288e-05, -7.955236651469022e-05, -7.319341239053756e-05, -6.683446554234251e-05, -6.047551505616866e-05, -5.411656456999481e-05, -4.7757614083820954e-05, -4.13986635976471e-05, -3.503971311147325e-05, -2.8680762625299394e-05, -2.232181213912554e-05, -1.5962861652951688e-05, -9.603911166777834e-06, -3.2449752325192094e-06, 3.113975253654644e-06, 9.472925739828497e-06, 1.583187622600235e-05, 2.2190826712176204e-05, 2.8549777198350057e-05, 3.490872768452391e-05, 4.1267678170697764e-05, 4.762662865687162e-05, 5.398557914304547e-05, 6.0344529629219323e-05, 6.670347647741437e-05, 7.306243060156703e-05, 7.942138472571969e-05, 8.578033157391474e-05, 9.213927842210978e-05, 9.849823254626244e-05, 0.0001048571866704151, 0.00011121613351861015, 0.0001175750803668052, 0.00012393403449095786, 0.00013029298861511052, 0.00013665194273926318, 0.0001430108823115006, 0.00014936983643565327, 0.00015572879055980593, 0.00016208773013204336, 0.00016844668425619602, 0.00017480563838034868, 0.00018116459250450134, 0.000187523546628654, 0.00019388248620089144, 0.0002002414403250441]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 11.0, 10.0, 8.0, 14.0, 18.0, 22.0, 18.0, 34.0, 19.0, 36.0, 34.0, 41.0, 45.0, 40.0, 43.0, 56.0, 42.0, 41.0, 37.0, 56.0, 36.0, 38.0, 36.0, 35.0, 29.0, 33.0, 22.0, 19.0, 26.0, 19.0, 17.0, 9.0, 6.0, 9.0, 6.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011271238327026367, -0.00010895729064941406, -0.00010520219802856445, -0.00010144710540771484, -9.769201278686523e-05, -9.393692016601562e-05, -9.018182754516602e-05, -8.64267349243164e-05, -8.26716423034668e-05, -7.891654968261719e-05, -7.516145706176758e-05, -7.140636444091797e-05, -6.765127182006836e-05, -6.389617919921875e-05, -6.014108657836914e-05, -5.638599395751953e-05, -5.263090133666992e-05, -4.887580871582031e-05, -4.51207160949707e-05, -4.1365623474121094e-05, -3.7610530853271484e-05, -3.3855438232421875e-05, -3.0100345611572266e-05, -2.6345252990722656e-05, -2.2590160369873047e-05, -1.8835067749023438e-05, -1.5079975128173828e-05, -1.1324882507324219e-05, -7.569789886474609e-06, -3.814697265625e-06, -5.960464477539063e-08, 3.6954879760742188e-06, 7.450580596923828e-06, 1.1205673217773438e-05, 1.4960765838623047e-05, 1.8715858459472656e-05, 2.2470951080322266e-05, 2.6226043701171875e-05, 2.9981136322021484e-05, 3.3736228942871094e-05, 3.74913215637207e-05, 4.124641418457031e-05, 4.500150680541992e-05, 4.875659942626953e-05, 5.251169204711914e-05, 5.626678466796875e-05, 6.002187728881836e-05, 6.377696990966797e-05, 6.753206253051758e-05, 7.128715515136719e-05, 7.50422477722168e-05, 7.87973403930664e-05, 8.255243301391602e-05, 8.630752563476562e-05, 9.006261825561523e-05, 9.381771087646484e-05, 9.757280349731445e-05, 0.00010132789611816406, 0.00010508298873901367, 0.00010883808135986328, 0.00011259317398071289, 0.0001163482666015625, 0.00012010335922241211, 0.00012385845184326172, 0.00012761354446411133]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 6.0, 19.0, 21.0, 20.0, 43.0, 52.0, 89.0, 152.0, 209.0, 362.0, 677.0, 1259.0, 2345.0, 5087.0, 12608.0, 42236.0, 3278850.0, 800253.0, 29863.0, 10534.0, 4310.0, 2107.0, 1177.0, 700.0, 383.0, 259.0, 148.0, 119.0, 84.0, 61.0, 48.0, 47.0, 30.0, 26.0, 17.0, 13.0, 12.0, 13.0, 10.0, 3.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.369850158691406e-05, -8.977949619293213e-05, -8.58604907989502e-05, -8.194148540496826e-05, -7.802248001098633e-05, -7.41034746170044e-05, -7.018446922302246e-05, -6.626546382904053e-05, -6.23464584350586e-05, -5.842745304107666e-05, -5.4508447647094727e-05, -5.058944225311279e-05, -4.667043685913086e-05, -4.2751431465148926e-05, -3.883242607116699e-05, -3.491342067718506e-05, -3.0994415283203125e-05, -2.707540988922119e-05, -2.3156404495239258e-05, -1.9237399101257324e-05, -1.531839370727539e-05, -1.1399388313293457e-05, -7.4803829193115234e-06, -3.56137752532959e-06, 3.5762786865234375e-07, 4.276633262634277e-06, 8.195638656616211e-06, 1.2114644050598145e-05, 1.6033649444580078e-05, 1.9952654838562012e-05, 2.3871660232543945e-05, 2.779066562652588e-05, 3.170967102050781e-05, 3.5628676414489746e-05, 3.954768180847168e-05, 4.346668720245361e-05, 4.738569259643555e-05, 5.130469799041748e-05, 5.5223703384399414e-05, 5.914270877838135e-05, 6.306171417236328e-05, 6.698071956634521e-05, 7.089972496032715e-05, 7.481873035430908e-05, 7.873773574829102e-05, 8.265674114227295e-05, 8.657574653625488e-05, 9.049475193023682e-05, 9.441375732421875e-05, 9.833276271820068e-05, 0.00010225176811218262, 0.00010617077350616455, 0.00011008977890014648, 0.00011400878429412842, 0.00011792778968811035, 0.00012184679508209229, 0.00012576580047607422, 0.00012968480587005615, 0.00013360381126403809, 0.00013752281665802002, 0.00014144182205200195, 0.0001453608274459839, 0.00014927983283996582, 0.00015319883823394775, 0.0001571178436279297]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 7.0, 15.0, 12.0, 21.0, 44.0, 42.0, 57.0, 86.0, 83.0, 115.0, 108.0, 82.0, 74.0, 63.0, 49.0, 42.0, 31.0, 14.0, 14.0, 11.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.036057412624359e-05, -1.944229006767273e-05, -1.8524006009101868e-05, -1.7605721950531006e-05, -1.6687437891960144e-05, -1.5769153833389282e-05, -1.485086977481842e-05, -1.3932585716247559e-05, -1.3014301657676697e-05, -1.2096017599105835e-05, -1.1177733540534973e-05, -1.0259449481964111e-05, -9.34116542339325e-06, -8.422881364822388e-06, -7.504597306251526e-06, -6.586313247680664e-06, -5.668029189109802e-06, -4.7497451305389404e-06, -3.831461071968079e-06, -2.913177013397217e-06, -1.994892954826355e-06, -1.0766088962554932e-06, -1.5832483768463135e-07, 7.599592208862305e-07, 1.6782432794570923e-06, 2.596527338027954e-06, 3.514811396598816e-06, 4.433095455169678e-06, 5.3513795137405396e-06, 6.269663572311401e-06, 7.187947630882263e-06, 8.106231689453125e-06, 9.024515748023987e-06, 9.942799806594849e-06, 1.086108386516571e-05, 1.1779367923736572e-05, 1.2697651982307434e-05, 1.3615936040878296e-05, 1.4534220099449158e-05, 1.545250415802002e-05, 1.637078821659088e-05, 1.7289072275161743e-05, 1.8207356333732605e-05, 1.9125640392303467e-05, 2.004392445087433e-05, 2.096220850944519e-05, 2.1880492568016052e-05, 2.2798776626586914e-05, 2.3717060685157776e-05, 2.4635344743728638e-05, 2.55536288022995e-05, 2.647191286087036e-05, 2.7390196919441223e-05, 2.8308480978012085e-05, 2.9226765036582947e-05, 3.014504909515381e-05, 3.106333315372467e-05, 3.198161721229553e-05, 3.2899901270866394e-05, 3.3818185329437256e-05, 3.473646938800812e-05, 3.565475344657898e-05, 3.657303750514984e-05, 3.74913215637207e-05]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 6.0, 10.0, 16.0, 35.0, 45.0, 64.0, 100.0, 160.0, 231.0, 388.0, 617.0, 1010.0, 1607.0, 2555.0, 4354.0, 7766.0, 15435.0, 30880.0, 79806.0, 566669.0, 3246876.0, 145360.0, 45713.0, 19909.0, 10244.0, 5893.0, 3279.0, 1927.0, 1219.0, 719.0, 495.0, 314.0, 196.0, 138.0, 83.0, 57.0, 42.0, 25.0, 14.0, 11.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.369020462036133e-05, -4.2195431888103485e-05, -4.070065915584564e-05, -3.92058864235878e-05, -3.7711113691329956e-05, -3.621634095907211e-05, -3.472156822681427e-05, -3.322679549455643e-05, -3.1732022762298584e-05, -3.023725003004074e-05, -2.8742477297782898e-05, -2.7247704565525055e-05, -2.5752931833267212e-05, -2.425815910100937e-05, -2.2763386368751526e-05, -2.1268613636493683e-05, -1.977384090423584e-05, -1.8279068171977997e-05, -1.6784295439720154e-05, -1.528952270746231e-05, -1.3794749975204468e-05, -1.2299977242946625e-05, -1.0805204510688782e-05, -9.310431778430939e-06, -7.815659046173096e-06, -6.320886313915253e-06, -4.82611358165741e-06, -3.3313408493995667e-06, -1.8365681171417236e-06, -3.417953848838806e-07, 1.1529773473739624e-06, 2.6477500796318054e-06, 4.1425228118896484e-06, 5.6372955441474915e-06, 7.1320682764053345e-06, 8.626841008663177e-06, 1.012161374092102e-05, 1.1616386473178864e-05, 1.3111159205436707e-05, 1.460593193769455e-05, 1.6100704669952393e-05, 1.7595477402210236e-05, 1.909025013446808e-05, 2.058502286672592e-05, 2.2079795598983765e-05, 2.3574568331241608e-05, 2.506934106349945e-05, 2.6564113795757294e-05, 2.8058886528015137e-05, 2.955365926027298e-05, 3.104843199253082e-05, 3.2543204724788666e-05, 3.403797745704651e-05, 3.553275018930435e-05, 3.7027522921562195e-05, 3.852229565382004e-05, 4.001706838607788e-05, 4.1511841118335724e-05, 4.300661385059357e-05, 4.450138658285141e-05, 4.599615931510925e-05, 4.7490932047367096e-05, 4.898570477962494e-05, 5.048047751188278e-05, 5.1975250244140625e-05]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 9.0, 8.0, 4.0, 15.0, 13.0, 23.0, 22.0, 23.0, 23.0, 47.0, 47.0, 75.0, 169.0, 414.0, 1376.0, 980.0, 377.0, 125.0, 66.0, 49.0, 48.0, 26.0, 16.0, 12.0, 14.0, 12.0, 15.0, 13.0, 8.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.62396240234375e-05, -3.506802022457123e-05, -3.3896416425704956e-05, -3.2724812626838684e-05, -3.155320882797241e-05, -3.038160502910614e-05, -2.9210001230239868e-05, -2.8038397431373596e-05, -2.6866793632507324e-05, -2.5695189833641052e-05, -2.452358603477478e-05, -2.3351982235908508e-05, -2.2180378437042236e-05, -2.1008774638175964e-05, -1.9837170839309692e-05, -1.866556704044342e-05, -1.749396324157715e-05, -1.6322359442710876e-05, -1.5150755643844604e-05, -1.3979151844978333e-05, -1.280754804611206e-05, -1.1635944247245789e-05, -1.0464340448379517e-05, -9.292736649513245e-06, -8.121132850646973e-06, -6.949529051780701e-06, -5.777925252914429e-06, -4.606321454048157e-06, -3.4347176551818848e-06, -2.263113856315613e-06, -1.0915100574493408e-06, 8.009374141693115e-08, 1.2516975402832031e-06, 2.423301339149475e-06, 3.594905138015747e-06, 4.766508936882019e-06, 5.938112735748291e-06, 7.109716534614563e-06, 8.281320333480835e-06, 9.452924132347107e-06, 1.0624527931213379e-05, 1.1796131730079651e-05, 1.2967735528945923e-05, 1.4139339327812195e-05, 1.5310943126678467e-05, 1.648254692554474e-05, 1.765415072441101e-05, 1.8825754523277283e-05, 1.9997358322143555e-05, 2.1168962121009827e-05, 2.23405659198761e-05, 2.351216971874237e-05, 2.4683773517608643e-05, 2.5855377316474915e-05, 2.7026981115341187e-05, 2.819858491420746e-05, 2.937018871307373e-05, 3.054179251194e-05, 3.1713396310806274e-05, 3.2885000109672546e-05, 3.405660390853882e-05, 3.522820770740509e-05, 3.639981150627136e-05, 3.7571415305137634e-05, 3.8743019104003906e-05]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 6.0, 20.0, 17.0, 32.0, 42.0, 72.0, 117.0, 191.0, 145.0, 127.0, 89.0, 40.0, 27.0, 20.0, 12.0, 10.0, 10.0, 10.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003345058939885348, -0.0003263711405452341, -0.0003182364162057638, -0.0003101016627624631, -0.00030196690931916237, -0.00029383215587586164, -0.0002856974024325609, -0.00027756267809309065, -0.00026942792464978993, -0.0002612931712064892, -0.00025315844686701894, -0.0002450236934237182, -0.0002368889399804175, -0.00022875418653711677, -0.00022061944764573127, -0.00021248470875434577, -0.00020434995531104505, -0.00019621520186774433, -0.00018808046297635883, -0.00017994572408497334, -0.0001718109706416726, -0.0001636762171983719, -0.0001555414783069864, -0.0001474067394156009, -0.00013927198597230017, -0.00013113723252899945, -0.00012300249363761395, -0.00011486774747027084, -0.00010673300130292773, -9.859825513558462e-05, -9.046350896824151e-05, -8.23287628008984e-05, -7.419400208164006e-05, -6.605925591429695e-05, -5.7924509746953845e-05, -4.9789763579610735e-05, -4.1655017412267625e-05, -3.3520271244924515e-05, -2.5385525077581406e-05, -1.7250778910238296e-05, -9.116032742895186e-06, -9.81286575552076e-07, 7.153459591791034e-06, 1.5288205759134144e-05, 2.3422951926477253e-05, 3.155769809382036e-05, 3.969244426116347e-05, 4.782719042850658e-05, 5.596193659584969e-05, 6.40966827631928e-05, 7.223142893053591e-05, 8.036617509787902e-05, 8.850092126522213e-05, 9.663566743256524e-05, 0.00010477041359990835, 0.00011290515976725146, 0.00012103990593459457, 0.00012917464482598007, 0.0001373093982692808, 0.00014544415171258152, 0.000153578890603967, 0.0001617136294953525, 0.00016984838293865323, 0.00017798313638195395, 0.00018611787527333945]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 8.0, 7.0, 6.0, 15.0, 10.0, 13.0, 18.0, 23.0, 23.0, 21.0, 25.0, 33.0, 25.0, 41.0, 37.0, 42.0, 49.0, 42.0, 45.0, 51.0, 41.0, 58.0, 34.0, 36.0, 44.0, 38.0, 30.0, 30.0, 27.0, 24.0, 20.0, 18.0, 6.0, 12.0, 6.0, 7.0, 13.0, 4.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010246038436889648, -9.93506982922554e-05, -9.624101221561432e-05, -9.313132613897324e-05, -9.002164006233215e-05, -8.691195398569107e-05, -8.380226790904999e-05, -8.06925818324089e-05, -7.758289575576782e-05, -7.447320967912674e-05, -7.136352360248566e-05, -6.825383752584457e-05, -6.514415144920349e-05, -6.203446537256241e-05, -5.8924779295921326e-05, -5.581509321928024e-05, -5.270540714263916e-05, -4.959572106599808e-05, -4.6486034989356995e-05, -4.337634891271591e-05, -4.026666283607483e-05, -3.7156976759433746e-05, -3.4047290682792664e-05, -3.093760460615158e-05, -2.7827918529510498e-05, -2.4718232452869415e-05, -2.1608546376228333e-05, -1.849886029958725e-05, -1.5389174222946167e-05, -1.2279488146305084e-05, -9.169802069664001e-06, -6.060115993022919e-06, -2.950429916381836e-06, 1.5925616025924683e-07, 3.2689422369003296e-06, 6.378628313541412e-06, 9.488314390182495e-06, 1.2598000466823578e-05, 1.570768654346466e-05, 1.8817372620105743e-05, 2.1927058696746826e-05, 2.503674477338791e-05, 2.8146430850028992e-05, 3.1256116926670074e-05, 3.436580300331116e-05, 3.747548907995224e-05, 4.058517515659332e-05, 4.3694861233234406e-05, 4.680454730987549e-05, 4.991423338651657e-05, 5.3023919463157654e-05, 5.6133605539798737e-05, 5.924329161643982e-05, 6.23529776930809e-05, 6.546266376972198e-05, 6.857234984636307e-05, 7.168203592300415e-05, 7.479172199964523e-05, 7.790140807628632e-05, 8.10110941529274e-05, 8.412078022956848e-05, 8.723046630620956e-05, 9.034015238285065e-05, 9.344983845949173e-05, 9.655952453613281e-05]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 16.0, 2.0, 5.0, 9.0, 8.0, 16.0, 14.0, 24.0, 27.0, 27.0, 54.0, 66.0, 105.0, 250.0, 511.0, 1234.0, 3266.0, 10115.0, 39167.0, 251961.0, 647903.0, 69648.0, 15999.0, 4871.0, 1726.0, 758.0, 308.0, 155.0, 60.0, 50.0, 29.0, 32.0, 25.0, 22.0, 10.0, 10.0, 13.0, 11.0, 5.0, 8.0, 11.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0002570152282714844, -0.00024970993399620056, -0.00024240463972091675, -0.00023509934544563293, -0.00022779405117034912, -0.0002204887568950653, -0.0002131834626197815, -0.00020587816834449768, -0.00019857287406921387, -0.00019126757979393005, -0.00018396228551864624, -0.00017665699124336243, -0.0001693516969680786, -0.0001620464026927948, -0.00015474110841751099, -0.00014743581414222717, -0.00014013051986694336, -0.00013282522559165955, -0.00012551993131637573, -0.00011821463704109192, -0.0001109093427658081, -0.00010360404849052429, -9.629875421524048e-05, -8.899345993995667e-05, -8.168816566467285e-05, -7.438287138938904e-05, -6.707757711410522e-05, -5.977228283882141e-05, -5.24669885635376e-05, -4.5161694288253784e-05, -3.785640001296997e-05, -3.055110573768616e-05, -2.3245811462402344e-05, -1.594051718711853e-05, -8.635222911834717e-06, -1.3299286365509033e-06, 5.97536563873291e-06, 1.3280659914016724e-05, 2.0585954189300537e-05, 2.789124846458435e-05, 3.5196542739868164e-05, 4.250183701515198e-05, 4.980713129043579e-05, 5.7112425565719604e-05, 6.441771984100342e-05, 7.172301411628723e-05, 7.902830839157104e-05, 8.633360266685486e-05, 9.363889694213867e-05, 0.00010094419121742249, 0.0001082494854927063, 0.00011555477976799011, 0.00012286007404327393, 0.00013016536831855774, 0.00013747066259384155, 0.00014477595686912537, 0.00015208125114440918, 0.000159386545419693, 0.0001666918396949768, 0.00017399713397026062, 0.00018130242824554443, 0.00018860772252082825, 0.00019591301679611206, 0.00020321831107139587, 0.0002105236053466797]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 42.0, 47.0, 69.0, 114.0, 118.0, 119.0, 118.0, 104.0, 64.0, 69.0, 26.0, 21.0, 9.0, 10.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6987323760986328e-05, -1.5810132026672363e-05, -1.4632940292358398e-05, -1.3455748558044434e-05, -1.2278556823730469e-05, -1.1101365089416504e-05, -9.924173355102539e-06, -8.746981620788574e-06, -7.569789886474609e-06, -6.3925981521606445e-06, -5.21540641784668e-06, -4.038214683532715e-06, -2.86102294921875e-06, -1.6838312149047852e-06, -5.066394805908203e-07, 6.705522537231445e-07, 1.8477439880371094e-06, 3.0249357223510742e-06, 4.202127456665039e-06, 5.379319190979004e-06, 6.556510925292969e-06, 7.733702659606934e-06, 8.910894393920898e-06, 1.0088086128234863e-05, 1.1265277862548828e-05, 1.2442469596862793e-05, 1.3619661331176758e-05, 1.4796853065490723e-05, 1.5974044799804688e-05, 1.7151236534118652e-05, 1.8328428268432617e-05, 1.9505620002746582e-05, 2.0682811737060547e-05, 2.1860003471374512e-05, 2.3037195205688477e-05, 2.421438694000244e-05, 2.5391578674316406e-05, 2.656877040863037e-05, 2.7745962142944336e-05, 2.89231538772583e-05, 3.0100345611572266e-05, 3.127753734588623e-05, 3.2454729080200195e-05, 3.363192081451416e-05, 3.4809112548828125e-05, 3.598630428314209e-05, 3.7163496017456055e-05, 3.834068775177002e-05, 3.9517879486083984e-05, 4.069507122039795e-05, 4.1872262954711914e-05, 4.304945468902588e-05, 4.4226646423339844e-05, 4.540383815765381e-05, 4.6581029891967773e-05, 4.775822162628174e-05, 4.89354133605957e-05, 5.011260509490967e-05, 5.128979682922363e-05, 5.24669885635376e-05, 5.364418029785156e-05, 5.482137203216553e-05, 5.599856376647949e-05, 5.717575550079346e-05, 5.835294723510742e-05]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 3.0, 9.0, 11.0, 12.0, 27.0, 39.0, 45.0, 77.0, 105.0, 192.0, 223.0, 370.0, 535.0, 783.0, 1019.0, 1692.0, 2458.0, 3518.0, 5311.0, 7940.0, 12207.0, 18529.0, 28902.0, 47180.0, 80569.0, 159666.0, 338903.0, 142382.0, 73267.0, 43738.0, 27188.0, 17155.0, 11566.0, 7538.0, 4841.0, 3266.0, 2362.0, 1568.0, 1075.0, 740.0, 495.0, 344.0, 219.0, 165.0, 108.0, 67.0, 49.0, 41.0, 13.0, 14.0, 16.0, 9.0, 5.0, 4.0, 0.0, 1.0, 3.0], "bins": [-3.975629806518555e-05, -3.856699913740158e-05, -3.7377700209617615e-05, -3.618840128183365e-05, -3.499910235404968e-05, -3.3809803426265717e-05, -3.262050449848175e-05, -3.1431205570697784e-05, -3.024190664291382e-05, -2.9052607715129852e-05, -2.7863308787345886e-05, -2.667400985956192e-05, -2.5484710931777954e-05, -2.4295412003993988e-05, -2.3106113076210022e-05, -2.1916814148426056e-05, -2.072751522064209e-05, -1.9538216292858124e-05, -1.8348917365074158e-05, -1.715961843729019e-05, -1.5970319509506226e-05, -1.478102058172226e-05, -1.3591721653938293e-05, -1.2402422726154327e-05, -1.1213123798370361e-05, -1.0023824870586395e-05, -8.83452594280243e-06, -7.645227015018463e-06, -6.455928087234497e-06, -5.266629159450531e-06, -4.077330231666565e-06, -2.888031303882599e-06, -1.6987323760986328e-06, -5.094334483146667e-07, 6.798654794692993e-07, 1.8691644072532654e-06, 3.0584633350372314e-06, 4.2477622628211975e-06, 5.4370611906051636e-06, 6.62636011838913e-06, 7.815659046173096e-06, 9.004957973957062e-06, 1.0194256901741028e-05, 1.1383555829524994e-05, 1.257285475730896e-05, 1.3762153685092926e-05, 1.4951452612876892e-05, 1.6140751540660858e-05, 1.7330050468444824e-05, 1.851934939622879e-05, 1.9708648324012756e-05, 2.0897947251796722e-05, 2.208724617958069e-05, 2.3276545107364655e-05, 2.446584403514862e-05, 2.5655142962932587e-05, 2.6844441890716553e-05, 2.803374081850052e-05, 2.9223039746284485e-05, 3.041233867406845e-05, 3.160163760185242e-05, 3.279093652963638e-05, 3.398023545742035e-05, 3.5169534385204315e-05, 3.635883331298828e-05]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 11.0, 10.0, 12.0, 14.0, 11.0, 13.0, 17.0, 26.0, 28.0, 29.0, 34.0, 19.0, 31.0, 39.0, 34.0, 31.0, 30.0, 33.0, 45.0, 44.0, 41.0, 29.0, 35.0, 42.0, 42.0, 28.0, 20.0, 23.0, 26.0, 23.0, 22.0, 22.0, 26.0, 16.0, 15.0, 8.0, 10.0, 13.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.927946090698242e-05, -3.8110651075839996e-05, -3.694184124469757e-05, -3.5773031413555145e-05, -3.460422158241272e-05, -3.3435411751270294e-05, -3.226660192012787e-05, -3.109779208898544e-05, -2.9928982257843018e-05, -2.8760172426700592e-05, -2.7591362595558167e-05, -2.642255276441574e-05, -2.5253742933273315e-05, -2.408493310213089e-05, -2.2916123270988464e-05, -2.174731343984604e-05, -2.0578503608703613e-05, -1.9409693777561188e-05, -1.8240883946418762e-05, -1.7072074115276337e-05, -1.590326428413391e-05, -1.4734454452991486e-05, -1.356564462184906e-05, -1.2396834790706635e-05, -1.1228024959564209e-05, -1.0059215128421783e-05, -8.890405297279358e-06, -7.721595466136932e-06, -6.552785634994507e-06, -5.383975803852081e-06, -4.215165972709656e-06, -3.0463561415672302e-06, -1.8775463104248047e-06, -7.087364792823792e-07, 4.600733518600464e-07, 1.628883183002472e-06, 2.7976930141448975e-06, 3.966502845287323e-06, 5.1353126764297485e-06, 6.304122507572174e-06, 7.4729323387146e-06, 8.641742169857025e-06, 9.81055200099945e-06, 1.0979361832141876e-05, 1.2148171663284302e-05, 1.3316981494426727e-05, 1.4485791325569153e-05, 1.565460115671158e-05, 1.6823410987854004e-05, 1.799222081899643e-05, 1.9161030650138855e-05, 2.032984048128128e-05, 2.1498650312423706e-05, 2.266746014356613e-05, 2.3836269974708557e-05, 2.5005079805850983e-05, 2.6173889636993408e-05, 2.7342699468135834e-05, 2.851150929927826e-05, 2.9680319130420685e-05, 3.084912896156311e-05, 3.2017938792705536e-05, 3.318674862384796e-05, 3.435555845499039e-05, 3.552436828613281e-05]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 5.0, 8.0, 5.0, 18.0, 12.0, 17.0, 31.0, 24.0, 99.0, 156.0, 151.0, 380.0, 737.0, 839.0, 2235.0, 2950.0, 9923.0, 29051.0, 53705.0, 310695.0, 482647.0, 87846.0, 43181.0, 13785.0, 4028.0, 3046.0, 973.0, 922.0, 469.0, 185.0, 164.0, 99.0, 44.0, 49.0, 19.0, 8.0, 9.0, 12.0, 2.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.066394805908203e-06, -4.909001290798187e-06, -4.751607775688171e-06, -4.5942142605781555e-06, -4.43682074546814e-06, -4.279427230358124e-06, -4.122033715248108e-06, -3.964640200138092e-06, -3.807246685028076e-06, -3.6498531699180603e-06, -3.4924596548080444e-06, -3.3350661396980286e-06, -3.1776726245880127e-06, -3.020279109477997e-06, -2.862885594367981e-06, -2.705492079257965e-06, -2.5480985641479492e-06, -2.3907050490379333e-06, -2.2333115339279175e-06, -2.0759180188179016e-06, -1.9185245037078857e-06, -1.7611309885978699e-06, -1.603737473487854e-06, -1.4463439583778381e-06, -1.2889504432678223e-06, -1.1315569281578064e-06, -9.741634130477905e-07, -8.167698979377747e-07, -6.593763828277588e-07, -5.019828677177429e-07, -3.4458935260772705e-07, -1.8719583749771118e-07, -2.9802322387695312e-08, 1.2759119272232056e-07, 2.849847078323364e-07, 4.423782229423523e-07, 5.997717380523682e-07, 7.57165253162384e-07, 9.145587682723999e-07, 1.0719522833824158e-06, 1.2293457984924316e-06, 1.3867393136024475e-06, 1.5441328287124634e-06, 1.7015263438224792e-06, 1.8589198589324951e-06, 2.016313374042511e-06, 2.173706889152527e-06, 2.3311004042625427e-06, 2.4884939193725586e-06, 2.6458874344825745e-06, 2.8032809495925903e-06, 2.960674464702606e-06, 3.118067979812622e-06, 3.275461494922638e-06, 3.432855010032654e-06, 3.5902485251426697e-06, 3.7476420402526855e-06, 3.905035555362701e-06, 4.062429070472717e-06, 4.219822585582733e-06, 4.377216100692749e-06, 4.534609615802765e-06, 4.692003130912781e-06, 4.849396646022797e-06, 5.0067901611328125e-06]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 9.0, 0.0, 19.0, 0.0, 13.0, 17.0, 0.0, 23.0, 29.0, 0.0, 37.0, 0.0, 53.0, 52.0, 0.0, 69.0, 59.0, 0.0, 78.0, 0.0, 89.0, 83.0, 0.0, 71.0, 66.0, 0.0, 55.0, 0.0, 40.0, 33.0, 0.0, 36.0, 30.0, 0.0, 15.0, 0.0, 10.0, 4.0, 0.0, 4.0, 7.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1548399925231934e-06, -1.1175870895385742e-06, -1.080334186553955e-06, -1.043081283569336e-06, -1.0058283805847168e-06, -9.685754776000977e-07, -9.313225746154785e-07, -8.940696716308594e-07, -8.568167686462402e-07, -8.195638656616211e-07, -7.82310962677002e-07, -7.450580596923828e-07, -7.078051567077637e-07, -6.705522537231445e-07, -6.332993507385254e-07, -5.960464477539062e-07, -5.587935447692871e-07, -5.21540641784668e-07, -4.842877388000488e-07, -4.470348358154297e-07, -4.0978193283081055e-07, -3.725290298461914e-07, -3.3527612686157227e-07, -2.980232238769531e-07, -2.60770320892334e-07, -2.2351741790771484e-07, -1.862645149230957e-07, -1.4901161193847656e-07, -1.1175870895385742e-07, -7.450580596923828e-08, -3.725290298461914e-08, 0.0, 3.725290298461914e-08, 7.450580596923828e-08, 1.1175870895385742e-07, 1.4901161193847656e-07, 1.862645149230957e-07, 2.2351741790771484e-07, 2.60770320892334e-07, 2.980232238769531e-07, 3.3527612686157227e-07, 3.725290298461914e-07, 4.0978193283081055e-07, 4.470348358154297e-07, 4.842877388000488e-07, 5.21540641784668e-07, 5.587935447692871e-07, 5.960464477539062e-07, 6.332993507385254e-07, 6.705522537231445e-07, 7.078051567077637e-07, 7.450580596923828e-07, 7.82310962677002e-07, 8.195638656616211e-07, 8.568167686462402e-07, 8.940696716308594e-07, 9.313225746154785e-07, 9.685754776000977e-07, 1.0058283805847168e-06, 1.043081283569336e-06, 1.080334186553955e-06, 1.1175870895385742e-06, 1.1548399925231934e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 11.0, 6.0, 13.0, 22.0, 14.0, 58.0, 34.0, 112.0, 93.0, 99.0, 352.0, 255.0, 843.0, 677.0, 2302.0, 1933.0, 6937.0, 6205.0, 9418.0, 40599.0, 44632.0, 265576.0, 289346.0, 264028.0, 44751.0, 25630.0, 24647.0, 6077.0, 6948.0, 1938.0, 2377.0, 682.0, 870.0, 254.0, 185.0, 253.0, 85.0, 121.0, 40.0, 45.0, 16.0, 23.0, 16.0, 9.0, 6.0, 3.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3581087589263916e-06, -2.2724270820617676e-06, -2.1867454051971436e-06, -2.1010637283325195e-06, -2.0153820514678955e-06, -1.9297003746032715e-06, -1.8440186977386475e-06, -1.7583370208740234e-06, -1.6726553440093994e-06, -1.5869736671447754e-06, -1.5012919902801514e-06, -1.4156103134155273e-06, -1.3299286365509033e-06, -1.2442469596862793e-06, -1.1585652828216553e-06, -1.0728836059570312e-06, -9.872019290924072e-07, -9.015202522277832e-07, -8.158385753631592e-07, -7.301568984985352e-07, -6.444752216339111e-07, -5.587935447692871e-07, -4.731118679046631e-07, -3.8743019104003906e-07, -3.0174851417541504e-07, -2.1606683731079102e-07, -1.30385160446167e-07, -4.470348358154297e-08, 4.0978193283081055e-08, 1.2665987014770508e-07, 2.123415470123291e-07, 2.980232238769531e-07, 3.8370490074157715e-07, 4.6938657760620117e-07, 5.550682544708252e-07, 6.407499313354492e-07, 7.264316082000732e-07, 8.121132850646973e-07, 8.977949619293213e-07, 9.834766387939453e-07, 1.0691583156585693e-06, 1.1548399925231934e-06, 1.2405216693878174e-06, 1.3262033462524414e-06, 1.4118850231170654e-06, 1.4975666999816895e-06, 1.5832483768463135e-06, 1.6689300537109375e-06, 1.7546117305755615e-06, 1.8402934074401855e-06, 1.9259750843048096e-06, 2.0116567611694336e-06, 2.0973384380340576e-06, 2.1830201148986816e-06, 2.2687017917633057e-06, 2.3543834686279297e-06, 2.4400651454925537e-06, 2.5257468223571777e-06, 2.6114284992218018e-06, 2.6971101760864258e-06, 2.78279185295105e-06, 2.868473529815674e-06, 2.954155206680298e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 18.0, 8.0, 7.0, 20.0, 14.0, 19.0, 42.0, 24.0, 43.0, 84.0, 34.0, 51.0, 128.0, 65.0, 54.0, 38.0, 103.0, 28.0, 31.0, 50.0, 16.0, 22.0, 35.0, 12.0, 6.0, 15.0, 3.0, 1.0, 9.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1867454051971436e-06, -2.1085143089294434e-06, -2.030283212661743e-06, -1.952052116394043e-06, -1.8738210201263428e-06, -1.7955899238586426e-06, -1.7173588275909424e-06, -1.6391277313232422e-06, -1.560896635055542e-06, -1.4826655387878418e-06, -1.4044344425201416e-06, -1.3262033462524414e-06, -1.2479722499847412e-06, -1.169741153717041e-06, -1.0915100574493408e-06, -1.0132789611816406e-06, -9.350478649139404e-07, -8.568167686462402e-07, -7.7858567237854e-07, -7.003545761108398e-07, -6.221234798431396e-07, -5.438923835754395e-07, -4.6566128730773926e-07, -3.8743019104003906e-07, -3.0919909477233887e-07, -2.3096799850463867e-07, -1.5273690223693848e-07, -7.450580596923828e-08, 3.725290298461914e-09, 8.195638656616211e-08, 1.601874828338623e-07, 2.384185791015625e-07, 3.166496753692627e-07, 3.948807716369629e-07, 4.731118679046631e-07, 5.513429641723633e-07, 6.295740604400635e-07, 7.078051567077637e-07, 7.860362529754639e-07, 8.642673492431641e-07, 9.424984455108643e-07, 1.0207295417785645e-06, 1.0989606380462646e-06, 1.1771917343139648e-06, 1.255422830581665e-06, 1.3336539268493652e-06, 1.4118850231170654e-06, 1.4901161193847656e-06, 1.5683472156524658e-06, 1.646578311920166e-06, 1.7248094081878662e-06, 1.8030405044555664e-06, 1.8812716007232666e-06, 1.959502696990967e-06, 2.037733793258667e-06, 2.115964889526367e-06, 2.1941959857940674e-06, 2.2724270820617676e-06, 2.3506581783294678e-06, 2.428889274597168e-06, 2.507120370864868e-06, 2.5853514671325684e-06, 2.6635825634002686e-06, 2.7418136596679688e-06]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 8.0, 20.0, 38.0, 51.0, 101.0, 271.0, 190.0, 103.0, 67.0, 37.0, 35.0, 19.0, 18.0, 14.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019151484593749046, -0.00018231006106361747, -0.00017310527618974447, -0.0001639005058677867, -0.0001546957209939137, -0.00014549093612004071, -0.00013628616579808295, -0.00012708138092420995, -0.00011787659605033696, -0.00010867181117646396, -9.946703357854858e-05, -9.02622559806332e-05, -8.10574711067602e-05, -7.185268623288721e-05, -6.264790863497183e-05, -5.3443131037056446e-05, -4.423834616318345e-05, -3.503356492728926e-05, -2.5828783691395074e-05, -1.6624002455500886e-05, -7.4192212196066976e-06, 1.7855600162874907e-06, 1.0990341252181679e-05, 2.019511885009706e-05, 2.9399903723970056e-05, 3.8604684959864244e-05, 4.780946619575843e-05, 5.701424743165262e-05, 6.621902866754681e-05, 7.54238135414198e-05, 8.462859113933519e-05, 9.383336873725057e-05, 0.00010303818271495402, 0.00011224296758882701, 0.0001214477451867424, 0.00013065252278465778, 0.00013985730765853077, 0.00014906209253240377, 0.00015826686285436153, 0.00016747164772823453, 0.00017667643260210752, 0.00018588121747598052, 0.00019508600234985352, 0.00020429077267181128, 0.00021349555754568428, 0.00022270034241955727, 0.00023190511274151504, 0.00024110989761538804, 0.00025031468248926103, 0.000259519467363134, 0.000268724252237007, 0.00027792903711088, 0.00028713379288092256, 0.00029633857775479555, 0.00030554336262866855, 0.00031474814750254154, 0.00032395293237641454, 0.00033315771725028753, 0.00034236250212416053, 0.0003515672869980335, 0.0003607720718719065, 0.00036997682764194906, 0.00037918161251582205, 0.00038838639738969505, 0.00039759118226356804]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 9.0, 10.0, 16.0, 8.0, 18.0, 12.0, 11.0, 19.0, 30.0, 24.0, 39.0, 29.0, 33.0, 41.0, 43.0, 49.0, 43.0, 47.0, 47.0, 45.0, 27.0, 37.0, 33.0, 45.0, 34.0, 34.0, 24.0, 22.0, 19.0, 26.0, 23.0, 16.0, 13.0, 12.0, 6.0, 14.0, 6.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00011211633682250977, -0.00010863319039344788, -0.00010515004396438599, -0.0001016668975353241, -9.818375110626221e-05, -9.470060467720032e-05, -9.121745824813843e-05, -8.773431181907654e-05, -8.425116539001465e-05, -8.076801896095276e-05, -7.728487253189087e-05, -7.380172610282898e-05, -7.031857967376709e-05, -6.68354332447052e-05, -6.335228681564331e-05, -5.986914038658142e-05, -5.638599395751953e-05, -5.290284752845764e-05, -4.941970109939575e-05, -4.593655467033386e-05, -4.245340824127197e-05, -3.897026181221008e-05, -3.548711538314819e-05, -3.2003968954086304e-05, -2.8520822525024414e-05, -2.5037676095962524e-05, -2.1554529666900635e-05, -1.8071383237838745e-05, -1.4588236808776855e-05, -1.1105090379714966e-05, -7.621943950653076e-06, -4.1387975215911865e-06, -6.556510925292969e-07, 2.8274953365325928e-06, 6.310641765594482e-06, 9.793788194656372e-06, 1.3276934623718262e-05, 1.676008105278015e-05, 2.024322748184204e-05, 2.372637391090393e-05, 2.720952033996582e-05, 3.069266676902771e-05, 3.41758131980896e-05, 3.765895962715149e-05, 4.114210605621338e-05, 4.462525248527527e-05, 4.810839891433716e-05, 5.159154534339905e-05, 5.507469177246094e-05, 5.855783820152283e-05, 6.204098463058472e-05, 6.55241310596466e-05, 6.90072774887085e-05, 7.249042391777039e-05, 7.597357034683228e-05, 7.945671677589417e-05, 8.293986320495605e-05, 8.642300963401794e-05, 8.990615606307983e-05, 9.338930249214172e-05, 9.687244892120361e-05, 0.0001003555953502655, 0.00010383874177932739, 0.00010732188820838928, 0.00011080503463745117]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 10.0, 24.0, 35.0, 66.0, 93.0, 152.0, 239.0, 405.0, 735.0, 1364.0, 2659.0, 5580.0, 14439.0, 57867.0, 3770817.0, 296705.0, 25452.0, 9025.0, 3820.0, 1927.0, 1064.0, 607.0, 409.0, 240.0, 167.0, 105.0, 72.0, 37.0, 48.0, 34.0, 13.0, 12.0, 7.0, 7.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.432699203491211e-05, -7.090996950864792e-05, -6.749294698238373e-05, -6.407592445611954e-05, -6.065890192985535e-05, -5.7241879403591156e-05, -5.3824856877326965e-05, -5.0407834351062775e-05, -4.6990811824798584e-05, -4.357378929853439e-05, -4.01567667722702e-05, -3.673974424600601e-05, -3.332272171974182e-05, -2.990569919347763e-05, -2.648867666721344e-05, -2.307165414094925e-05, -1.965463161468506e-05, -1.6237609088420868e-05, -1.2820586562156677e-05, -9.403564035892487e-06, -5.986541509628296e-06, -2.5695189833641052e-06, 8.475035429000854e-07, 4.264526069164276e-06, 7.681548595428467e-06, 1.1098571121692657e-05, 1.4515593647956848e-05, 1.793261617422104e-05, 2.134963870048523e-05, 2.476666122674942e-05, 2.818368375301361e-05, 3.16007062792778e-05, 3.501772880554199e-05, 3.843475133180618e-05, 4.1851773858070374e-05, 4.5268796384334564e-05, 4.8685818910598755e-05, 5.2102841436862946e-05, 5.5519863963127136e-05, 5.893688648939133e-05, 6.235390901565552e-05, 6.577093154191971e-05, 6.91879540681839e-05, 7.260497659444809e-05, 7.602199912071228e-05, 7.943902164697647e-05, 8.285604417324066e-05, 8.627306669950485e-05, 8.969008922576904e-05, 9.310711175203323e-05, 9.652413427829742e-05, 9.994115680456161e-05, 0.0001033581793308258, 0.00010677520185709, 0.00011019222438335419, 0.00011360924690961838, 0.00011702626943588257, 0.00012044329196214676, 0.00012386031448841095, 0.00012727733701467514, 0.00013069435954093933, 0.00013411138206720352, 0.0001375284045934677, 0.0001409454271197319, 0.0001443624496459961]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 5.0, 4.0, 9.0, 12.0, 12.0, 20.0, 19.0, 25.0, 34.0, 51.0, 67.0, 83.0, 85.0, 86.0, 101.0, 59.0, 63.0, 61.0, 45.0, 43.0, 27.0, 23.0, 19.0, 9.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.6271136701107025e-05, -1.549534499645233e-05, -1.4719553291797638e-05, -1.3943761587142944e-05, -1.316796988248825e-05, -1.2392178177833557e-05, -1.1616386473178864e-05, -1.084059476852417e-05, -1.0064803063869476e-05, -9.289011359214783e-06, -8.513219654560089e-06, -7.737427949905396e-06, -6.961636245250702e-06, -6.185844540596008e-06, -5.410052835941315e-06, -4.634261131286621e-06, -3.8584694266319275e-06, -3.082677721977234e-06, -2.3068860173225403e-06, -1.5310943126678467e-06, -7.553026080131531e-07, 2.0489096641540527e-08, 7.962808012962341e-07, 1.5720725059509277e-06, 2.3478642106056213e-06, 3.123655915260315e-06, 3.8994476199150085e-06, 4.675239324569702e-06, 5.451031029224396e-06, 6.226822733879089e-06, 7.002614438533783e-06, 7.778406143188477e-06, 8.55419784784317e-06, 9.329989552497864e-06, 1.0105781257152557e-05, 1.0881572961807251e-05, 1.1657364666461945e-05, 1.2433156371116638e-05, 1.3208948075771332e-05, 1.3984739780426025e-05, 1.4760531485080719e-05, 1.5536323189735413e-05, 1.6312114894390106e-05, 1.70879065990448e-05, 1.7863698303699493e-05, 1.8639490008354187e-05, 1.941528171300888e-05, 2.0191073417663574e-05, 2.0966865122318268e-05, 2.174265682697296e-05, 2.2518448531627655e-05, 2.329424023628235e-05, 2.4070031940937042e-05, 2.4845823645591736e-05, 2.562161535024643e-05, 2.6397407054901123e-05, 2.7173198759555817e-05, 2.794899046421051e-05, 2.8724782168865204e-05, 2.9500573873519897e-05, 3.027636557817459e-05, 3.1052157282829285e-05, 3.182794898748398e-05, 3.260374069213867e-05]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 8.0, 9.0, 6.0, 13.0, 18.0, 28.0, 30.0, 51.0, 67.0, 121.0, 160.0, 268.0, 360.0, 562.0, 843.0, 1275.0, 2056.0, 3579.0, 5692.0, 9696.0, 17383.0, 37482.0, 88212.0, 482207.0, 3224373.0, 198310.0, 59307.0, 27020.0, 14844.0, 7815.0, 4577.0, 2929.0, 1730.0, 1055.0, 739.0, 457.0, 290.0, 218.0, 153.0, 111.0, 71.0, 48.0, 38.0, 26.0, 13.0, 15.0, 8.0, 2.0, 2.0, 0.0, 3.0, 7.0, 1.0, 1.0, 1.0], "bins": [-4.029273986816406e-05, -3.9082951843738556e-05, -3.787316381931305e-05, -3.666337579488754e-05, -3.5453587770462036e-05, -3.424379974603653e-05, -3.303401172161102e-05, -3.1824223697185516e-05, -3.061443567276001e-05, -2.9404647648334503e-05, -2.8194859623908997e-05, -2.698507159948349e-05, -2.5775283575057983e-05, -2.4565495550632477e-05, -2.335570752620697e-05, -2.2145919501781464e-05, -2.0936131477355957e-05, -1.972634345293045e-05, -1.8516555428504944e-05, -1.7306767404079437e-05, -1.609697937965393e-05, -1.4887191355228424e-05, -1.3677403330802917e-05, -1.2467615306377411e-05, -1.1257827281951904e-05, -1.0048039257526398e-05, -8.838251233100891e-06, -7.6284632086753845e-06, -6.418675184249878e-06, -5.208887159824371e-06, -3.999099135398865e-06, -2.789311110973358e-06, -1.5795230865478516e-06, -3.6973506212234497e-07, 8.400529623031616e-07, 2.0498409867286682e-06, 3.259629011154175e-06, 4.469417035579681e-06, 5.679205060005188e-06, 6.888993084430695e-06, 8.098781108856201e-06, 9.308569133281708e-06, 1.0518357157707214e-05, 1.1728145182132721e-05, 1.2937933206558228e-05, 1.4147721230983734e-05, 1.535750925540924e-05, 1.6567297279834747e-05, 1.7777085304260254e-05, 1.898687332868576e-05, 2.0196661353111267e-05, 2.1406449377536774e-05, 2.261623740196228e-05, 2.3826025426387787e-05, 2.5035813450813293e-05, 2.62456014752388e-05, 2.7455389499664307e-05, 2.8665177524089813e-05, 2.987496554851532e-05, 3.1084753572940826e-05, 3.229454159736633e-05, 3.350432962179184e-05, 3.4714117646217346e-05, 3.592390567064285e-05, 3.713369369506836e-05]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 12.0, 10.0, 5.0, 15.0, 14.0, 16.0, 16.0, 20.0, 35.0, 41.0, 72.0, 104.0, 255.0, 690.0, 1355.0, 729.0, 268.0, 104.0, 75.0, 36.0, 46.0, 18.0, 30.0, 15.0, 19.0, 12.0, 14.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.8683414459228516e-05, -3.7563033401966095e-05, -3.6442652344703674e-05, -3.5322271287441254e-05, -3.420189023017883e-05, -3.308150917291641e-05, -3.196112811565399e-05, -3.084074705839157e-05, -2.972036600112915e-05, -2.859998494386673e-05, -2.747960388660431e-05, -2.635922282934189e-05, -2.5238841772079468e-05, -2.4118460714817047e-05, -2.2998079657554626e-05, -2.1877698600292206e-05, -2.0757317543029785e-05, -1.9636936485767365e-05, -1.8516555428504944e-05, -1.7396174371242523e-05, -1.6275793313980103e-05, -1.5155412256717682e-05, -1.4035031199455261e-05, -1.291465014219284e-05, -1.179426908493042e-05, -1.0673888027668e-05, -9.553506970405579e-06, -8.433125913143158e-06, -7.312744855880737e-06, -6.192363798618317e-06, -5.071982741355896e-06, -3.951601684093475e-06, -2.8312206268310547e-06, -1.710839569568634e-06, -5.904585123062134e-07, 5.299225449562073e-07, 1.650303602218628e-06, 2.7706846594810486e-06, 3.891065716743469e-06, 5.01144677400589e-06, 6.1318278312683105e-06, 7.252208888530731e-06, 8.372589945793152e-06, 9.492971003055573e-06, 1.0613352060317993e-05, 1.1733733117580414e-05, 1.2854114174842834e-05, 1.3974495232105255e-05, 1.5094876289367676e-05, 1.6215257346630096e-05, 1.7335638403892517e-05, 1.8456019461154938e-05, 1.957640051841736e-05, 2.069678157567978e-05, 2.18171626329422e-05, 2.293754369020462e-05, 2.405792474746704e-05, 2.517830580472946e-05, 2.6298686861991882e-05, 2.7419067919254303e-05, 2.8539448976516724e-05, 2.9659830033779144e-05, 3.0780211091041565e-05, 3.1900592148303986e-05, 3.3020973205566406e-05]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 4.0, 14.0, 24.0, 27.0, 32.0, 46.0, 58.0, 77.0, 98.0, 115.0, 130.0, 104.0, 51.0, 45.0, 42.0, 28.0, 18.0, 13.0, 14.0, 10.0, 8.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001730033109197393, -0.00016766312182880938, -0.00016232294728979468, -0.00015698275819886476, -0.00015164258365985006, -0.00014630239456892014, -0.00014096222002990544, -0.0001356220309389755, -0.0001302818418480456, -0.00012494165275711566, -0.00011960147821810097, -0.00011426128912717104, -0.00010892111458815634, -0.00010358092549722642, -9.82407436822541e-05, -9.29005618672818e-05, -8.75603873282671e-05, -8.222020551329479e-05, -7.688002369832247e-05, -7.153983460739255e-05, -6.619966006837785e-05, -6.0859474615426734e-05, -5.5519289162475616e-05, -5.0179107347503304e-05, -4.483892553253099e-05, -3.949874371755868e-05, -3.415856190258637e-05, -2.8818376449635252e-05, -2.347819463466294e-05, -1.813801281969063e-05, -1.2797827366739511e-05, -7.4576455517672e-06, -2.117463736794889e-06, 3.222718987672124e-06, 8.562901712139137e-06, 1.3903085346100852e-05, 1.9243267161073163e-05, 2.4583448976045474e-05, 2.9923634428996593e-05, 3.5263816243968904e-05, 4.0603998058941215e-05, 4.5944179873913527e-05, 5.128436168888584e-05, 5.6624547141836956e-05, 6.196473259478807e-05, 6.730490713380277e-05, 7.26450962247327e-05, 7.798527803970501e-05, 8.332545985467732e-05, 8.866564166964963e-05, 9.400582348462194e-05, 9.934601257555187e-05, 0.00010468618711456656, 0.00011002637620549649, 0.0001153665580204688, 0.00012070673983544111, 0.0001260469143744558, 0.00013138710346538574, 0.00013672727800440043, 0.00014206746709533036, 0.00014740764163434505, 0.00015274783072527498, 0.0001580880198162049, 0.0001634281943552196, 0.00016876838344614953]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 15.0, 19.0, 14.0, 17.0, 24.0, 16.0, 30.0, 31.0, 22.0, 33.0, 30.0, 33.0, 40.0, 33.0, 43.0, 40.0, 42.0, 44.0, 48.0, 36.0, 19.0, 30.0, 40.0, 23.0, 25.0, 24.0, 22.0, 24.0, 22.0, 15.0, 7.0, 15.0, 17.0, 13.0, 3.0, 7.0, 9.0, 6.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.064508438110352e-05, -7.816869765520096e-05, -7.56923109292984e-05, -7.321592420339584e-05, -7.073953747749329e-05, -6.826315075159073e-05, -6.578676402568817e-05, -6.331037729978561e-05, -6.083399057388306e-05, -5.83576038479805e-05, -5.588121712207794e-05, -5.3404830396175385e-05, -5.092844367027283e-05, -4.845205694437027e-05, -4.597567021846771e-05, -4.3499283492565155e-05, -4.10228967666626e-05, -3.854651004076004e-05, -3.607012331485748e-05, -3.3593736588954926e-05, -3.111734986305237e-05, -2.864096313714981e-05, -2.6164576411247253e-05, -2.3688189685344696e-05, -2.121180295944214e-05, -1.873541623353958e-05, -1.6259029507637024e-05, -1.3782642781734467e-05, -1.130625605583191e-05, -8.829869329929352e-06, -6.3534826040267944e-06, -3.877095878124237e-06, -1.4007091522216797e-06, 1.0756775736808777e-06, 3.552064299583435e-06, 6.0284510254859924e-06, 8.50483775138855e-06, 1.0981224477291107e-05, 1.3457611203193665e-05, 1.5933997929096222e-05, 1.841038465499878e-05, 2.0886771380901337e-05, 2.3363158106803894e-05, 2.583954483270645e-05, 2.831593155860901e-05, 3.0792318284511566e-05, 3.3268705010414124e-05, 3.574509173631668e-05, 3.822147846221924e-05, 4.0697865188121796e-05, 4.317425191402435e-05, 4.565063863992691e-05, 4.812702536582947e-05, 5.0603412091732025e-05, 5.307979881763458e-05, 5.555618554353714e-05, 5.80325722694397e-05, 6.0508958995342255e-05, 6.298534572124481e-05, 6.546173244714737e-05, 6.793811917304993e-05, 7.041450589895248e-05, 7.289089262485504e-05, 7.53672793507576e-05, 7.784366607666016e-05]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 5.0, 6.0, 10.0, 19.0, 30.0, 38.0, 57.0, 73.0, 136.0, 195.0, 347.0, 589.0, 1126.0, 2118.0, 4252.0, 9041.0, 21108.0, 55739.0, 211421.0, 571238.0, 108945.0, 35076.0, 14102.0, 6326.0, 3073.0, 1526.0, 812.0, 421.0, 268.0, 172.0, 82.0, 60.0, 36.0, 28.0, 25.0, 11.0, 13.0, 9.0, 3.0, 2.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013256072998046875, -0.0001283213496208191, -0.00012408196926116943, -0.00011984258890151978, -0.00011560320854187012, -0.00011136382818222046, -0.0001071244478225708, -0.00010288506746292114, -9.864568710327148e-05, -9.440630674362183e-05, -9.016692638397217e-05, -8.592754602432251e-05, -8.168816566467285e-05, -7.74487853050232e-05, -7.320940494537354e-05, -6.897002458572388e-05, -6.473064422607422e-05, -6.049126386642456e-05, -5.62518835067749e-05, -5.2012503147125244e-05, -4.7773122787475586e-05, -4.353374242782593e-05, -3.929436206817627e-05, -3.505498170852661e-05, -3.081560134887695e-05, -2.6576220989227295e-05, -2.2336840629577637e-05, -1.809746026992798e-05, -1.385807991027832e-05, -9.618699550628662e-06, -5.379319190979004e-06, -1.1399388313293457e-06, 3.0994415283203125e-06, 7.338821887969971e-06, 1.1578202247619629e-05, 1.5817582607269287e-05, 2.0056962966918945e-05, 2.4296343326568604e-05, 2.8535723686218262e-05, 3.277510404586792e-05, 3.701448440551758e-05, 4.1253864765167236e-05, 4.5493245124816895e-05, 4.973262548446655e-05, 5.397200584411621e-05, 5.821138620376587e-05, 6.245076656341553e-05, 6.669014692306519e-05, 7.092952728271484e-05, 7.51689076423645e-05, 7.940828800201416e-05, 8.364766836166382e-05, 8.788704872131348e-05, 9.212642908096313e-05, 9.636580944061279e-05, 0.00010060518980026245, 0.00010484457015991211, 0.00010908395051956177, 0.00011332333087921143, 0.00011756271123886108, 0.00012180209159851074, 0.0001260414719581604, 0.00013028085231781006, 0.00013452023267745972, 0.00013875961303710938]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 5.0, 2.0, 8.0, 4.0, 8.0, 12.0, 11.0, 16.0, 22.0, 35.0, 32.0, 27.0, 52.0, 56.0, 93.0, 64.0, 85.0, 78.0, 70.0, 66.0, 57.0, 45.0, 27.0, 33.0, 16.0, 23.0, 16.0, 7.0, 4.0, 13.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4424324035644531e-05, -1.3736076653003693e-05, -1.3047829270362854e-05, -1.2359581887722015e-05, -1.1671334505081177e-05, -1.0983087122440338e-05, -1.02948397397995e-05, -9.606592357158661e-06, -8.918344974517822e-06, -8.230097591876984e-06, -7.541850209236145e-06, -6.853602826595306e-06, -6.165355443954468e-06, -5.477108061313629e-06, -4.7888606786727905e-06, -4.100613296031952e-06, -3.4123659133911133e-06, -2.7241185307502747e-06, -2.035871148109436e-06, -1.3476237654685974e-06, -6.593763828277588e-07, 2.8870999813079834e-08, 7.171183824539185e-07, 1.405365765094757e-06, 2.0936131477355957e-06, 2.7818605303764343e-06, 3.470107913017273e-06, 4.1583552956581116e-06, 4.84660267829895e-06, 5.534850060939789e-06, 6.2230974435806274e-06, 6.911344826221466e-06, 7.599592208862305e-06, 8.287839591503143e-06, 8.976086974143982e-06, 9.66433435678482e-06, 1.035258173942566e-05, 1.1040829122066498e-05, 1.1729076504707336e-05, 1.2417323887348175e-05, 1.3105571269989014e-05, 1.3793818652629852e-05, 1.4482066035270691e-05, 1.517031341791153e-05, 1.5858560800552368e-05, 1.6546808183193207e-05, 1.7235055565834045e-05, 1.7923302948474884e-05, 1.8611550331115723e-05, 1.929979771375656e-05, 1.99880450963974e-05, 2.067629247903824e-05, 2.1364539861679077e-05, 2.2052787244319916e-05, 2.2741034626960754e-05, 2.3429282009601593e-05, 2.411752939224243e-05, 2.480577677488327e-05, 2.549402415752411e-05, 2.6182271540164948e-05, 2.6870518922805786e-05, 2.7558766305446625e-05, 2.8247013688087463e-05, 2.8935261070728302e-05, 2.962350845336914e-05]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 12.0, 16.0, 20.0, 45.0, 62.0, 93.0, 150.0, 239.0, 326.0, 533.0, 787.0, 1203.0, 1807.0, 2750.0, 4263.0, 6551.0, 10990.0, 16940.0, 27610.0, 46144.0, 82231.0, 171990.0, 359869.0, 136875.0, 70049.0, 40827.0, 24245.0, 15053.0, 9555.0, 6282.0, 3771.0, 2518.0, 1584.0, 1104.0, 692.0, 465.0, 320.0, 192.0, 148.0, 83.0, 58.0, 36.0, 17.0, 14.0, 14.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-05, -3.6354176700115204e-05, -3.5157427191734314e-05, -3.3960677683353424e-05, -3.2763928174972534e-05, -3.1567178666591644e-05, -3.0370429158210754e-05, -2.9173679649829865e-05, -2.7976930141448975e-05, -2.6780180633068085e-05, -2.5583431124687195e-05, -2.4386681616306305e-05, -2.3189932107925415e-05, -2.1993182599544525e-05, -2.0796433091163635e-05, -1.9599683582782745e-05, -1.8402934074401855e-05, -1.7206184566020966e-05, -1.6009435057640076e-05, -1.4812685549259186e-05, -1.3615936040878296e-05, -1.2419186532497406e-05, -1.1222437024116516e-05, -1.0025687515735626e-05, -8.828938007354736e-06, -7.632188498973846e-06, -6.4354389905929565e-06, -5.238689482212067e-06, -4.041939973831177e-06, -2.845190465450287e-06, -1.648440957069397e-06, -4.516914486885071e-07, 7.450580596923828e-07, 1.9418075680732727e-06, 3.1385570764541626e-06, 4.3353065848350525e-06, 5.532056093215942e-06, 6.728805601596832e-06, 7.925555109977722e-06, 9.122304618358612e-06, 1.0319054126739502e-05, 1.1515803635120392e-05, 1.2712553143501282e-05, 1.3909302651882172e-05, 1.5106052160263062e-05, 1.630280166864395e-05, 1.749955117702484e-05, 1.869630068540573e-05, 1.989305019378662e-05, 2.108979970216751e-05, 2.22865492105484e-05, 2.348329871892929e-05, 2.468004822731018e-05, 2.587679773569107e-05, 2.707354724407196e-05, 2.827029675245285e-05, 2.946704626083374e-05, 3.066379576921463e-05, 3.186054527759552e-05, 3.305729478597641e-05, 3.42540442943573e-05, 3.545079380273819e-05, 3.664754331111908e-05, 3.784429281949997e-05, 3.904104232788086e-05]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 8.0, 2.0, 11.0, 6.0, 15.0, 6.0, 20.0, 23.0, 20.0, 25.0, 21.0, 21.0, 24.0, 36.0, 40.0, 34.0, 42.0, 43.0, 37.0, 44.0, 51.0, 46.0, 43.0, 30.0, 41.0, 22.0, 35.0, 41.0, 25.0, 30.0, 29.0, 18.0, 25.0, 15.0, 11.0, 13.0, 10.0, 7.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.297494888305664e-05, -4.1783787310123444e-05, -4.0592625737190247e-05, -3.940146416425705e-05, -3.821030259132385e-05, -3.7019141018390656e-05, -3.582797944545746e-05, -3.463681787252426e-05, -3.3445656299591064e-05, -3.225449472665787e-05, -3.106333315372467e-05, -2.9872171580791473e-05, -2.8681010007858276e-05, -2.748984843492508e-05, -2.6298686861991882e-05, -2.5107525289058685e-05, -2.3916363716125488e-05, -2.272520214319229e-05, -2.1534040570259094e-05, -2.0342878997325897e-05, -1.91517174243927e-05, -1.7960555851459503e-05, -1.6769394278526306e-05, -1.557823270559311e-05, -1.4387071132659912e-05, -1.3195909559726715e-05, -1.2004747986793518e-05, -1.0813586413860321e-05, -9.622424840927124e-06, -8.431263267993927e-06, -7.24010169506073e-06, -6.048940122127533e-06, -4.857778549194336e-06, -3.666616976261139e-06, -2.475455403327942e-06, -1.2842938303947449e-06, -9.313225746154785e-08, 1.0980293154716492e-06, 2.289190888404846e-06, 3.4803524613380432e-06, 4.67151403427124e-06, 5.862675607204437e-06, 7.053837180137634e-06, 8.244998753070831e-06, 9.436160326004028e-06, 1.0627321898937225e-05, 1.1818483471870422e-05, 1.300964504480362e-05, 1.4200806617736816e-05, 1.5391968190670013e-05, 1.658312976360321e-05, 1.7774291336536407e-05, 1.8965452909469604e-05, 2.01566144824028e-05, 2.1347776055336e-05, 2.2538937628269196e-05, 2.3730099201202393e-05, 2.492126077413559e-05, 2.6112422347068787e-05, 2.7303583920001984e-05, 2.849474549293518e-05, 2.9685907065868378e-05, 3.0877068638801575e-05, 3.206823021173477e-05, 3.325939178466797e-05]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 9.0, 1.0, 12.0, 13.0, 36.0, 21.0, 61.0, 64.0, 129.0, 153.0, 305.0, 361.0, 764.0, 860.0, 2394.0, 2820.0, 7792.0, 10248.0, 36237.0, 61005.0, 302350.0, 442142.0, 94455.0, 52059.0, 14120.0, 10140.0, 3510.0, 2952.0, 1058.0, 1057.0, 381.0, 392.0, 190.0, 159.0, 65.0, 88.0, 34.0, 44.0, 17.0, 18.0, 10.0, 9.0, 9.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.827976226806641e-06, -4.678033292293549e-06, -4.5280903577804565e-06, -4.3781474232673645e-06, -4.2282044887542725e-06, -4.07826155424118e-06, -3.928318619728088e-06, -3.7783756852149963e-06, -3.6284327507019043e-06, -3.4784898161888123e-06, -3.3285468816757202e-06, -3.178603947162628e-06, -3.028661012649536e-06, -2.878718078136444e-06, -2.728775143623352e-06, -2.57883220911026e-06, -2.428889274597168e-06, -2.278946340084076e-06, -2.129003405570984e-06, -1.979060471057892e-06, -1.8291175365447998e-06, -1.6791746020317078e-06, -1.5292316675186157e-06, -1.3792887330055237e-06, -1.2293457984924316e-06, -1.0794028639793396e-06, -9.294599294662476e-07, -7.795169949531555e-07, -6.295740604400635e-07, -4.796311259269714e-07, -3.296881914138794e-07, -1.7974525690078735e-07, -2.9802322387695312e-08, 1.2014061212539673e-07, 2.7008354663848877e-07, 4.200264811515808e-07, 5.699694156646729e-07, 7.199123501777649e-07, 8.698552846908569e-07, 1.019798219203949e-06, 1.169741153717041e-06, 1.319684088230133e-06, 1.469627022743225e-06, 1.6195699572563171e-06, 1.7695128917694092e-06, 1.9194558262825012e-06, 2.0693987607955933e-06, 2.2193416953086853e-06, 2.3692846298217773e-06, 2.5192275643348694e-06, 2.6691704988479614e-06, 2.8191134333610535e-06, 2.9690563678741455e-06, 3.1189993023872375e-06, 3.2689422369003296e-06, 3.4188851714134216e-06, 3.5688281059265137e-06, 3.7187710404396057e-06, 3.868713974952698e-06, 4.01865690946579e-06, 4.168599843978882e-06, 4.318542778491974e-06, 4.468485713005066e-06, 4.618428647518158e-06, 4.76837158203125e-06]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 10.0, 6.0, 8.0, 13.0, 0.0, 10.0, 15.0, 15.0, 22.0, 0.0, 29.0, 41.0, 44.0, 54.0, 0.0, 51.0, 67.0, 63.0, 63.0, 84.0, 0.0, 55.0, 51.0, 59.0, 61.0, 0.0, 29.0, 32.0, 33.0, 25.0, 0.0, 11.0, 18.0, 6.0, 10.0, 7.0, 0.0, 3.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6801059246063232e-06, -1.6316771507263184e-06, -1.5832483768463135e-06, -1.5348196029663086e-06, -1.4863908290863037e-06, -1.4379620552062988e-06, -1.389533281326294e-06, -1.341104507446289e-06, -1.2926757335662842e-06, -1.2442469596862793e-06, -1.1958181858062744e-06, -1.1473894119262695e-06, -1.0989606380462646e-06, -1.0505318641662598e-06, -1.0021030902862549e-06, -9.5367431640625e-07, -9.052455425262451e-07, -8.568167686462402e-07, -8.083879947662354e-07, -7.599592208862305e-07, -7.115304470062256e-07, -6.631016731262207e-07, -6.146728992462158e-07, -5.662441253662109e-07, -5.178153514862061e-07, -4.6938657760620117e-07, -4.209578037261963e-07, -3.725290298461914e-07, -3.241002559661865e-07, -2.7567148208618164e-07, -2.2724270820617676e-07, -1.7881393432617188e-07, -1.30385160446167e-07, -8.195638656616211e-08, -3.3527612686157227e-08, 1.4901161193847656e-08, 6.332993507385254e-08, 1.1175870895385742e-07, 1.601874828338623e-07, 2.086162567138672e-07, 2.5704503059387207e-07, 3.0547380447387695e-07, 3.5390257835388184e-07, 4.023313522338867e-07, 4.507601261138916e-07, 4.991888999938965e-07, 5.476176738739014e-07, 5.960464477539062e-07, 6.444752216339111e-07, 6.92903995513916e-07, 7.413327693939209e-07, 7.897615432739258e-07, 8.381903171539307e-07, 8.866190910339355e-07, 9.350478649139404e-07, 9.834766387939453e-07, 1.0319054126739502e-06, 1.080334186553955e-06, 1.12876296043396e-06, 1.1771917343139648e-06, 1.2256205081939697e-06, 1.2740492820739746e-06, 1.3224780559539795e-06, 1.3709068298339844e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 2.0, 16.0, 12.0, 37.0, 17.0, 24.0, 87.0, 59.0, 84.0, 196.0, 158.0, 223.0, 255.0, 799.0, 666.0, 898.0, 2707.0, 2266.0, 3102.0, 10851.0, 9325.0, 14080.0, 21334.0, 87367.0, 92929.0, 162020.0, 391323.0, 92647.0, 54441.0, 33594.0, 35183.0, 9192.0, 6526.0, 7649.0, 2137.0, 1706.0, 2001.0, 640.0, 447.0, 345.0, 473.0, 179.0, 116.0, 182.0, 57.0, 39.0, 73.0, 21.0, 21.0, 9.0, 21.0, 9.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-2.562999725341797e-06, -2.485699951648712e-06, -2.4084001779556274e-06, -2.3311004042625427e-06, -2.253800630569458e-06, -2.1765008568763733e-06, -2.0992010831832886e-06, -2.021901309490204e-06, -1.944601535797119e-06, -1.8673017621040344e-06, -1.7900019884109497e-06, -1.712702214717865e-06, -1.6354024410247803e-06, -1.5581026673316956e-06, -1.4808028936386108e-06, -1.4035031199455261e-06, -1.3262033462524414e-06, -1.2489035725593567e-06, -1.171603798866272e-06, -1.0943040251731873e-06, -1.0170042514801025e-06, -9.397044777870178e-07, -8.624047040939331e-07, -7.851049304008484e-07, -7.078051567077637e-07, -6.30505383014679e-07, -5.532056093215942e-07, -4.759058356285095e-07, -3.986060619354248e-07, -3.213062882423401e-07, -2.4400651454925537e-07, -1.6670674085617065e-07, -8.940696716308594e-08, -1.210719347000122e-08, 6.51925802230835e-08, 1.424923539161682e-07, 2.1979212760925293e-07, 2.9709190130233765e-07, 3.7439167499542236e-07, 4.516914486885071e-07, 5.289912223815918e-07, 6.062909960746765e-07, 6.835907697677612e-07, 7.60890543460846e-07, 8.381903171539307e-07, 9.154900908470154e-07, 9.927898645401e-07, 1.0700896382331848e-06, 1.1473894119262695e-06, 1.2246891856193542e-06, 1.301988959312439e-06, 1.3792887330055237e-06, 1.4565885066986084e-06, 1.5338882803916931e-06, 1.6111880540847778e-06, 1.6884878277778625e-06, 1.7657876014709473e-06, 1.843087375164032e-06, 1.9203871488571167e-06, 1.9976869225502014e-06, 2.074986696243286e-06, 2.152286469936371e-06, 2.2295862436294556e-06, 2.3068860173225403e-06, 2.384185791015625e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 5.0, 16.0, 9.0, 9.0, 14.0, 31.0, 18.0, 22.0, 24.0, 55.0, 27.0, 37.0, 40.0, 42.0, 91.0, 45.0, 43.0, 34.0, 86.0, 31.0, 32.0, 26.0, 45.0, 36.0, 24.0, 24.0, 32.0, 11.0, 11.0, 10.0, 8.0, 16.0, 4.0, 5.0, 3.0, 7.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.682209014892578e-06, -2.6086345314979553e-06, -2.5350600481033325e-06, -2.4614855647087097e-06, -2.387911081314087e-06, -2.314336597919464e-06, -2.2407621145248413e-06, -2.1671876311302185e-06, -2.0936131477355957e-06, -2.020038664340973e-06, -1.94646418094635e-06, -1.8728896975517273e-06, -1.7993152141571045e-06, -1.7257407307624817e-06, -1.6521662473678589e-06, -1.578591763973236e-06, -1.5050172805786133e-06, -1.4314427971839905e-06, -1.3578683137893677e-06, -1.2842938303947449e-06, -1.210719347000122e-06, -1.1371448636054993e-06, -1.0635703802108765e-06, -9.899958968162537e-07, -9.164214134216309e-07, -8.428469300270081e-07, -7.692724466323853e-07, -6.956979632377625e-07, -6.221234798431396e-07, -5.485489964485168e-07, -4.7497451305389404e-07, -4.0140002965927124e-07, -3.2782554626464844e-07, -2.5425106287002563e-07, -1.8067657947540283e-07, -1.0710209608078003e-07, -3.3527612686157227e-08, 4.0046870708465576e-08, 1.1362135410308838e-07, 1.8719583749771118e-07, 2.60770320892334e-07, 3.343448042869568e-07, 4.079192876815796e-07, 4.814937710762024e-07, 5.550682544708252e-07, 6.28642737865448e-07, 7.022172212600708e-07, 7.757917046546936e-07, 8.493661880493164e-07, 9.229406714439392e-07, 9.96515154838562e-07, 1.0700896382331848e-06, 1.1436641216278076e-06, 1.2172386050224304e-06, 1.2908130884170532e-06, 1.364387571811676e-06, 1.4379620552062988e-06, 1.5115365386009216e-06, 1.5851110219955444e-06, 1.6586855053901672e-06, 1.73225998878479e-06, 1.8058344721794128e-06, 1.8794089555740356e-06, 1.9529834389686584e-06, 2.0265579223632812e-06]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 5.0, 16.0, 17.0, 18.0, 27.0, 42.0, 59.0, 113.0, 156.0, 131.0, 80.0, 64.0, 48.0, 30.0, 30.0, 18.0, 19.0, 17.0, 10.0, 12.0, 15.0, 14.0, 9.0, 7.0, 3.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001015548114082776, -9.703602700028569e-05, -9.251724986825138e-05, -8.799846546025947e-05, -8.347968105226755e-05, -7.896090392023325e-05, -7.444211951224133e-05, -6.992333510424942e-05, -6.540455797221512e-05, -6.088577720220201e-05, -5.636699279421009e-05, -5.184821202419698e-05, -4.7329427616205066e-05, -4.281064684619196e-05, -3.829186607617885e-05, -3.377308166818693e-05, -2.9254297260195017e-05, -2.4735514671192504e-05, -2.0216732082189992e-05, -1.5697951312176883e-05, -1.117916872317437e-05, -6.6603861341718584e-06, -2.1416053641587496e-06, 2.3771790438331664e-06, 6.895959813846275e-06, 1.1414742402848788e-05, 1.59335249918513e-05, 2.045230576186441e-05, 2.497108835086692e-05, 2.9489870939869434e-05, 3.400865170988254e-05, 3.852743611787446e-05, 4.304620961192995e-05, 4.756499038194306e-05, 5.208377478993498e-05, 5.660255555994809e-05, 6.112133996794e-05, 6.564012437593192e-05, 7.015890150796622e-05, 7.467768591595814e-05, 7.919647032395005e-05, 8.371525473194197e-05, 8.823403186397627e-05, 9.275281627196819e-05, 9.72716006799601e-05, 0.00010179038508795202, 0.00010630916221998632, 0.00011082794662797824, 0.00011534672376001254, 0.00011986550816800445, 0.00012438428530003875, 0.00012890307698398829, 0.0001334218541160226, 0.0001379406312480569, 0.0001424594083800912, 0.00014697820006404072, 0.00015149697719607502, 0.00015601575432810932, 0.00016053454601205885, 0.00016505332314409316, 0.00016957210027612746, 0.000174090891960077, 0.0001786096690921113, 0.00018312846077606082, 0.00018764723790809512]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 15.0, 8.0, 11.0, 22.0, 25.0, 28.0, 27.0, 25.0, 34.0, 37.0, 50.0, 40.0, 36.0, 42.0, 43.0, 44.0, 48.0, 49.0, 47.0, 41.0, 29.0, 43.0, 34.0, 23.0, 23.0, 22.0, 24.0, 24.0, 12.0, 9.0, 11.0, 10.0, 9.0, 9.0, 5.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.00011980533599853516, -0.0001164628192782402, -0.00011312030255794525, -0.0001097777858376503, -0.00010643526911735535, -0.0001030927523970604, -9.975023567676544e-05, -9.640771895647049e-05, -9.306520223617554e-05, -8.972268551588058e-05, -8.638016879558563e-05, -8.303765207529068e-05, -7.969513535499573e-05, -7.635261863470078e-05, -7.301010191440582e-05, -6.966758519411087e-05, -6.632506847381592e-05, -6.298255175352097e-05, -5.964003503322601e-05, -5.629751831293106e-05, -5.295500159263611e-05, -4.9612484872341156e-05, -4.6269968152046204e-05, -4.292745143175125e-05, -3.95849347114563e-05, -3.6242417991161346e-05, -3.2899901270866394e-05, -2.955738455057144e-05, -2.621486783027649e-05, -2.2872351109981537e-05, -1.9529834389686584e-05, -1.6187317669391632e-05, -1.284480094909668e-05, -9.502284228801727e-06, -6.159767508506775e-06, -2.8172507882118225e-06, 5.252659320831299e-07, 3.867782652378082e-06, 7.210299372673035e-06, 1.0552816092967987e-05, 1.389533281326294e-05, 1.7237849533557892e-05, 2.0580366253852844e-05, 2.3922882974147797e-05, 2.726539969444275e-05, 3.06079164147377e-05, 3.3950433135032654e-05, 3.7292949855327606e-05, 4.063546657562256e-05, 4.397798329591751e-05, 4.732050001621246e-05, 5.0663016736507416e-05, 5.400553345680237e-05, 5.734805017709732e-05, 6.069056689739227e-05, 6.403308361768723e-05, 6.737560033798218e-05, 7.071811705827713e-05, 7.406063377857208e-05, 7.740315049886703e-05, 8.074566721916199e-05, 8.408818393945694e-05, 8.743070065975189e-05, 9.077321738004684e-05, 9.41157341003418e-05]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 7.0, 13.0, 14.0, 23.0, 31.0, 75.0, 104.0, 168.0, 255.0, 464.0, 788.0, 1598.0, 3216.0, 7069.0, 17167.0, 55848.0, 1776680.0, 2251095.0, 49131.0, 15789.0, 6851.0, 3230.0, 1803.0, 966.0, 626.0, 379.0, 247.0, 185.0, 119.0, 69.0, 68.0, 52.0, 26.0, 24.0, 20.0, 10.0, 10.0, 9.0, 11.0, 8.0, 11.0, 4.0, 4.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.622076034545898e-05, -6.290990859270096e-05, -5.959905683994293e-05, -5.6288205087184906e-05, -5.297735333442688e-05, -4.9666501581668854e-05, -4.635564982891083e-05, -4.30447980761528e-05, -3.9733946323394775e-05, -3.642309457063675e-05, -3.311224281787872e-05, -2.9801391065120697e-05, -2.649053931236267e-05, -2.3179687559604645e-05, -1.986883580684662e-05, -1.6557984054088593e-05, -1.3247132301330566e-05, -9.93628054857254e-06, -6.625428795814514e-06, -3.314577043056488e-06, -3.725290298461914e-09, 3.307126462459564e-06, 6.61797821521759e-06, 9.928829967975616e-06, 1.3239681720733643e-05, 1.655053347349167e-05, 1.9861385226249695e-05, 2.317223697900772e-05, 2.6483088731765747e-05, 2.9793940484523773e-05, 3.31047922372818e-05, 3.6415643990039825e-05, 3.972649574279785e-05, 4.303734749555588e-05, 4.6348199248313904e-05, 4.965905100107193e-05, 5.2969902753829956e-05, 5.628075450658798e-05, 5.959160625934601e-05, 6.290245801210403e-05, 6.621330976486206e-05, 6.952416151762009e-05, 7.283501327037811e-05, 7.614586502313614e-05, 7.945671677589417e-05, 8.276756852865219e-05, 8.607842028141022e-05, 8.938927203416824e-05, 9.270012378692627e-05, 9.60109755396843e-05, 9.932182729244232e-05, 0.00010263267904520035, 0.00010594353079795837, 0.0001092543825507164, 0.00011256523430347443, 0.00011587608605623245, 0.00011918693780899048, 0.0001224977895617485, 0.00012580864131450653, 0.00012911949306726456, 0.00013243034482002258, 0.0001357411965727806, 0.00013905204832553864, 0.00014236290007829666, 0.0001456737518310547]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 15.0, 22.0, 24.0, 35.0, 44.0, 83.0, 80.0, 93.0, 94.0, 108.0, 77.0, 83.0, 70.0, 36.0, 37.0, 25.0, 18.0, 15.0, 7.0, 3.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.6153790056705475e-05, -1.526065170764923e-05, -1.4367513358592987e-05, -1.3474375009536743e-05, -1.25812366604805e-05, -1.1688098311424255e-05, -1.0794959962368011e-05, -9.901821613311768e-06, -9.008683264255524e-06, -8.11554491519928e-06, -7.222406566143036e-06, -6.329268217086792e-06, -5.436129868030548e-06, -4.542991518974304e-06, -3.6498531699180603e-06, -2.7567148208618164e-06, -1.8635764718055725e-06, -9.704381227493286e-07, -7.729977369308472e-08, 8.158385753631592e-07, 1.708976924419403e-06, 2.602115273475647e-06, 3.495253622531891e-06, 4.388391971588135e-06, 5.281530320644379e-06, 6.1746686697006226e-06, 7.0678070187568665e-06, 7.96094536781311e-06, 8.854083716869354e-06, 9.747222065925598e-06, 1.0640360414981842e-05, 1.1533498764038086e-05, 1.242663711309433e-05, 1.3319775462150574e-05, 1.4212913811206818e-05, 1.5106052160263062e-05, 1.5999190509319305e-05, 1.689232885837555e-05, 1.7785467207431793e-05, 1.8678605556488037e-05, 1.957174390554428e-05, 2.0464882254600525e-05, 2.135802060365677e-05, 2.2251158952713013e-05, 2.3144297301769257e-05, 2.40374356508255e-05, 2.4930573999881744e-05, 2.5823712348937988e-05, 2.6716850697994232e-05, 2.7609989047050476e-05, 2.850312739610672e-05, 2.9396265745162964e-05, 3.0289404094219208e-05, 3.118254244327545e-05, 3.2075680792331696e-05, 3.296881914138794e-05, 3.386195749044418e-05, 3.475509583950043e-05, 3.564823418855667e-05, 3.6541372537612915e-05, 3.743451088666916e-05, 3.83276492357254e-05, 3.922078758478165e-05, 4.011392593383789e-05]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 7.0, 7.0, 15.0, 27.0, 38.0, 58.0, 84.0, 125.0, 180.0, 248.0, 451.0, 694.0, 1111.0, 1831.0, 3195.0, 5861.0, 10516.0, 22340.0, 49801.0, 147669.0, 2898538.0, 862271.0, 111187.0, 38944.0, 17875.0, 9211.0, 4868.0, 2751.0, 1606.0, 1009.0, 632.0, 372.0, 257.0, 157.0, 116.0, 77.0, 50.0, 31.0, 20.0, 20.0, 9.0, 7.0, 6.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.220008850097656e-05, -4.0685757994651794e-05, -3.9171427488327026e-05, -3.765709698200226e-05, -3.614276647567749e-05, -3.462843596935272e-05, -3.3114105463027954e-05, -3.1599774956703186e-05, -3.0085444450378418e-05, -2.857111394405365e-05, -2.7056783437728882e-05, -2.5542452931404114e-05, -2.4028122425079346e-05, -2.2513791918754578e-05, -2.099946141242981e-05, -1.948513090610504e-05, -1.7970800399780273e-05, -1.6456469893455505e-05, -1.4942139387130737e-05, -1.342780888080597e-05, -1.1913478374481201e-05, -1.0399147868156433e-05, -8.884817361831665e-06, -7.370486855506897e-06, -5.856156349182129e-06, -4.341825842857361e-06, -2.8274953365325928e-06, -1.3131648302078247e-06, 2.0116567611694336e-07, 1.7154961824417114e-06, 3.2298266887664795e-06, 4.7441571950912476e-06, 6.258487701416016e-06, 7.772818207740784e-06, 9.287148714065552e-06, 1.080147922039032e-05, 1.2315809726715088e-05, 1.3830140233039856e-05, 1.5344470739364624e-05, 1.6858801245689392e-05, 1.837313175201416e-05, 1.9887462258338928e-05, 2.1401792764663696e-05, 2.2916123270988464e-05, 2.4430453777313232e-05, 2.5944784283638e-05, 2.745911478996277e-05, 2.8973445296287537e-05, 3.0487775802612305e-05, 3.200210630893707e-05, 3.351643681526184e-05, 3.503076732158661e-05, 3.654509782791138e-05, 3.8059428334236145e-05, 3.957375884056091e-05, 4.108808934688568e-05, 4.260241985321045e-05, 4.411675035953522e-05, 4.5631080865859985e-05, 4.7145411372184753e-05, 4.865974187850952e-05, 5.017407238483429e-05, 5.168840289115906e-05, 5.3202733397483826e-05, 5.4717063903808594e-05]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 9.0, 12.0, 8.0, 14.0, 19.0, 29.0, 30.0, 46.0, 54.0, 99.0, 120.0, 382.0, 1093.0, 1250.0, 363.0, 140.0, 87.0, 70.0, 50.0, 35.0, 34.0, 19.0, 18.0, 16.0, 17.0, 12.0, 13.0, 4.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314018249511719e-05, -3.181491047143936e-05, -3.0489638447761536e-05, -2.916436642408371e-05, -2.7839094400405884e-05, -2.6513822376728058e-05, -2.5188550353050232e-05, -2.3863278329372406e-05, -2.253800630569458e-05, -2.1212734282016754e-05, -1.9887462258338928e-05, -1.8562190234661102e-05, -1.7236918210983276e-05, -1.591164618730545e-05, -1.4586374163627625e-05, -1.3261102139949799e-05, -1.1935830116271973e-05, -1.0610558092594147e-05, -9.28528606891632e-06, -7.960014045238495e-06, -6.634742021560669e-06, -5.309469997882843e-06, -3.984197974205017e-06, -2.658925950527191e-06, -1.3336539268493652e-06, -8.381903171539307e-09, 1.3168901205062866e-06, 2.6421621441841125e-06, 3.9674341678619385e-06, 5.292706191539764e-06, 6.61797821521759e-06, 7.943250238895416e-06, 9.268522262573242e-06, 1.0593794286251068e-05, 1.1919066309928894e-05, 1.324433833360672e-05, 1.4569610357284546e-05, 1.5894882380962372e-05, 1.7220154404640198e-05, 1.8545426428318024e-05, 1.987069845199585e-05, 2.1195970475673676e-05, 2.25212424993515e-05, 2.3846514523029327e-05, 2.5171786546707153e-05, 2.649705857038498e-05, 2.7822330594062805e-05, 2.914760261774063e-05, 3.0472874641418457e-05, 3.179814666509628e-05, 3.312341868877411e-05, 3.4448690712451935e-05, 3.577396273612976e-05, 3.709923475980759e-05, 3.842450678348541e-05, 3.974977880716324e-05, 4.1075050830841064e-05, 4.240032285451889e-05, 4.3725594878196716e-05, 4.505086690187454e-05, 4.637613892555237e-05, 4.7701410949230194e-05, 4.902668297290802e-05, 5.0351954996585846e-05, 5.167722702026367e-05]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 8.0, 15.0, 20.0, 33.0, 44.0, 59.0, 115.0, 149.0, 135.0, 109.0, 68.0, 57.0, 43.0, 35.0, 23.0, 18.0, 18.0, 11.0, 6.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027326837880536914, -0.00026493685436435044, -0.0002566053590271622, -0.0002482738345861435, -0.0002399423101451248, -0.00023161080025602132, -0.00022327929036691785, -0.00021494776592589915, -0.00020661625603679568, -0.0001982847461476922, -0.0001899532217066735, -0.00018162171181757003, -0.00017329020192846656, -0.00016495867748744786, -0.00015662716759834439, -0.0001482956577092409, -0.0001399641332682222, -0.00013163262337911874, -0.00012330109893810004, -0.00011496958904899657, -0.00010663807188393548, -9.83065547188744e-05, -8.997504482977092e-05, -8.164352766470984e-05, -7.331201049964875e-05, -6.498049333458766e-05, -5.6648979807505384e-05, -4.8317466280423105e-05, -3.998594911536202e-05, -3.165443195030093e-05, -2.3322918423218653e-05, -1.4991404896136373e-05, -6.659887731075287e-06, 1.671627614996396e-06, 1.0003142961068079e-05, 1.8334658307139762e-05, 2.6666173653211445e-05, 3.499769081827253e-05, 4.332920434535481e-05, 5.166071787243709e-05, 5.9992235037498176e-05, 6.832375220255926e-05, 7.665526936762035e-05, 8.498677925672382e-05, 9.331829642178491e-05, 0.000101649813586846, 0.00010998132347594947, 0.00011831284064101055, 0.00012664435780607164, 0.0001349758676951751, 0.0001433073921361938, 0.00015163890202529728, 0.00015997042646631598, 0.00016830193635541946, 0.00017663344624452293, 0.00018496497068554163, 0.0001932964805746451, 0.00020162799046374857, 0.00020995951490476727, 0.00021829102479387075, 0.00022662253468297422, 0.00023495405912399292, 0.0002432855690130964, 0.00025161707890219986, 0.00025994860334321856]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 2.0, 7.0, 7.0, 9.0, 11.0, 20.0, 22.0, 27.0, 23.0, 30.0, 23.0, 21.0, 23.0, 37.0, 27.0, 42.0, 40.0, 45.0, 36.0, 35.0, 43.0, 29.0, 37.0, 39.0, 28.0, 34.0, 39.0, 31.0, 22.0, 21.0, 27.0, 30.0, 14.0, 26.0, 14.0, 14.0, 6.0, 10.0, 9.0, 2.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0001087188720703125, -0.00010519009083509445, -0.0001016613095998764, -9.813252836465836e-05, -9.460374712944031e-05, -9.107496589422226e-05, -8.754618465900421e-05, -8.401740342378616e-05, -8.048862218856812e-05, -7.695984095335007e-05, -7.343105971813202e-05, -6.990227848291397e-05, -6.637349724769592e-05, -6.284471601247787e-05, -5.931593477725983e-05, -5.578715354204178e-05, -5.225837230682373e-05, -4.872959107160568e-05, -4.5200809836387634e-05, -4.1672028601169586e-05, -3.814324736595154e-05, -3.461446613073349e-05, -3.108568489551544e-05, -2.7556903660297394e-05, -2.4028122425079346e-05, -2.0499341189861298e-05, -1.697055995464325e-05, -1.3441778719425201e-05, -9.912997484207153e-06, -6.384216248989105e-06, -2.855435013771057e-06, 6.73346221446991e-07, 4.202127456665039e-06, 7.730908691883087e-06, 1.1259689927101135e-05, 1.4788471162319183e-05, 1.831725239753723e-05, 2.184603363275528e-05, 2.5374814867973328e-05, 2.8903596103191376e-05, 3.2432377338409424e-05, 3.596115857362747e-05, 3.948993980884552e-05, 4.301872104406357e-05, 4.6547502279281616e-05, 5.0076283514499664e-05, 5.360506474971771e-05, 5.713384598493576e-05, 6.066262722015381e-05, 6.419140845537186e-05, 6.77201896905899e-05, 7.124897092580795e-05, 7.4777752161026e-05, 7.830653339624405e-05, 8.18353146314621e-05, 8.536409586668015e-05, 8.88928771018982e-05, 9.242165833711624e-05, 9.595043957233429e-05, 9.947922080755234e-05, 0.00010300800204277039, 0.00010653678327798843, 0.00011006556451320648, 0.00011359434574842453, 0.00011712312698364258]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 9.0, 15.0, 17.0, 15.0, 22.0, 32.0, 37.0, 55.0, 79.0, 113.0, 220.0, 379.0, 757.0, 1651.0, 4128.0, 11532.0, 39511.0, 198453.0, 662888.0, 93086.0, 22746.0, 7299.0, 2851.0, 1274.0, 547.0, 285.0, 180.0, 101.0, 60.0, 52.0, 36.0, 31.0, 20.0, 12.0, 15.0, 8.0, 7.0, 6.0, 7.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016188621520996094, -0.0001563597470521927, -0.00015083327889442444, -0.0001453068107366562, -0.00013978034257888794, -0.0001342538744211197, -0.00012872740626335144, -0.0001232009381055832, -0.00011767446994781494, -0.00011214800179004669, -0.00010662153363227844, -0.00010109506547451019, -9.556859731674194e-05, -9.00421291589737e-05, -8.451566100120544e-05, -7.89891928434372e-05, -7.346272468566895e-05, -6.79362565279007e-05, -6.240978837013245e-05, -5.68833202123642e-05, -5.135685205459595e-05, -4.58303838968277e-05, -4.030391573905945e-05, -3.47774475812912e-05, -2.925097942352295e-05, -2.37245112657547e-05, -1.819804310798645e-05, -1.26715749502182e-05, -7.145106792449951e-06, -1.6186386346817017e-06, 3.907829523086548e-06, 9.434297680854797e-06, 1.4960765838623047e-05, 2.0487233996391296e-05, 2.6013702154159546e-05, 3.1540170311927795e-05, 3.7066638469696045e-05, 4.2593106627464294e-05, 4.8119574785232544e-05, 5.3646042943000793e-05, 5.917251110076904e-05, 6.469897925853729e-05, 7.022544741630554e-05, 7.575191557407379e-05, 8.127838373184204e-05, 8.680485188961029e-05, 9.233132004737854e-05, 9.785778820514679e-05, 0.00010338425636291504, 0.00010891072452068329, 0.00011443719267845154, 0.00011996366083621979, 0.00012549012899398804, 0.0001310165971517563, 0.00013654306530952454, 0.00014206953346729279, 0.00014759600162506104, 0.00015312246978282928, 0.00015864893794059753, 0.00016417540609836578, 0.00016970187425613403, 0.00017522834241390228, 0.00018075481057167053, 0.00018628127872943878, 0.00019180774688720703]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 18.0, 13.0, 21.0, 28.0, 45.0, 59.0, 77.0, 129.0, 111.0, 98.0, 87.0, 85.0, 53.0, 49.0, 44.0, 25.0, 16.0, 11.0, 6.0, 1.0, 7.0, 8.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7702579498291016e-05, -1.6722828149795532e-05, -1.574307680130005e-05, -1.4763325452804565e-05, -1.3783574104309082e-05, -1.2803822755813599e-05, -1.1824071407318115e-05, -1.0844320058822632e-05, -9.864568710327148e-06, -8.884817361831665e-06, -7.905066013336182e-06, -6.925314664840698e-06, -5.945563316345215e-06, -4.9658119678497314e-06, -3.986060619354248e-06, -3.0063092708587646e-06, -2.0265579223632812e-06, -1.0468065738677979e-06, -6.705522537231445e-08, 9.126961231231689e-07, 1.8924474716186523e-06, 2.8721988201141357e-06, 3.851950168609619e-06, 4.8317015171051025e-06, 5.811452865600586e-06, 6.791204214096069e-06, 7.770955562591553e-06, 8.750706911087036e-06, 9.73045825958252e-06, 1.0710209608078003e-05, 1.1689960956573486e-05, 1.266971230506897e-05, 1.3649463653564453e-05, 1.4629215002059937e-05, 1.560896635055542e-05, 1.6588717699050903e-05, 1.7568469047546387e-05, 1.854822039604187e-05, 1.9527971744537354e-05, 2.0507723093032837e-05, 2.148747444152832e-05, 2.2467225790023804e-05, 2.3446977138519287e-05, 2.442672848701477e-05, 2.5406479835510254e-05, 2.6386231184005737e-05, 2.736598253250122e-05, 2.8345733880996704e-05, 2.9325485229492188e-05, 3.030523657798767e-05, 3.1284987926483154e-05, 3.226473927497864e-05, 3.324449062347412e-05, 3.4224241971969604e-05, 3.520399332046509e-05, 3.618374466896057e-05, 3.7163496017456055e-05, 3.814324736595154e-05, 3.912299871444702e-05, 4.0102750062942505e-05, 4.108250141143799e-05, 4.206225275993347e-05, 4.3042004108428955e-05, 4.402175545692444e-05, 4.500150680541992e-05]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 11.0, 15.0, 22.0, 38.0, 60.0, 82.0, 119.0, 172.0, 230.0, 365.0, 554.0, 886.0, 1396.0, 2162.0, 3296.0, 4971.0, 8615.0, 14098.0, 24181.0, 42490.0, 78646.0, 174956.0, 387448.0, 142763.0, 68505.0, 37365.0, 21555.0, 12594.0, 7493.0, 4770.0, 3038.0, 1958.0, 1302.0, 793.0, 501.0, 362.0, 217.0, 160.0, 117.0, 79.0, 39.0, 42.0, 23.0, 15.0, 14.0, 10.0, 5.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-3.653764724731445e-05, -3.540981560945511e-05, -3.4281983971595764e-05, -3.315415233373642e-05, -3.2026320695877075e-05, -3.089848905801773e-05, -2.9770657420158386e-05, -2.8642825782299042e-05, -2.7514994144439697e-05, -2.6387162506580353e-05, -2.5259330868721008e-05, -2.4131499230861664e-05, -2.300366759300232e-05, -2.1875835955142975e-05, -2.074800431728363e-05, -1.9620172679424286e-05, -1.849234104156494e-05, -1.7364509403705597e-05, -1.6236677765846252e-05, -1.5108846127986908e-05, -1.3981014490127563e-05, -1.2853182852268219e-05, -1.1725351214408875e-05, -1.059751957654953e-05, -9.469687938690186e-06, -8.341856300830841e-06, -7.214024662971497e-06, -6.086193025112152e-06, -4.958361387252808e-06, -3.830529749393463e-06, -2.7026981115341187e-06, -1.5748664736747742e-06, -4.470348358154297e-07, 6.807968020439148e-07, 1.8086284399032593e-06, 2.9364600777626038e-06, 4.064291715621948e-06, 5.192123353481293e-06, 6.319954991340637e-06, 7.447786629199982e-06, 8.575618267059326e-06, 9.70344990491867e-06, 1.0831281542778015e-05, 1.195911318063736e-05, 1.3086944818496704e-05, 1.4214776456356049e-05, 1.5342608094215393e-05, 1.6470439732074738e-05, 1.7598271369934082e-05, 1.8726103007793427e-05, 1.985393464565277e-05, 2.0981766283512115e-05, 2.210959792137146e-05, 2.3237429559230804e-05, 2.436526119709015e-05, 2.5493092834949493e-05, 2.6620924472808838e-05, 2.7748756110668182e-05, 2.8876587748527527e-05, 3.000441938638687e-05, 3.1132251024246216e-05, 3.226008266210556e-05, 3.3387914299964905e-05, 3.451574593782425e-05, 3.5643577575683594e-05]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 6.0, 8.0, 9.0, 11.0, 13.0, 14.0, 24.0, 20.0, 30.0, 27.0, 29.0, 32.0, 29.0, 28.0, 47.0, 42.0, 41.0, 55.0, 35.0, 35.0, 38.0, 36.0, 34.0, 32.0, 41.0, 42.0, 26.0, 21.0, 31.0, 27.0, 19.0, 14.0, 17.0, 14.0, 9.0, 11.0, 7.0, 10.0, 8.0, 1.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.218650817871094e-05, -3.105495125055313e-05, -2.9923394322395325e-05, -2.879183739423752e-05, -2.7660280466079712e-05, -2.6528723537921906e-05, -2.53971666097641e-05, -2.4265609681606293e-05, -2.3134052753448486e-05, -2.200249582529068e-05, -2.0870938897132874e-05, -1.9739381968975067e-05, -1.860782504081726e-05, -1.7476268112659454e-05, -1.6344711184501648e-05, -1.5213154256343842e-05, -1.4081597328186035e-05, -1.2950040400028229e-05, -1.1818483471870422e-05, -1.0686926543712616e-05, -9.55536961555481e-06, -8.423812687397003e-06, -7.292255759239197e-06, -6.16069883108139e-06, -5.029141902923584e-06, -3.897584974765778e-06, -2.766028046607971e-06, -1.6344711184501648e-06, -5.029141902923584e-07, 6.28642737865448e-07, 1.7601996660232544e-06, 2.891756594181061e-06, 4.023313522338867e-06, 5.154870450496674e-06, 6.28642737865448e-06, 7.417984306812286e-06, 8.549541234970093e-06, 9.6810981631279e-06, 1.0812655091285706e-05, 1.1944212019443512e-05, 1.3075768947601318e-05, 1.4207325875759125e-05, 1.533888280391693e-05, 1.6470439732074738e-05, 1.7601996660232544e-05, 1.873355358839035e-05, 1.9865110516548157e-05, 2.0996667444705963e-05, 2.212822437286377e-05, 2.3259781301021576e-05, 2.4391338229179382e-05, 2.552289515733719e-05, 2.6654452085494995e-05, 2.77860090136528e-05, 2.8917565941810608e-05, 3.0049122869968414e-05, 3.118067979812622e-05, 3.231223672628403e-05, 3.3443793654441833e-05, 3.457535058259964e-05, 3.5706907510757446e-05, 3.683846443891525e-05, 3.797002136707306e-05, 3.9101578295230865e-05, 4.023313522338867e-05]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 4.0, 13.0, 15.0, 18.0, 36.0, 41.0, 67.0, 112.0, 118.0, 169.0, 352.0, 449.0, 758.0, 1750.0, 2528.0, 4789.0, 15336.0, 31981.0, 192368.0, 547148.0, 170110.0, 53813.0, 12976.0, 5906.0, 3752.0, 1466.0, 826.0, 675.0, 316.0, 237.0, 118.0, 77.0, 76.0, 34.0, 29.0, 22.0, 11.0, 7.0, 13.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.7220458984375e-06, -5.521811544895172e-06, -5.321577191352844e-06, -5.121342837810516e-06, -4.9211084842681885e-06, -4.720874130725861e-06, -4.520639777183533e-06, -4.320405423641205e-06, -4.120171070098877e-06, -3.919936716556549e-06, -3.719702363014221e-06, -3.5194680094718933e-06, -3.3192336559295654e-06, -3.1189993023872375e-06, -2.9187649488449097e-06, -2.7185305953025818e-06, -2.518296241760254e-06, -2.318061888217926e-06, -2.117827534675598e-06, -1.9175931811332703e-06, -1.7173588275909424e-06, -1.5171244740486145e-06, -1.3168901205062866e-06, -1.1166557669639587e-06, -9.164214134216309e-07, -7.16187059879303e-07, -5.159527063369751e-07, -3.157183527946472e-07, -1.1548399925231934e-07, 8.475035429000854e-08, 2.849847078323364e-07, 4.852190613746643e-07, 6.854534149169922e-07, 8.856877684593201e-07, 1.085922122001648e-06, 1.2861564755439758e-06, 1.4863908290863037e-06, 1.6866251826286316e-06, 1.8868595361709595e-06, 2.0870938897132874e-06, 2.2873282432556152e-06, 2.487562596797943e-06, 2.687796950340271e-06, 2.888031303882599e-06, 3.0882656574249268e-06, 3.2885000109672546e-06, 3.4887343645095825e-06, 3.6889687180519104e-06, 3.889203071594238e-06, 4.089437425136566e-06, 4.289671778678894e-06, 4.489906132221222e-06, 4.69014048576355e-06, 4.890374839305878e-06, 5.0906091928482056e-06, 5.2908435463905334e-06, 5.491077899932861e-06, 5.691312253475189e-06, 5.891546607017517e-06, 6.091780960559845e-06, 6.292015314102173e-06, 6.492249667644501e-06, 6.692484021186829e-06, 6.8927183747291565e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 8.0, 8.0, 36.0, 25.0, 29.0, 101.0, 49.0, 67.0, 69.0, 166.0, 71.0, 76.0, 59.0, 83.0, 36.0, 37.0, 23.0, 33.0, 5.0, 6.0, 10.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.7855858206748962e-06, -2.7101486921310425e-06, -2.6347115635871887e-06, -2.559274435043335e-06, -2.483837306499481e-06, -2.4084001779556274e-06, -2.3329630494117737e-06, -2.25752592086792e-06, -2.182088792324066e-06, -2.1066516637802124e-06, -2.0312145352363586e-06, -1.955777406692505e-06, -1.8803402781486511e-06, -1.8049031496047974e-06, -1.7294660210609436e-06, -1.6540288925170898e-06, -1.578591763973236e-06, -1.5031546354293823e-06, -1.4277175068855286e-06, -1.3522803783416748e-06, -1.276843249797821e-06, -1.2014061212539673e-06, -1.1259689927101135e-06, -1.0505318641662598e-06, -9.75094735622406e-07, -8.996576070785522e-07, -8.242204785346985e-07, -7.487833499908447e-07, -6.73346221446991e-07, -5.979090929031372e-07, -5.224719643592834e-07, -4.470348358154297e-07, -3.7159770727157593e-07, -2.9616057872772217e-07, -2.207234501838684e-07, -1.4528632164001465e-07, -6.984919309616089e-08, 5.587935447692871e-09, 8.102506399154663e-08, 1.564621925354004e-07, 2.3189932107925415e-07, 3.073364496231079e-07, 3.8277357816696167e-07, 4.5821070671081543e-07, 5.336478352546692e-07, 6.09084963798523e-07, 6.845220923423767e-07, 7.599592208862305e-07, 8.353963494300842e-07, 9.10833477973938e-07, 9.862706065177917e-07, 1.0617077350616455e-06, 1.1371448636054993e-06, 1.212581992149353e-06, 1.2880191206932068e-06, 1.3634562492370605e-06, 1.4388933777809143e-06, 1.514330506324768e-06, 1.5897676348686218e-06, 1.6652047634124756e-06, 1.7406418919563293e-06, 1.816079020500183e-06, 1.8915161490440369e-06, 1.9669532775878906e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 6.0, 16.0, 12.0, 29.0, 17.0, 75.0, 56.0, 119.0, 229.0, 174.0, 466.0, 320.0, 996.0, 749.0, 2345.0, 1870.0, 5924.0, 5057.0, 18607.0, 17253.0, 75084.0, 84765.0, 452493.0, 168449.0, 130973.0, 45195.0, 11183.0, 12494.0, 3585.0, 4376.0, 1354.0, 1742.0, 587.0, 765.0, 229.0, 363.0, 107.0, 170.0, 64.0, 94.0, 60.0, 20.0, 26.0, 6.0, 18.0, 7.0, 5.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.8014183044433594e-06, -2.7101486921310425e-06, -2.6188790798187256e-06, -2.5276094675064087e-06, -2.436339855194092e-06, -2.345070242881775e-06, -2.253800630569458e-06, -2.162531018257141e-06, -2.0712614059448242e-06, -1.9799917936325073e-06, -1.8887221813201904e-06, -1.7974525690078735e-06, -1.7061829566955566e-06, -1.6149133443832397e-06, -1.5236437320709229e-06, -1.432374119758606e-06, -1.341104507446289e-06, -1.2498348951339722e-06, -1.1585652828216553e-06, -1.0672956705093384e-06, -9.760260581970215e-07, -8.847564458847046e-07, -7.934868335723877e-07, -7.022172212600708e-07, -6.109476089477539e-07, -5.19677996635437e-07, -4.284083843231201e-07, -3.371387720108032e-07, -2.4586915969848633e-07, -1.5459954738616943e-07, -6.332993507385254e-08, 2.7939677238464355e-08, 1.1920928955078125e-07, 2.1047890186309814e-07, 3.0174851417541504e-07, 3.9301812648773193e-07, 4.842877388000488e-07, 5.755573511123657e-07, 6.668269634246826e-07, 7.580965757369995e-07, 8.493661880493164e-07, 9.406358003616333e-07, 1.0319054126739502e-06, 1.123175024986267e-06, 1.214444637298584e-06, 1.3057142496109009e-06, 1.3969838619232178e-06, 1.4882534742355347e-06, 1.5795230865478516e-06, 1.6707926988601685e-06, 1.7620623111724854e-06, 1.8533319234848022e-06, 1.944601535797119e-06, 2.035871148109436e-06, 2.127140760421753e-06, 2.21841037273407e-06, 2.3096799850463867e-06, 2.4009495973587036e-06, 2.4922192096710205e-06, 2.5834888219833374e-06, 2.6747584342956543e-06, 2.766028046607971e-06, 2.857297658920288e-06, 2.948567271232605e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 5.0, 4.0, 11.0, 7.0, 16.0, 9.0, 9.0, 29.0, 11.0, 41.0, 42.0, 56.0, 39.0, 87.0, 37.0, 87.0, 47.0, 45.0, 74.0, 32.0, 66.0, 34.0, 56.0, 28.0, 38.0, 14.0, 10.0, 10.0, 4.0, 13.0, 6.0, 5.0, 0.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.682209014892578e-06, -2.5955960154533386e-06, -2.508983016014099e-06, -2.4223700165748596e-06, -2.33575701713562e-06, -2.2491440176963806e-06, -2.162531018257141e-06, -2.0759180188179016e-06, -1.989305019378662e-06, -1.9026920199394226e-06, -1.816079020500183e-06, -1.7294660210609436e-06, -1.642853021621704e-06, -1.5562400221824646e-06, -1.469627022743225e-06, -1.3830140233039856e-06, -1.296401023864746e-06, -1.2097880244255066e-06, -1.123175024986267e-06, -1.0365620255470276e-06, -9.499490261077881e-07, -8.633360266685486e-07, -7.767230272293091e-07, -6.901100277900696e-07, -6.034970283508301e-07, -5.168840289115906e-07, -4.302710294723511e-07, -3.4365803003311157e-07, -2.5704503059387207e-07, -1.7043203115463257e-07, -8.381903171539307e-08, 2.7939677238464355e-09, 8.940696716308594e-08, 1.7601996660232544e-07, 2.6263296604156494e-07, 3.4924596548080444e-07, 4.3585896492004395e-07, 5.224719643592834e-07, 6.09084963798523e-07, 6.956979632377625e-07, 7.82310962677002e-07, 8.689239621162415e-07, 9.55536961555481e-07, 1.0421499609947205e-06, 1.12876296043396e-06, 1.2153759598731995e-06, 1.301988959312439e-06, 1.3886019587516785e-06, 1.475214958190918e-06, 1.5618279576301575e-06, 1.648440957069397e-06, 1.7350539565086365e-06, 1.821666955947876e-06, 1.9082799553871155e-06, 1.994892954826355e-06, 2.0815059542655945e-06, 2.168118953704834e-06, 2.2547319531440735e-06, 2.341344952583313e-06, 2.4279579520225525e-06, 2.514570951461792e-06, 2.6011839509010315e-06, 2.687796950340271e-06, 2.7744099497795105e-06, 2.86102294921875e-06]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 12.0, 10.0, 18.0, 17.0, 29.0, 23.0, 49.0, 65.0, 100.0, 121.0, 146.0, 101.0, 77.0, 44.0, 34.0, 32.0, 27.0, 10.0, 13.0, 10.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012000883725704625, -0.00011558320693438873, -0.0001111575766117312, -0.00010673194628907368, -0.00010230631596641615, -9.788068564375862e-05, -9.345506259705871e-05, -8.902943227440119e-05, -8.460380195174366e-05, -8.017817162908614e-05, -7.575254130642861e-05, -7.132691098377109e-05, -6.690128066111356e-05, -6.247565033845603e-05, -5.8050023653777316e-05, -5.362439333111979e-05, -4.919875937048346e-05, -4.477312904782593e-05, -4.034749872516841e-05, -3.592186840251088e-05, -3.1496238079853356e-05, -2.7070609576185234e-05, -2.2644981072517112e-05, -1.8219350749859586e-05, -1.379372042720206e-05, -9.368090104544535e-06, -4.9424606913817115e-06, -5.168312782188877e-07, 3.908799044438638e-06, 8.334429367096163e-06, 1.2760057870764285e-05, 1.718568819342181e-05, 2.1611311240121722e-05, 2.6036941562779248e-05, 3.0462571885436773e-05, 3.48882022080943e-05, 3.9313832530751824e-05, 4.373946285340935e-05, 4.816508953808807e-05, 5.2590719860745594e-05, 5.701635018340312e-05, 6.144197686808184e-05, 6.586760719073936e-05, 7.029323751339689e-05, 7.471886783605441e-05, 7.914449815871194e-05, 8.357012848136947e-05, 8.799575880402699e-05, 9.242138912668452e-05, 9.684701944934204e-05, 0.00010127264977199957, 0.0001056982800946571, 0.00011012391041731462, 0.00011454954073997214, 0.00011897516378667206, 0.00012340079410932958, 0.0001278264244319871, 0.00013225205475464463, 0.00013667768507730216, 0.00014110331539995968, 0.0001455289457226172, 0.00014995457604527473, 0.00015438020636793226, 0.00015880583669058979, 0.0001632314670132473]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 4.0, 10.0, 7.0, 8.0, 17.0, 10.0, 25.0, 29.0, 26.0, 26.0, 41.0, 24.0, 36.0, 33.0, 31.0, 40.0, 45.0, 50.0, 42.0, 52.0, 48.0, 35.0, 40.0, 37.0, 35.0, 32.0, 32.0, 28.0, 25.0, 21.0, 18.0, 17.0, 13.0, 12.0, 7.0, 9.0, 8.0, 7.0, 2.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.626150131225586e-05, -9.318534284830093e-05, -9.010918438434601e-05, -8.703302592039108e-05, -8.395686745643616e-05, -8.088070899248123e-05, -7.78045505285263e-05, -7.472839206457138e-05, -7.165223360061646e-05, -6.857607513666153e-05, -6.54999166727066e-05, -6.242375820875168e-05, -5.934759974479675e-05, -5.627144128084183e-05, -5.31952828168869e-05, -5.0119124352931976e-05, -4.704296588897705e-05, -4.3966807425022125e-05, -4.08906489610672e-05, -3.7814490497112274e-05, -3.473833203315735e-05, -3.166217356920242e-05, -2.8586015105247498e-05, -2.5509856641292572e-05, -2.2433698177337646e-05, -1.935753971338272e-05, -1.6281381249427795e-05, -1.320522278547287e-05, -1.0129064321517944e-05, -7.052905857563019e-06, -3.976747393608093e-06, -9.005889296531677e-07, 2.175569534301758e-06, 5.251727998256683e-06, 8.327886462211609e-06, 1.1404044926166534e-05, 1.448020339012146e-05, 1.7556361854076385e-05, 2.063252031803131e-05, 2.3708678781986237e-05, 2.6784837245941162e-05, 2.9860995709896088e-05, 3.293715417385101e-05, 3.601331263780594e-05, 3.9089471101760864e-05, 4.216562956571579e-05, 4.5241788029670715e-05, 4.831794649362564e-05, 5.1394104957580566e-05, 5.447026342153549e-05, 5.754642188549042e-05, 6.062258034944534e-05, 6.369873881340027e-05, 6.67748972773552e-05, 6.985105574131012e-05, 7.292721420526505e-05, 7.600337266921997e-05, 7.90795311331749e-05, 8.215568959712982e-05, 8.523184806108475e-05, 8.830800652503967e-05, 9.13841649889946e-05, 9.446032345294952e-05, 9.753648191690445e-05, 0.00010061264038085938]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 5.0, 8.0, 9.0, 24.0, 31.0, 57.0, 108.0, 191.0, 273.0, 480.0, 916.0, 1682.0, 3428.0, 7699.0, 20947.0, 89695.0, 3901271.0, 129474.0, 22086.0, 8372.0, 3440.0, 1680.0, 923.0, 498.0, 288.0, 201.0, 110.0, 106.0, 59.0, 39.0, 39.0, 31.0, 18.0, 20.0, 13.0, 6.0, 6.0, 11.0, 11.0, 6.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.793571472167969e-05, -5.463697016239166e-05, -5.133822560310364e-05, -4.803948104381561e-05, -4.474073648452759e-05, -4.144199192523956e-05, -3.814324736595154e-05, -3.484450280666351e-05, -3.154575824737549e-05, -2.8247013688087463e-05, -2.494826912879944e-05, -2.1649524569511414e-05, -1.835078001022339e-05, -1.5052035450935364e-05, -1.1753290891647339e-05, -8.454546332359314e-06, -5.155801773071289e-06, -1.8570572137832642e-06, 1.4416873455047607e-06, 4.740431904792786e-06, 8.03917646408081e-06, 1.1337921023368835e-05, 1.463666558265686e-05, 1.7935410141944885e-05, 2.123415470123291e-05, 2.4532899260520935e-05, 2.783164381980896e-05, 3.1130388379096985e-05, 3.442913293838501e-05, 3.7727877497673035e-05, 4.102662205696106e-05, 4.4325366616249084e-05, 4.762411117553711e-05, 5.0922855734825134e-05, 5.422160029411316e-05, 5.7520344853401184e-05, 6.081908941268921e-05, 6.411783397197723e-05, 6.741657853126526e-05, 7.071532309055328e-05, 7.401406764984131e-05, 7.731281220912933e-05, 8.061155676841736e-05, 8.391030132770538e-05, 8.720904588699341e-05, 9.050779044628143e-05, 9.380653500556946e-05, 9.710527956485748e-05, 0.00010040402412414551, 0.00010370276868343353, 0.00010700151324272156, 0.00011030025780200958, 0.00011359900236129761, 0.00011689774692058563, 0.00012019649147987366, 0.00012349523603916168, 0.0001267939805984497, 0.00013009272515773773, 0.00013339146971702576, 0.00013669021427631378, 0.0001399889588356018, 0.00014328770339488983, 0.00014658644795417786, 0.00014988519251346588, 0.0001531839370727539]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 4.0, 3.0, 7.0, 13.0, 19.0, 14.0, 40.0, 38.0, 54.0, 67.0, 89.0, 100.0, 100.0, 83.0, 79.0, 87.0, 55.0, 44.0, 36.0, 24.0, 13.0, 10.0, 7.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6748905181884766e-05, -1.585017889738083e-05, -1.4951452612876892e-05, -1.4052726328372955e-05, -1.3154000043869019e-05, -1.2255273759365082e-05, -1.1356547474861145e-05, -1.0457821190357208e-05, -9.559094905853271e-06, -8.660368621349335e-06, -7.761642336845398e-06, -6.862916052341461e-06, -5.964189767837524e-06, -5.065463483333588e-06, -4.166737198829651e-06, -3.268010914325714e-06, -2.3692846298217773e-06, -1.4705583453178406e-06, -5.718320608139038e-07, 3.2689422369003296e-07, 1.2256205081939697e-06, 2.1243467926979065e-06, 3.0230730772018433e-06, 3.92179936170578e-06, 4.820525646209717e-06, 5.7192519307136536e-06, 6.61797821521759e-06, 7.516704499721527e-06, 8.415430784225464e-06, 9.3141570687294e-06, 1.0212883353233337e-05, 1.1111609637737274e-05, 1.2010335922241211e-05, 1.2909062206745148e-05, 1.3807788491249084e-05, 1.4706514775753021e-05, 1.5605241060256958e-05, 1.6503967344760895e-05, 1.740269362926483e-05, 1.830141991376877e-05, 1.9200146198272705e-05, 2.0098872482776642e-05, 2.099759876728058e-05, 2.1896325051784515e-05, 2.2795051336288452e-05, 2.369377762079239e-05, 2.4592503905296326e-05, 2.5491230189800262e-05, 2.63899564743042e-05, 2.7288682758808136e-05, 2.8187409043312073e-05, 2.908613532781601e-05, 2.9984861612319946e-05, 3.088358789682388e-05, 3.178231418132782e-05, 3.2681040465831757e-05, 3.357976675033569e-05, 3.447849303483963e-05, 3.537721931934357e-05, 3.6275945603847504e-05, 3.717467188835144e-05, 3.807339817285538e-05, 3.8972124457359314e-05, 3.987085074186325e-05, 4.076957702636719e-05]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 17.0, 27.0, 22.0, 51.0, 66.0, 73.0, 138.0, 199.0, 315.0, 479.0, 655.0, 1088.0, 1831.0, 2943.0, 5232.0, 9257.0, 17536.0, 38452.0, 96465.0, 964037.0, 2819841.0, 144357.0, 45675.0, 20443.0, 10422.0, 5767.0, 3103.0, 2089.0, 1333.0, 815.0, 508.0, 318.0, 220.0, 166.0, 92.0, 66.0, 62.0, 32.0, 24.0, 11.0, 9.0, 7.0, 6.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.725290298461914e-05, -3.612786531448364e-05, -3.5002827644348145e-05, -3.3877789974212646e-05, -3.275275230407715e-05, -3.162771463394165e-05, -3.0502676963806152e-05, -2.9377639293670654e-05, -2.8252601623535156e-05, -2.7127563953399658e-05, -2.600252628326416e-05, -2.4877488613128662e-05, -2.3752450942993164e-05, -2.2627413272857666e-05, -2.1502375602722168e-05, -2.037733793258667e-05, -1.9252300262451172e-05, -1.8127262592315674e-05, -1.7002224922180176e-05, -1.5877187252044678e-05, -1.475214958190918e-05, -1.3627111911773682e-05, -1.2502074241638184e-05, -1.1377036571502686e-05, -1.0251998901367188e-05, -9.12696123123169e-06, -8.001923561096191e-06, -6.876885890960693e-06, -5.751848220825195e-06, -4.626810550689697e-06, -3.5017728805541992e-06, -2.376735210418701e-06, -1.2516975402832031e-06, -1.2665987014770508e-07, 9.98377799987793e-07, 2.123415470123291e-06, 3.248453140258789e-06, 4.373490810394287e-06, 5.498528480529785e-06, 6.623566150665283e-06, 7.748603820800781e-06, 8.87364149093628e-06, 9.998679161071777e-06, 1.1123716831207275e-05, 1.2248754501342773e-05, 1.3373792171478271e-05, 1.449882984161377e-05, 1.5623867511749268e-05, 1.6748905181884766e-05, 1.7873942852020264e-05, 1.8998980522155762e-05, 2.012401819229126e-05, 2.1249055862426758e-05, 2.2374093532562256e-05, 2.3499131202697754e-05, 2.4624168872833252e-05, 2.574920654296875e-05, 2.6874244213104248e-05, 2.7999281883239746e-05, 2.9124319553375244e-05, 3.0249357223510742e-05, 3.137439489364624e-05, 3.249943256378174e-05, 3.3624470233917236e-05, 3.4749507904052734e-05]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 8.0, 14.0, 9.0, 12.0, 25.0, 20.0, 30.0, 55.0, 64.0, 127.0, 290.0, 711.0, 1331.0, 710.0, 265.0, 99.0, 66.0, 35.0, 37.0, 25.0, 30.0, 14.0, 15.0, 11.0, 9.0, 3.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.814697265625e-05, -3.707129508256912e-05, -3.5995617508888245e-05, -3.491993993520737e-05, -3.384426236152649e-05, -3.276858478784561e-05, -3.1692907214164734e-05, -3.0617229640483856e-05, -2.954155206680298e-05, -2.84658744931221e-05, -2.7390196919441223e-05, -2.6314519345760345e-05, -2.5238841772079468e-05, -2.416316419839859e-05, -2.3087486624717712e-05, -2.2011809051036835e-05, -2.0936131477355957e-05, -1.986045390367508e-05, -1.87847763299942e-05, -1.7709098756313324e-05, -1.6633421182632446e-05, -1.555774360895157e-05, -1.4482066035270691e-05, -1.3406388461589813e-05, -1.2330710887908936e-05, -1.1255033314228058e-05, -1.017935574054718e-05, -9.103678166866302e-06, -8.028000593185425e-06, -6.952323019504547e-06, -5.8766454458236694e-06, -4.800967872142792e-06, -3.725290298461914e-06, -2.6496127247810364e-06, -1.5739351511001587e-06, -4.98257577419281e-07, 5.774199962615967e-07, 1.6530975699424744e-06, 2.728775143623352e-06, 3.8044527173042297e-06, 4.880130290985107e-06, 5.955807864665985e-06, 7.031485438346863e-06, 8.10716301202774e-06, 9.182840585708618e-06, 1.0258518159389496e-05, 1.1334195733070374e-05, 1.2409873306751251e-05, 1.3485550880432129e-05, 1.4561228454113007e-05, 1.5636906027793884e-05, 1.6712583601474762e-05, 1.778826117515564e-05, 1.8863938748836517e-05, 1.9939616322517395e-05, 2.1015293896198273e-05, 2.209097146987915e-05, 2.3166649043560028e-05, 2.4242326617240906e-05, 2.5318004190921783e-05, 2.639368176460266e-05, 2.746935933828354e-05, 2.8545036911964417e-05, 2.9620714485645294e-05, 3.069639205932617e-05]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 8.0, 7.0, 6.0, 13.0, 14.0, 19.0, 26.0, 46.0, 54.0, 91.0, 90.0, 135.0, 111.0, 91.0, 72.0, 65.0, 33.0, 31.0, 21.0, 8.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0002107468608301133, -0.0002054389624390751, -0.0002001310494961217, -0.00019482315110508353, -0.00018951525271404535, -0.00018420733977109194, -0.00017889944138005376, -0.00017359154298901558, -0.00016828363004606217, -0.000162975731655024, -0.00015766781871207058, -0.0001523599203210324, -0.00014705202192999423, -0.00014174410898704082, -0.00013643621059600264, -0.00013112829765304923, -0.00012582039926201105, -0.00012051249359501526, -0.00011520459520397708, -0.00010989668953698128, -0.00010458878386998549, -9.92808782029897e-05, -9.397297981195152e-05, -8.866507414495572e-05, -8.335718302987516e-05, -7.804927736287937e-05, -7.274137897184119e-05, -6.743347330484539e-05, -6.21255676378496e-05, -5.681766560883261e-05, -5.1509763579815626e-05, -4.620185791281983e-05, -4.089395224582404e-05, -3.558605021680705e-05, -3.027814454981126e-05, -2.4970242520794272e-05, -1.9662338672787882e-05, -1.4354434824781492e-05, -9.046532795764506e-06, -3.7386271287687123e-06, 1.5692749002482742e-06, 6.877178293507313e-06, 1.2185081686766353e-05, 1.749298462527804e-05, 2.280088847328443e-05, 2.810879232129082e-05, 3.341669435030781e-05, 3.87246000173036e-05, 4.403250204632059e-05, 4.9340404075337574e-05, 5.464830974233337e-05, 5.9956211771350354e-05, 6.526411743834615e-05, 7.057201582938433e-05, 7.587992149638012e-05, 8.118782716337591e-05, 8.64957255544141e-05, 9.180363122140989e-05, 9.711152961244807e-05, 0.00010241943527944386, 0.00010772734094643965, 0.00011303524661343545, 0.00011834314500447363, 0.00012365105794742703, 0.00012895895633846521]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 4.0, 5.0, 3.0, 6.0, 8.0, 11.0, 19.0, 19.0, 19.0, 24.0, 29.0, 21.0, 39.0, 28.0, 35.0, 37.0, 53.0, 33.0, 40.0, 40.0, 35.0, 40.0, 45.0, 35.0, 36.0, 29.0, 52.0, 29.0, 35.0, 25.0, 22.0, 23.0, 13.0, 18.0, 19.0, 7.0, 17.0, 9.0, 12.0, 5.0, 1.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.666515350341797e-05, -8.411798626184464e-05, -8.15708190202713e-05, -7.902365177869797e-05, -7.647648453712463e-05, -7.39293172955513e-05, -7.138215005397797e-05, -6.883498281240463e-05, -6.62878155708313e-05, -6.374064832925797e-05, -6.119348108768463e-05, -5.86463138461113e-05, -5.6099146604537964e-05, -5.355197936296463e-05, -5.1004812121391296e-05, -4.845764487981796e-05, -4.591047763824463e-05, -4.3363310396671295e-05, -4.081614315509796e-05, -3.826897591352463e-05, -3.5721808671951294e-05, -3.317464143037796e-05, -3.0627474188804626e-05, -2.8080306947231293e-05, -2.553313970565796e-05, -2.2985972464084625e-05, -2.043880522251129e-05, -1.7891637980937958e-05, -1.5344470739364624e-05, -1.279730349779129e-05, -1.0250136256217957e-05, -7.702969014644623e-06, -5.155801773071289e-06, -2.6086345314979553e-06, -6.146728992462158e-08, 2.485699951648712e-06, 5.032867193222046e-06, 7.58003443479538e-06, 1.0127201676368713e-05, 1.2674368917942047e-05, 1.5221536159515381e-05, 1.7768703401088715e-05, 2.031587064266205e-05, 2.2863037884235382e-05, 2.5410205125808716e-05, 2.795737236738205e-05, 3.0504539608955383e-05, 3.305170685052872e-05, 3.559887409210205e-05, 3.8146041333675385e-05, 4.069320857524872e-05, 4.324037581682205e-05, 4.5787543058395386e-05, 4.833471029996872e-05, 5.088187754154205e-05, 5.342904478311539e-05, 5.597621202468872e-05, 5.8523379266262054e-05, 6.107054650783539e-05, 6.361771374940872e-05, 6.616488099098206e-05, 6.871204823255539e-05, 7.125921547412872e-05, 7.380638271570206e-05, 7.635354995727539e-05]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 0.0, 3.0, 5.0, 9.0, 6.0, 6.0, 7.0, 16.0, 20.0, 25.0, 34.0, 39.0, 71.0, 124.0, 229.0, 460.0, 772.0, 1447.0, 2955.0, 6619.0, 16551.0, 47397.0, 168304.0, 578489.0, 152877.0, 44323.0, 15460.0, 6300.0, 2869.0, 1400.0, 708.0, 406.0, 235.0, 124.0, 82.0, 55.0, 34.0, 15.0, 13.0, 14.0, 8.0, 3.0, 11.0, 9.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0001347064971923828, -0.0001309085637331009, -0.00012711063027381897, -0.00012331269681453705, -0.00011951476335525513, -0.0001157168298959732, -0.00011191889643669128, -0.00010812096297740936, -0.00010432302951812744, -0.00010052509605884552, -9.67271625995636e-05, -9.292922914028168e-05, -8.913129568099976e-05, -8.533336222171783e-05, -8.153542876243591e-05, -7.773749530315399e-05, -7.393956184387207e-05, -7.014162838459015e-05, -6.634369492530823e-05, -6.25457614660263e-05, -5.8747828006744385e-05, -5.494989454746246e-05, -5.115196108818054e-05, -4.735402762889862e-05, -4.35560941696167e-05, -3.975816071033478e-05, -3.5960227251052856e-05, -3.2162293791770935e-05, -2.8364360332489014e-05, -2.4566426873207092e-05, -2.076849341392517e-05, -1.697055995464325e-05, -1.3172626495361328e-05, -9.374693036079407e-06, -5.576759576797485e-06, -1.778826117515564e-06, 2.0191073417663574e-06, 5.817040801048279e-06, 9.6149742603302e-06, 1.3412907719612122e-05, 1.7210841178894043e-05, 2.1008774638175964e-05, 2.4806708097457886e-05, 2.8604641556739807e-05, 3.240257501602173e-05, 3.620050847530365e-05, 3.999844193458557e-05, 4.379637539386749e-05, 4.7594308853149414e-05, 5.1392242312431335e-05, 5.519017577171326e-05, 5.898810923099518e-05, 6.27860426902771e-05, 6.658397614955902e-05, 7.038190960884094e-05, 7.417984306812286e-05, 7.797777652740479e-05, 8.17757099866867e-05, 8.557364344596863e-05, 8.937157690525055e-05, 9.316951036453247e-05, 9.696744382381439e-05, 0.00010076537728309631, 0.00010456331074237823, 0.00010836124420166016]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 6.0, 18.0, 34.0, 38.0, 35.0, 65.0, 59.0, 88.0, 96.0, 76.0, 94.0, 75.0, 70.0, 56.0, 43.0, 33.0, 33.0, 20.0, 7.0, 11.0, 5.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5854835510253906e-05, -1.5003606677055359e-05, -1.4152377843856812e-05, -1.3301149010658264e-05, -1.2449920177459717e-05, -1.159869134426117e-05, -1.0747462511062622e-05, -9.896233677864075e-06, -9.045004844665527e-06, -8.19377601146698e-06, -7.342547178268433e-06, -6.491318345069885e-06, -5.640089511871338e-06, -4.7888606786727905e-06, -3.937631845474243e-06, -3.086403012275696e-06, -2.2351741790771484e-06, -1.383945345878601e-06, -5.327165126800537e-07, 3.1851232051849365e-07, 1.169741153717041e-06, 2.0209699869155884e-06, 2.8721988201141357e-06, 3.723427653312683e-06, 4.5746564865112305e-06, 5.425885319709778e-06, 6.277114152908325e-06, 7.1283429861068726e-06, 7.97957181930542e-06, 8.830800652503967e-06, 9.682029485702515e-06, 1.0533258318901062e-05, 1.138448715209961e-05, 1.2235715985298157e-05, 1.3086944818496704e-05, 1.3938173651695251e-05, 1.4789402484893799e-05, 1.5640631318092346e-05, 1.6491860151290894e-05, 1.734308898448944e-05, 1.8194317817687988e-05, 1.9045546650886536e-05, 1.9896775484085083e-05, 2.074800431728363e-05, 2.1599233150482178e-05, 2.2450461983680725e-05, 2.3301690816879272e-05, 2.415291965007782e-05, 2.5004148483276367e-05, 2.5855377316474915e-05, 2.6706606149673462e-05, 2.755783498287201e-05, 2.8409063816070557e-05, 2.9260292649269104e-05, 3.011152148246765e-05, 3.09627503156662e-05, 3.1813979148864746e-05, 3.2665207982063293e-05, 3.351643681526184e-05, 3.436766564846039e-05, 3.5218894481658936e-05, 3.607012331485748e-05, 3.692135214805603e-05, 3.777258098125458e-05, 3.8623809814453125e-05]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 19.0, 18.0, 52.0, 60.0, 80.0, 115.0, 133.0, 190.0, 302.0, 366.0, 515.0, 781.0, 1042.0, 1417.0, 2104.0, 3109.0, 4511.0, 6577.0, 10154.0, 14002.0, 23705.0, 38707.0, 66717.0, 133486.0, 356899.0, 169913.0, 84596.0, 47306.0, 28374.0, 17411.0, 11629.0, 7473.0, 4850.0, 3503.0, 2512.0, 1768.0, 1145.0, 853.0, 595.0, 435.0, 326.0, 217.0, 180.0, 107.0, 80.0, 70.0, 33.0, 33.0, 22.0, 14.0, 14.0, 13.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.3484230041503906e-05, -2.2718682885169983e-05, -2.195313572883606e-05, -2.1187588572502136e-05, -2.0422041416168213e-05, -1.965649425983429e-05, -1.8890947103500366e-05, -1.8125399947166443e-05, -1.735985279083252e-05, -1.6594305634498596e-05, -1.5828758478164673e-05, -1.506321132183075e-05, -1.4297664165496826e-05, -1.3532117009162903e-05, -1.276656985282898e-05, -1.2001022696495056e-05, -1.1235475540161133e-05, -1.046992838382721e-05, -9.704381227493286e-06, -8.938834071159363e-06, -8.17328691482544e-06, -7.407739758491516e-06, -6.642192602157593e-06, -5.8766454458236694e-06, -5.111098289489746e-06, -4.345551133155823e-06, -3.5800039768218994e-06, -2.814456820487976e-06, -2.0489096641540527e-06, -1.2833625078201294e-06, -5.178153514862061e-07, 2.477318048477173e-07, 1.0132789611816406e-06, 1.778826117515564e-06, 2.5443732738494873e-06, 3.3099204301834106e-06, 4.075467586517334e-06, 4.841014742851257e-06, 5.606561899185181e-06, 6.372109055519104e-06, 7.137656211853027e-06, 7.90320336818695e-06, 8.668750524520874e-06, 9.434297680854797e-06, 1.019984483718872e-05, 1.0965391993522644e-05, 1.1730939149856567e-05, 1.249648630619049e-05, 1.3262033462524414e-05, 1.4027580618858337e-05, 1.479312777519226e-05, 1.5558674931526184e-05, 1.6324222087860107e-05, 1.708976924419403e-05, 1.7855316400527954e-05, 1.8620863556861877e-05, 1.93864107131958e-05, 2.0151957869529724e-05, 2.0917505025863647e-05, 2.168305218219757e-05, 2.2448599338531494e-05, 2.3214146494865417e-05, 2.397969365119934e-05, 2.4745240807533264e-05, 2.5510787963867188e-05]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 5.0, 9.0, 6.0, 8.0, 9.0, 12.0, 13.0, 12.0, 20.0, 34.0, 16.0, 34.0, 29.0, 37.0, 32.0, 45.0, 27.0, 45.0, 43.0, 43.0, 47.0, 41.0, 40.0, 33.0, 36.0, 46.0, 31.0, 31.0, 31.0, 27.0, 19.0, 21.0, 23.0, 15.0, 13.0, 18.0, 13.0, 5.0, 9.0, 7.0, 2.0, 2.0, 5.0, 0.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2782554626464844e-05, -3.1735748052597046e-05, -3.068894147872925e-05, -2.964213490486145e-05, -2.8595328330993652e-05, -2.7548521757125854e-05, -2.6501715183258057e-05, -2.545490860939026e-05, -2.440810203552246e-05, -2.3361295461654663e-05, -2.2314488887786865e-05, -2.1267682313919067e-05, -2.022087574005127e-05, -1.917406916618347e-05, -1.8127262592315674e-05, -1.7080456018447876e-05, -1.6033649444580078e-05, -1.498684287071228e-05, -1.3940036296844482e-05, -1.2893229722976685e-05, -1.1846423149108887e-05, -1.0799616575241089e-05, -9.752810001373291e-06, -8.706003427505493e-06, -7.659196853637695e-06, -6.6123902797698975e-06, -5.5655837059021e-06, -4.518777132034302e-06, -3.471970558166504e-06, -2.425163984298706e-06, -1.3783574104309082e-06, -3.3155083656311035e-07, 7.152557373046875e-07, 1.7620623111724854e-06, 2.808868885040283e-06, 3.855675458908081e-06, 4.902482032775879e-06, 5.949288606643677e-06, 6.996095180511475e-06, 8.042901754379272e-06, 9.08970832824707e-06, 1.0136514902114868e-05, 1.1183321475982666e-05, 1.2230128049850464e-05, 1.3276934623718262e-05, 1.432374119758606e-05, 1.5370547771453857e-05, 1.6417354345321655e-05, 1.7464160919189453e-05, 1.851096749305725e-05, 1.955777406692505e-05, 2.0604580640792847e-05, 2.1651387214660645e-05, 2.2698193788528442e-05, 2.374500036239624e-05, 2.4791806936264038e-05, 2.5838613510131836e-05, 2.6885420083999634e-05, 2.793222665786743e-05, 2.897903323173523e-05, 3.0025839805603027e-05, 3.1072646379470825e-05, 3.211945295333862e-05, 3.316625952720642e-05, 3.421306610107422e-05]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 4.0, 13.0, 15.0, 11.0, 26.0, 39.0, 47.0, 78.0, 106.0, 205.0, 234.0, 372.0, 708.0, 1001.0, 2216.0, 3465.0, 6779.0, 21672.0, 65710.0, 688137.0, 192442.0, 42207.0, 11136.0, 5052.0, 3113.0, 1321.0, 952.0, 479.0, 302.0, 254.0, 134.0, 103.0, 48.0, 51.0, 36.0, 28.0, 14.0, 5.0, 11.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.1205673217773438e-05, -1.0883435606956482e-05, -1.0561197996139526e-05, -1.023896038532257e-05, -9.916722774505615e-06, -9.59448516368866e-06, -9.272247552871704e-06, -8.950009942054749e-06, -8.627772331237793e-06, -8.305534720420837e-06, -7.983297109603882e-06, -7.661059498786926e-06, -7.338821887969971e-06, -7.016584277153015e-06, -6.6943466663360596e-06, -6.372109055519104e-06, -6.0498714447021484e-06, -5.727633833885193e-06, -5.405396223068237e-06, -5.083158612251282e-06, -4.760921001434326e-06, -4.438683390617371e-06, -4.116445779800415e-06, -3.7942081689834595e-06, -3.471970558166504e-06, -3.1497329473495483e-06, -2.8274953365325928e-06, -2.505257725715637e-06, -2.1830201148986816e-06, -1.860782504081726e-06, -1.5385448932647705e-06, -1.216307282447815e-06, -8.940696716308594e-07, -5.718320608139038e-07, -2.4959444999694824e-07, 7.264316082000732e-08, 3.948807716369629e-07, 7.171183824539185e-07, 1.039355993270874e-06, 1.3615936040878296e-06, 1.6838312149047852e-06, 2.0060688257217407e-06, 2.3283064365386963e-06, 2.650544047355652e-06, 2.9727816581726074e-06, 3.295019268989563e-06, 3.6172568798065186e-06, 3.939494490623474e-06, 4.26173210144043e-06, 4.583969712257385e-06, 4.906207323074341e-06, 5.228444933891296e-06, 5.550682544708252e-06, 5.8729201555252075e-06, 6.195157766342163e-06, 6.517395377159119e-06, 6.839632987976074e-06, 7.16187059879303e-06, 7.484108209609985e-06, 7.806345820426941e-06, 8.128583431243896e-06, 8.450821042060852e-06, 8.773058652877808e-06, 9.095296263694763e-06, 9.417533874511719e-06]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 8.0, 1.0, 0.0, 8.0, 7.0, 15.0, 0.0, 15.0, 11.0, 0.0, 29.0, 33.0, 60.0, 0.0, 54.0, 57.0, 79.0, 0.0, 98.0, 71.0, 99.0, 0.0, 75.0, 60.0, 0.0, 51.0, 33.0, 35.0, 0.0, 32.0, 20.0, 19.0, 0.0, 14.0, 9.0, 5.0, 0.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2079253792762756e-06, -1.1641532182693481e-06, -1.1203810572624207e-06, -1.0766088962554932e-06, -1.0328367352485657e-06, -9.890645742416382e-07, -9.452924132347107e-07, -9.015202522277832e-07, -8.577480912208557e-07, -8.139759302139282e-07, -7.702037692070007e-07, -7.264316082000732e-07, -6.826594471931458e-07, -6.388872861862183e-07, -5.951151251792908e-07, -5.513429641723633e-07, -5.075708031654358e-07, -4.637986421585083e-07, -4.200264811515808e-07, -3.762543201446533e-07, -3.3248215913772583e-07, -2.8870999813079834e-07, -2.4493783712387085e-07, -2.0116567611694336e-07, -1.5739351511001587e-07, -1.1362135410308838e-07, -6.984919309616089e-08, -2.60770320892334e-08, 1.7695128917694092e-08, 6.146728992462158e-08, 1.0523945093154907e-07, 1.4901161193847656e-07, 1.9278377294540405e-07, 2.3655593395233154e-07, 2.8032809495925903e-07, 3.241002559661865e-07, 3.67872416973114e-07, 4.116445779800415e-07, 4.55416738986969e-07, 4.991888999938965e-07, 5.42961061000824e-07, 5.867332220077515e-07, 6.30505383014679e-07, 6.742775440216064e-07, 7.180497050285339e-07, 7.618218660354614e-07, 8.055940270423889e-07, 8.493661880493164e-07, 8.931383490562439e-07, 9.369105100631714e-07, 9.806826710700989e-07, 1.0244548320770264e-06, 1.0682269930839539e-06, 1.1119991540908813e-06, 1.1557713150978088e-06, 1.1995434761047363e-06, 1.2433156371116638e-06, 1.2870877981185913e-06, 1.3308599591255188e-06, 1.3746321201324463e-06, 1.4184042811393738e-06, 1.4621764421463013e-06, 1.5059486031532288e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 9.0, 10.0, 14.0, 18.0, 29.0, 33.0, 35.0, 70.0, 92.0, 135.0, 169.0, 271.0, 388.0, 269.0, 713.0, 1078.0, 1683.0, 2740.0, 4858.0, 8725.0, 17376.0, 40214.0, 118012.0, 491184.0, 240397.0, 65760.0, 25870.0, 12089.0, 6292.0, 3793.0, 2180.0, 1342.0, 889.0, 565.0, 214.0, 304.0, 214.0, 159.0, 106.0, 73.0, 61.0, 34.0, 28.0, 20.0, 11.0, 10.0, 5.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.6954879760742188e-06, -3.579072654247284e-06, -3.462657332420349e-06, -3.3462420105934143e-06, -3.2298266887664795e-06, -3.1134113669395447e-06, -2.99699604511261e-06, -2.880580723285675e-06, -2.7641654014587402e-06, -2.6477500796318054e-06, -2.5313347578048706e-06, -2.414919435977936e-06, -2.298504114151001e-06, -2.182088792324066e-06, -2.0656734704971313e-06, -1.9492581486701965e-06, -1.8328428268432617e-06, -1.716427505016327e-06, -1.600012183189392e-06, -1.4835968613624573e-06, -1.3671815395355225e-06, -1.2507662177085876e-06, -1.1343508958816528e-06, -1.017935574054718e-06, -9.015202522277832e-07, -7.851049304008484e-07, -6.686896085739136e-07, -5.522742867469788e-07, -4.3585896492004395e-07, -3.1944364309310913e-07, -2.0302832126617432e-07, -8.66129994392395e-08, 2.9802322387695312e-08, 1.4621764421463013e-07, 2.6263296604156494e-07, 3.7904828786849976e-07, 4.954636096954346e-07, 6.118789315223694e-07, 7.282942533493042e-07, 8.44709575176239e-07, 9.611248970031738e-07, 1.0775402188301086e-06, 1.1939555406570435e-06, 1.3103708624839783e-06, 1.426786184310913e-06, 1.543201506137848e-06, 1.6596168279647827e-06, 1.7760321497917175e-06, 1.8924474716186523e-06, 2.008862793445587e-06, 2.125278115272522e-06, 2.2416934370994568e-06, 2.3581087589263916e-06, 2.4745240807533264e-06, 2.5909394025802612e-06, 2.707354724407196e-06, 2.823770046234131e-06, 2.9401853680610657e-06, 3.0566006898880005e-06, 3.1730160117149353e-06, 3.28943133354187e-06, 3.405846655368805e-06, 3.5222619771957397e-06, 3.6386772990226746e-06, 3.7550926208496094e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 10.0, 14.0, 16.0, 10.0, 10.0, 17.0, 36.0, 41.0, 59.0, 60.0, 66.0, 131.0, 92.0, 95.0, 59.0, 52.0, 46.0, 53.0, 29.0, 17.0, 13.0, 17.0, 13.0, 6.0, 9.0, 4.0, 6.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-06, -3.4458935260772705e-06, -3.3155083656311035e-06, -3.1851232051849365e-06, -3.0547380447387695e-06, -2.9243528842926025e-06, -2.7939677238464355e-06, -2.6635825634002686e-06, -2.5331974029541016e-06, -2.4028122425079346e-06, -2.2724270820617676e-06, -2.1420419216156006e-06, -2.0116567611694336e-06, -1.8812716007232666e-06, -1.7508864402770996e-06, -1.6205012798309326e-06, -1.4901161193847656e-06, -1.3597309589385986e-06, -1.2293457984924316e-06, -1.0989606380462646e-06, -9.685754776000977e-07, -8.381903171539307e-07, -7.078051567077637e-07, -5.774199962615967e-07, -4.470348358154297e-07, -3.166496753692627e-07, -1.862645149230957e-07, -5.587935447692871e-08, 7.450580596923828e-08, 2.0489096641540527e-07, 3.3527612686157227e-07, 4.6566128730773926e-07, 5.960464477539062e-07, 7.264316082000732e-07, 8.568167686462402e-07, 9.872019290924072e-07, 1.1175870895385742e-06, 1.2479722499847412e-06, 1.3783574104309082e-06, 1.5087425708770752e-06, 1.6391277313232422e-06, 1.7695128917694092e-06, 1.8998980522155762e-06, 2.030283212661743e-06, 2.16066837310791e-06, 2.291053533554077e-06, 2.421438694000244e-06, 2.551823854446411e-06, 2.682209014892578e-06, 2.812594175338745e-06, 2.942979335784912e-06, 3.073364496231079e-06, 3.203749656677246e-06, 3.334134817123413e-06, 3.46451997756958e-06, 3.594905138015747e-06, 3.725290298461914e-06, 3.855675458908081e-06, 3.986060619354248e-06, 4.116445779800415e-06, 4.246830940246582e-06, 4.377216100692749e-06, 4.507601261138916e-06, 4.637986421585083e-06, 4.76837158203125e-06]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 14.0, 17.0, 19.0, 19.0, 23.0, 38.0, 43.0, 68.0, 96.0, 109.0, 113.0, 108.0, 89.0, 40.0, 33.0, 38.0, 24.0, 19.0, 14.0, 15.0, 5.0, 10.0, 4.0, 7.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012536378926597536, -0.00012168462853878736, -0.00011800546053564176, -0.00011432629980845377, -0.00011064713180530816, -0.00010696797107812017, -0.00010328881035093218, -9.960964234778658e-05, -9.593047434464097e-05, -9.225131361745298e-05, -8.857214561430737e-05, -8.489298488711938e-05, -8.121381688397378e-05, -7.753465615678579e-05, -7.38554954295978e-05, -7.017632742645219e-05, -6.64971666992642e-05, -6.281800597207621e-05, -5.91388379689306e-05, -5.545967724174261e-05, -5.1780509238597006e-05, -4.8101348511409014e-05, -4.4422184146242216e-05, -4.074301978107542e-05, -3.706385541590862e-05, -3.338469105074182e-05, -2.9705526685575023e-05, -2.602636413939763e-05, -2.234719977423083e-05, -1.8668035409064032e-05, -1.4988872862886637e-05, -1.130970849771984e-05, -7.630536856595427e-06, -3.9513729461759795e-06, -2.722090357565321e-07, 3.4069544199155644e-06, 7.086118785082363e-06, 1.076528315024916e-05, 1.4444445696426556e-05, 1.8123610061593354e-05, 2.1802774426760152e-05, 2.548193879192695e-05, 2.916110315709375e-05, 3.284026752226055e-05, 3.651942824944854e-05, 4.019859625259414e-05, 4.3877756979782134e-05, 4.755692134494893e-05, 5.123608571011573e-05, 5.491525007528253e-05, 5.859441444044933e-05, 6.227357516763732e-05, 6.595274317078292e-05, 6.963190389797091e-05, 7.33110646251589e-05, 7.699023262830451e-05, 8.066940063145012e-05, 8.434856135863811e-05, 8.802772936178371e-05, 9.17068900889717e-05, 9.538605809211731e-05, 9.90652188193053e-05, 0.00010274437954649329, 0.0001064235475496389, 0.00011010270827682689]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 7.0, 4.0, 8.0, 7.0, 8.0, 25.0, 8.0, 15.0, 16.0, 13.0, 22.0, 15.0, 33.0, 22.0, 29.0, 28.0, 34.0, 31.0, 40.0, 42.0, 36.0, 44.0, 44.0, 35.0, 41.0, 28.0, 41.0, 37.0, 34.0, 32.0, 22.0, 25.0, 31.0, 23.0, 13.0, 16.0, 18.0, 11.0, 8.0, 12.0, 9.0, 6.0, 5.0, 6.0, 0.0, 4.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.783008575439453e-05, -6.553158164024353e-05, -6.323307752609253e-05, -6.093457341194153e-05, -5.863606929779053e-05, -5.6337565183639526e-05, -5.4039061069488525e-05, -5.1740556955337524e-05, -4.9442052841186523e-05, -4.714354872703552e-05, -4.484504461288452e-05, -4.254654049873352e-05, -4.024803638458252e-05, -3.794953227043152e-05, -3.565102815628052e-05, -3.3352524042129517e-05, -3.1054019927978516e-05, -2.8755515813827515e-05, -2.6457011699676514e-05, -2.4158507585525513e-05, -2.1860003471374512e-05, -1.956149935722351e-05, -1.726299524307251e-05, -1.4964491128921509e-05, -1.2665987014770508e-05, -1.0367482900619507e-05, -8.068978786468506e-06, -5.770474672317505e-06, -3.471970558166504e-06, -1.173466444015503e-06, 1.125037670135498e-06, 3.423541784286499e-06, 5.7220458984375e-06, 8.020550012588501e-06, 1.0319054126739502e-05, 1.2617558240890503e-05, 1.4916062355041504e-05, 1.7214566469192505e-05, 1.9513070583343506e-05, 2.1811574697494507e-05, 2.4110078811645508e-05, 2.640858292579651e-05, 2.870708703994751e-05, 3.100559115409851e-05, 3.330409526824951e-05, 3.560259938240051e-05, 3.7901103496551514e-05, 4.0199607610702515e-05, 4.2498111724853516e-05, 4.4796615839004517e-05, 4.709511995315552e-05, 4.939362406730652e-05, 5.169212818145752e-05, 5.399063229560852e-05, 5.628913640975952e-05, 5.858764052391052e-05, 6.0886144638061523e-05, 6.318464875221252e-05, 6.548315286636353e-05, 6.778165698051453e-05, 7.008016109466553e-05, 7.237866520881653e-05, 7.467716932296753e-05, 7.697567343711853e-05, 7.927417755126953e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 16.0, 29.0, 54.0, 66.0, 105.0, 193.0, 314.0, 641.0, 1088.0, 2482.0, 6065.0, 16729.0, 110747.0, 3676079.0, 348145.0, 19332.0, 6350.0, 2863.0, 1320.0, 694.0, 334.0, 194.0, 142.0, 87.0, 63.0, 26.0, 29.0, 14.0, 11.0, 9.0, 8.0, 4.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.227327346801758e-05, -4.9962662160396576e-05, -4.7652050852775574e-05, -4.534143954515457e-05, -4.303082823753357e-05, -4.072021692991257e-05, -3.8409605622291565e-05, -3.609899431467056e-05, -3.378838300704956e-05, -3.147777169942856e-05, -2.9167160391807556e-05, -2.6856549084186554e-05, -2.4545937776565552e-05, -2.223532646894455e-05, -1.9924715161323547e-05, -1.7614103853702545e-05, -1.5303492546081543e-05, -1.299288123846054e-05, -1.0682269930839539e-05, -8.371658623218536e-06, -6.061047315597534e-06, -3.750436007976532e-06, -1.4398247003555298e-06, 8.707866072654724e-07, 3.1813979148864746e-06, 5.492009222507477e-06, 7.802620530128479e-06, 1.0113231837749481e-05, 1.2423843145370483e-05, 1.4734454452991486e-05, 1.7045065760612488e-05, 1.935567706823349e-05, 2.1666288375854492e-05, 2.3976899683475494e-05, 2.6287510991096497e-05, 2.85981222987175e-05, 3.09087336063385e-05, 3.32193449139595e-05, 3.5529956221580505e-05, 3.784056752920151e-05, 4.015117883682251e-05, 4.246179014444351e-05, 4.4772401452064514e-05, 4.7083012759685516e-05, 4.939362406730652e-05, 5.170423537492752e-05, 5.401484668254852e-05, 5.6325457990169525e-05, 5.863606929779053e-05, 6.094668060541153e-05, 6.325729191303253e-05, 6.556790322065353e-05, 6.787851452827454e-05, 7.018912583589554e-05, 7.249973714351654e-05, 7.481034845113754e-05, 7.712095975875854e-05, 7.943157106637955e-05, 8.174218237400055e-05, 8.405279368162155e-05, 8.636340498924255e-05, 8.867401629686356e-05, 9.098462760448456e-05, 9.329523891210556e-05, 9.560585021972656e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 9.0, 7.0, 6.0, 11.0, 15.0, 25.0, 38.0, 42.0, 50.0, 82.0, 95.0, 115.0, 91.0, 96.0, 86.0, 55.0, 58.0, 37.0, 25.0, 21.0, 12.0, 8.0, 7.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014636993408203e-05, -1.9237399101257324e-05, -1.8328428268432617e-05, -1.741945743560791e-05, -1.6510486602783203e-05, -1.5601515769958496e-05, -1.4692544937133789e-05, -1.3783574104309082e-05, -1.2874603271484375e-05, -1.1965632438659668e-05, -1.1056661605834961e-05, -1.0147690773010254e-05, -9.238719940185547e-06, -8.32974910736084e-06, -7.420778274536133e-06, -6.511807441711426e-06, -5.602836608886719e-06, -4.693865776062012e-06, -3.7848949432373047e-06, -2.8759241104125977e-06, -1.9669532775878906e-06, -1.0579824447631836e-06, -1.4901161193847656e-07, 7.599592208862305e-07, 1.6689300537109375e-06, 2.5779008865356445e-06, 3.4868717193603516e-06, 4.395842552185059e-06, 5.304813385009766e-06, 6.213784217834473e-06, 7.12275505065918e-06, 8.031725883483887e-06, 8.940696716308594e-06, 9.8496675491333e-06, 1.0758638381958008e-05, 1.1667609214782715e-05, 1.2576580047607422e-05, 1.3485550880432129e-05, 1.4394521713256836e-05, 1.5303492546081543e-05, 1.621246337890625e-05, 1.7121434211730957e-05, 1.8030405044555664e-05, 1.893937587738037e-05, 1.9848346710205078e-05, 2.0757317543029785e-05, 2.1666288375854492e-05, 2.25752592086792e-05, 2.3484230041503906e-05, 2.4393200874328613e-05, 2.530217170715332e-05, 2.6211142539978027e-05, 2.7120113372802734e-05, 2.802908420562744e-05, 2.893805503845215e-05, 2.9847025871276855e-05, 3.075599670410156e-05, 3.166496753692627e-05, 3.2573938369750977e-05, 3.3482909202575684e-05, 3.439188003540039e-05, 3.53008508682251e-05, 3.6209821701049805e-05, 3.711879253387451e-05, 3.802776336669922e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 2.0, 13.0, 17.0, 16.0, 22.0, 35.0, 57.0, 74.0, 116.0, 159.0, 255.0, 416.0, 708.0, 1067.0, 1896.0, 3461.0, 6937.0, 14360.0, 35279.0, 104453.0, 1599860.0, 2242328.0, 118197.0, 34856.0, 14406.0, 6807.0, 3496.0, 1994.0, 1137.0, 670.0, 427.0, 246.0, 165.0, 108.0, 75.0, 50.0, 40.0, 31.0, 12.0, 11.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.135204315185547e-05, -3.040209412574768e-05, -2.9452145099639893e-05, -2.8502196073532104e-05, -2.7552247047424316e-05, -2.660229802131653e-05, -2.565234899520874e-05, -2.4702399969100952e-05, -2.3752450942993164e-05, -2.2802501916885376e-05, -2.1852552890777588e-05, -2.09026038646698e-05, -1.9952654838562012e-05, -1.9002705812454224e-05, -1.8052756786346436e-05, -1.7102807760238647e-05, -1.615285873413086e-05, -1.5202909708023071e-05, -1.4252960681915283e-05, -1.3303011655807495e-05, -1.2353062629699707e-05, -1.1403113603591919e-05, -1.0453164577484131e-05, -9.503215551376343e-06, -8.553266525268555e-06, -7.603317499160767e-06, -6.6533684730529785e-06, -5.7034194469451904e-06, -4.753470420837402e-06, -3.8035213947296143e-06, -2.853572368621826e-06, -1.903623342514038e-06, -9.5367431640625e-07, -3.725290298461914e-09, 9.462237358093262e-07, 1.8961727619171143e-06, 2.8461217880249023e-06, 3.7960708141326904e-06, 4.7460198402404785e-06, 5.695968866348267e-06, 6.645917892456055e-06, 7.595866918563843e-06, 8.545815944671631e-06, 9.495764970779419e-06, 1.0445713996887207e-05, 1.1395663022994995e-05, 1.2345612049102783e-05, 1.3295561075210571e-05, 1.424551010131836e-05, 1.5195459127426147e-05, 1.6145408153533936e-05, 1.7095357179641724e-05, 1.8045306205749512e-05, 1.89952552318573e-05, 1.9945204257965088e-05, 2.0895153284072876e-05, 2.1845102310180664e-05, 2.2795051336288452e-05, 2.374500036239624e-05, 2.469494938850403e-05, 2.5644898414611816e-05, 2.6594847440719604e-05, 2.7544796466827393e-05, 2.849474549293518e-05, 2.944469451904297e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 5.0, 5.0, 15.0, 14.0, 12.0, 25.0, 24.0, 27.0, 28.0, 40.0, 52.0, 78.0, 101.0, 226.0, 433.0, 878.0, 797.0, 555.0, 272.0, 137.0, 73.0, 50.0, 38.0, 38.0, 31.0, 21.0, 14.0, 16.0, 9.0, 8.0, 9.0, 7.0, 5.0, 2.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8252601623535156e-05, -2.7342699468135834e-05, -2.643279731273651e-05, -2.552289515733719e-05, -2.4612993001937866e-05, -2.3703090846538544e-05, -2.279318869113922e-05, -2.18832865357399e-05, -2.0973384380340576e-05, -2.0063482224941254e-05, -1.915358006954193e-05, -1.824367791414261e-05, -1.7333775758743286e-05, -1.6423873603343964e-05, -1.551397144794464e-05, -1.4604069292545319e-05, -1.3694167137145996e-05, -1.2784264981746674e-05, -1.1874362826347351e-05, -1.0964460670948029e-05, -1.0054558515548706e-05, -9.144656360149384e-06, -8.234754204750061e-06, -7.3248520493507385e-06, -6.414949893951416e-06, -5.5050477385520935e-06, -4.595145583152771e-06, -3.6852434277534485e-06, -2.775341272354126e-06, -1.8654391169548035e-06, -9.55536961555481e-07, -4.563480615615845e-08, 8.642673492431641e-07, 1.7741695046424866e-06, 2.684071660041809e-06, 3.5939738154411316e-06, 4.503875970840454e-06, 5.413778126239777e-06, 6.323680281639099e-06, 7.233582437038422e-06, 8.143484592437744e-06, 9.053386747837067e-06, 9.96328890323639e-06, 1.0873191058635712e-05, 1.1783093214035034e-05, 1.2692995369434357e-05, 1.360289752483368e-05, 1.4512799680233002e-05, 1.5422701835632324e-05, 1.6332603991031647e-05, 1.724250614643097e-05, 1.8152408301830292e-05, 1.9062310457229614e-05, 1.9972212612628937e-05, 2.088211476802826e-05, 2.1792016923427582e-05, 2.2701919078826904e-05, 2.3611821234226227e-05, 2.452172338962555e-05, 2.5431625545024872e-05, 2.6341527700424194e-05, 2.7251429855823517e-05, 2.816133201122284e-05, 2.9071234166622162e-05, 2.9981136322021484e-05]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 3.0, 7.0, 1.0, 5.0, 11.0, 10.0, 12.0, 11.0, 11.0, 19.0, 23.0, 36.0, 49.0, 72.0, 72.0, 103.0, 104.0, 101.0, 75.0, 61.0, 36.0, 38.0, 33.0, 20.0, 13.0, 7.0, 9.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.00016361937741748989, -0.00015875956160016358, -0.00015389974578283727, -0.0001490399445174262, -0.00014418012870009989, -0.00013932031288277358, -0.00013446049706544727, -0.00012960068124812096, -0.00012474087998270988, -0.00011988106416538358, -0.00011502125562401488, -0.00011016143980668858, -0.00010530163126531988, -0.00010044181544799358, -9.558199963066727e-05, -9.072218381334096e-05, -8.586236799601465e-05, -8.100255217868835e-05, -7.614274363731965e-05, -7.128292781999335e-05, -6.642311927862465e-05, -6.156330346129835e-05, -5.670348764397204e-05, -5.184367546462454e-05, -4.698386328527704e-05, -4.212405110592954e-05, -3.726423892658204e-05, -3.240442310925573e-05, -2.754461092990823e-05, -2.268479875056073e-05, -1.7824984752223827e-05, -1.2965170753886923e-05, -8.105358574539423e-06, -3.245545485697221e-06, 1.614267603144981e-06, 6.474080691987183e-06, 1.1333893780829385e-05, 1.6193705960176885e-05, 2.105351995851379e-05, 2.5913333956850693e-05, 3.077314613619819e-05, 3.563295831554569e-05, 4.049277049489319e-05, 4.53525863122195e-05, 5.0212398491567e-05, 5.50722106709145e-05, 5.993202648824081e-05, 6.47918350296095e-05, 6.965165084693581e-05, 7.451146666426212e-05, 7.937127520563081e-05, 8.423109102295712e-05, 8.909089956432581e-05, 9.395071538165212e-05, 9.881053119897842e-05, 0.00010367034701630473, 0.00010853015555767342, 0.00011338997137499973, 0.00011824977991636842, 0.00012310959573369473, 0.00012796941155102104, 0.00013282921281643212, 0.00013768902863375843, 0.00014254884445108473, 0.00014740866026841104]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 7.0, 6.0, 8.0, 8.0, 7.0, 9.0, 11.0, 16.0, 23.0, 17.0, 21.0, 27.0, 36.0, 38.0, 30.0, 36.0, 29.0, 46.0, 44.0, 44.0, 52.0, 52.0, 39.0, 42.0, 40.0, 45.0, 37.0, 25.0, 21.0, 39.0, 26.0, 23.0, 18.0, 16.0, 10.0, 14.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010484457015991211, -0.00010188110172748566, -9.89176332950592e-05, -9.595416486263275e-05, -9.29906964302063e-05, -9.002722799777985e-05, -8.70637595653534e-05, -8.410029113292694e-05, -8.113682270050049e-05, -7.817335426807404e-05, -7.520988583564758e-05, -7.224641740322113e-05, -6.928294897079468e-05, -6.631948053836823e-05, -6.335601210594177e-05, -6.039254367351532e-05, -5.742907524108887e-05, -5.4465606808662415e-05, -5.150213837623596e-05, -4.853866994380951e-05, -4.557520151138306e-05, -4.2611733078956604e-05, -3.964826464653015e-05, -3.66847962141037e-05, -3.3721327781677246e-05, -3.0757859349250793e-05, -2.779439091682434e-05, -2.4830922484397888e-05, -2.1867454051971436e-05, -1.8903985619544983e-05, -1.594051718711853e-05, -1.2977048754692078e-05, -1.0013580322265625e-05, -7.050111889839172e-06, -4.08664345741272e-06, -1.123175024986267e-06, 1.8402934074401855e-06, 4.803761839866638e-06, 7.76723027229309e-06, 1.0730698704719543e-05, 1.3694167137145996e-05, 1.665763556957245e-05, 1.96211040019989e-05, 2.2584572434425354e-05, 2.5548040866851807e-05, 2.851150929927826e-05, 3.147497773170471e-05, 3.4438446164131165e-05, 3.740191459655762e-05, 4.036538302898407e-05, 4.332885146141052e-05, 4.6292319893836975e-05, 4.925578832626343e-05, 5.221925675868988e-05, 5.518272519111633e-05, 5.8146193623542786e-05, 6.110966205596924e-05, 6.407313048839569e-05, 6.703659892082214e-05, 7.00000673532486e-05, 7.296353578567505e-05, 7.59270042181015e-05, 7.889047265052795e-05, 8.18539410829544e-05, 8.481740951538086e-05]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 8.0, 15.0, 16.0, 33.0, 37.0, 48.0, 85.0, 140.0, 257.0, 467.0, 960.0, 1990.0, 4197.0, 10204.0, 27718.0, 93396.0, 563628.0, 259962.0, 54179.0, 17941.0, 7141.0, 3057.0, 1449.0, 723.0, 368.0, 199.0, 113.0, 75.0, 48.0, 28.0, 20.0, 14.0, 8.0, 12.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001062154769897461, -0.00010287482291460037, -9.953416883945465e-05, -9.619351476430893e-05, -9.285286068916321e-05, -8.951220661401749e-05, -8.617155253887177e-05, -8.283089846372604e-05, -7.949024438858032e-05, -7.61495903134346e-05, -7.280893623828888e-05, -6.946828216314316e-05, -6.612762808799744e-05, -6.278697401285172e-05, -5.9446319937705994e-05, -5.610566586256027e-05, -5.276501178741455e-05, -4.942435771226883e-05, -4.608370363712311e-05, -4.2743049561977386e-05, -3.9402395486831665e-05, -3.6061741411685944e-05, -3.272108733654022e-05, -2.93804332613945e-05, -2.603977918624878e-05, -2.2699125111103058e-05, -1.9358471035957336e-05, -1.6017816960811615e-05, -1.2677162885665894e-05, -9.336508810520172e-06, -5.995854735374451e-06, -2.6552006602287292e-06, 6.854534149169922e-07, 4.026107490062714e-06, 7.366761565208435e-06, 1.0707415640354156e-05, 1.4048069715499878e-05, 1.73887237906456e-05, 2.072937786579132e-05, 2.4070031940937042e-05, 2.7410686016082764e-05, 3.0751340091228485e-05, 3.4091994166374207e-05, 3.743264824151993e-05, 4.077330231666565e-05, 4.411395639181137e-05, 4.745461046695709e-05, 5.0795264542102814e-05, 5.4135918617248535e-05, 5.7476572692394257e-05, 6.081722676753998e-05, 6.41578808426857e-05, 6.749853491783142e-05, 7.083918899297714e-05, 7.417984306812286e-05, 7.752049714326859e-05, 8.08611512184143e-05, 8.420180529356003e-05, 8.754245936870575e-05, 9.088311344385147e-05, 9.422376751899719e-05, 9.756442159414291e-05, 0.00010090507566928864, 0.00010424572974443436, 0.00010758638381958008]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 8.0, 15.0, 16.0, 23.0, 34.0, 49.0, 62.0, 57.0, 77.0, 73.0, 82.0, 93.0, 84.0, 73.0, 54.0, 45.0, 37.0, 33.0, 18.0, 18.0, 9.0, 4.0, 8.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8835067749023438e-05, -1.8003396689891815e-05, -1.7171725630760193e-05, -1.634005457162857e-05, -1.5508383512496948e-05, -1.4676712453365326e-05, -1.3845041394233704e-05, -1.3013370335102081e-05, -1.2181699275970459e-05, -1.1350028216838837e-05, -1.0518357157707214e-05, -9.686686098575592e-06, -8.85501503944397e-06, -8.023343980312347e-06, -7.191672921180725e-06, -6.360001862049103e-06, -5.5283308029174805e-06, -4.696659743785858e-06, -3.864988684654236e-06, -3.0333176255226135e-06, -2.201646566390991e-06, -1.369975507259369e-06, -5.383044481277466e-07, 2.9336661100387573e-07, 1.125037670135498e-06, 1.9567087292671204e-06, 2.7883797883987427e-06, 3.620050847530365e-06, 4.451721906661987e-06, 5.28339296579361e-06, 6.115064024925232e-06, 6.946735084056854e-06, 7.778406143188477e-06, 8.610077202320099e-06, 9.441748261451721e-06, 1.0273419320583344e-05, 1.1105090379714966e-05, 1.1936761438846588e-05, 1.276843249797821e-05, 1.3600103557109833e-05, 1.4431774616241455e-05, 1.5263445675373077e-05, 1.60951167345047e-05, 1.6926787793636322e-05, 1.7758458852767944e-05, 1.8590129911899567e-05, 1.942180097103119e-05, 2.025347203016281e-05, 2.1085143089294434e-05, 2.1916814148426056e-05, 2.2748485207557678e-05, 2.35801562666893e-05, 2.4411827325820923e-05, 2.5243498384952545e-05, 2.6075169444084167e-05, 2.690684050321579e-05, 2.7738511562347412e-05, 2.8570182621479034e-05, 2.9401853680610657e-05, 3.023352473974228e-05, 3.10651957988739e-05, 3.1896866858005524e-05, 3.2728537917137146e-05, 3.356020897626877e-05, 3.439188003540039e-05]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 5.0, 2.0, 2.0, 7.0, 6.0, 10.0, 13.0, 14.0, 26.0, 30.0, 45.0, 53.0, 70.0, 124.0, 163.0, 268.0, 379.0, 620.0, 876.0, 1581.0, 2638.0, 5055.0, 9727.0, 24990.0, 73334.0, 497639.0, 326450.0, 64405.0, 20275.0, 9230.0, 4361.0, 2271.0, 1330.0, 833.0, 517.0, 318.0, 280.0, 165.0, 138.0, 77.0, 58.0, 57.0, 39.0, 26.0, 18.0, 9.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.849102020263672e-05, -2.7505680918693542e-05, -2.6520341634750366e-05, -2.553500235080719e-05, -2.4549663066864014e-05, -2.3564323782920837e-05, -2.257898449897766e-05, -2.1593645215034485e-05, -2.060830593109131e-05, -1.9622966647148132e-05, -1.8637627363204956e-05, -1.765228807926178e-05, -1.6666948795318604e-05, -1.5681609511375427e-05, -1.4696270227432251e-05, -1.3710930943489075e-05, -1.2725591659545898e-05, -1.1740252375602722e-05, -1.0754913091659546e-05, -9.76957380771637e-06, -8.784234523773193e-06, -7.798895239830017e-06, -6.813555955886841e-06, -5.8282166719436646e-06, -4.842877388000488e-06, -3.857538104057312e-06, -2.8721988201141357e-06, -1.8868595361709595e-06, -9.015202522277832e-07, 8.381903171539307e-08, 1.0691583156585693e-06, 2.0544975996017456e-06, 3.039836883544922e-06, 4.025176167488098e-06, 5.010515451431274e-06, 5.995854735374451e-06, 6.981194019317627e-06, 7.966533303260803e-06, 8.95187258720398e-06, 9.937211871147156e-06, 1.0922551155090332e-05, 1.1907890439033508e-05, 1.2893229722976685e-05, 1.387856900691986e-05, 1.4863908290863037e-05, 1.5849247574806213e-05, 1.683458685874939e-05, 1.7819926142692566e-05, 1.8805265426635742e-05, 1.979060471057892e-05, 2.0775943994522095e-05, 2.176128327846527e-05, 2.2746622562408447e-05, 2.3731961846351624e-05, 2.47173011302948e-05, 2.5702640414237976e-05, 2.6687979698181152e-05, 2.767331898212433e-05, 2.8658658266067505e-05, 2.964399755001068e-05, 3.062933683395386e-05, 3.1614676117897034e-05, 3.260001540184021e-05, 3.3585354685783386e-05, 3.457069396972656e-05]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 7.0, 3.0, 10.0, 17.0, 13.0, 17.0, 21.0, 25.0, 34.0, 34.0, 43.0, 44.0, 45.0, 61.0, 48.0, 45.0, 53.0, 63.0, 57.0, 53.0, 52.0, 37.0, 27.0, 29.0, 28.0, 15.0, 25.0, 15.0, 11.0, 15.0, 15.0, 9.0, 3.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.552436828613281e-05, -3.438815474510193e-05, -3.3251941204071045e-05, -3.211572766304016e-05, -3.097951412200928e-05, -2.9843300580978394e-05, -2.870708703994751e-05, -2.7570873498916626e-05, -2.6434659957885742e-05, -2.529844641685486e-05, -2.4162232875823975e-05, -2.302601933479309e-05, -2.1889805793762207e-05, -2.0753592252731323e-05, -1.961737871170044e-05, -1.8481165170669556e-05, -1.7344951629638672e-05, -1.6208738088607788e-05, -1.5072524547576904e-05, -1.393631100654602e-05, -1.2800097465515137e-05, -1.1663883924484253e-05, -1.0527670383453369e-05, -9.391456842422485e-06, -8.255243301391602e-06, -7.119029760360718e-06, -5.982816219329834e-06, -4.84660267829895e-06, -3.7103891372680664e-06, -2.5741755962371826e-06, -1.4379620552062988e-06, -3.0174851417541504e-07, 8.344650268554688e-07, 1.9706785678863525e-06, 3.1068921089172363e-06, 4.24310564994812e-06, 5.379319190979004e-06, 6.515532732009888e-06, 7.651746273040771e-06, 8.787959814071655e-06, 9.924173355102539e-06, 1.1060386896133423e-05, 1.2196600437164307e-05, 1.333281397819519e-05, 1.4469027519226074e-05, 1.5605241060256958e-05, 1.6741454601287842e-05, 1.7877668142318726e-05, 1.901388168334961e-05, 2.0150095224380493e-05, 2.1286308765411377e-05, 2.242252230644226e-05, 2.3558735847473145e-05, 2.469494938850403e-05, 2.5831162929534912e-05, 2.6967376470565796e-05, 2.810359001159668e-05, 2.9239803552627563e-05, 3.0376017093658447e-05, 3.151223063468933e-05, 3.2648444175720215e-05, 3.37846577167511e-05, 3.492087125778198e-05, 3.6057084798812866e-05, 3.719329833984375e-05]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 7.0, 6.0, 12.0, 6.0, 19.0, 21.0, 33.0, 43.0, 76.0, 80.0, 141.0, 171.0, 367.0, 583.0, 705.0, 1707.0, 3375.0, 4910.0, 15673.0, 30727.0, 169983.0, 668217.0, 93742.0, 36002.0, 11787.0, 3815.0, 2726.0, 1148.0, 910.0, 554.0, 238.0, 267.0, 156.0, 76.0, 77.0, 44.0, 47.0, 31.0, 16.0, 15.0, 10.0, 10.0, 6.0, 6.0, 4.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-7.212162017822266e-06, -6.996095180511475e-06, -6.780028343200684e-06, -6.563961505889893e-06, -6.3478946685791016e-06, -6.1318278312683105e-06, -5.9157609939575195e-06, -5.6996941566467285e-06, -5.4836273193359375e-06, -5.2675604820251465e-06, -5.0514936447143555e-06, -4.8354268074035645e-06, -4.6193599700927734e-06, -4.403293132781982e-06, -4.187226295471191e-06, -3.9711594581604e-06, -3.7550926208496094e-06, -3.5390257835388184e-06, -3.3229589462280273e-06, -3.1068921089172363e-06, -2.8908252716064453e-06, -2.6747584342956543e-06, -2.4586915969848633e-06, -2.2426247596740723e-06, -2.0265579223632812e-06, -1.8104910850524902e-06, -1.5944242477416992e-06, -1.3783574104309082e-06, -1.1622905731201172e-06, -9.462237358093262e-07, -7.301568984985352e-07, -5.140900611877441e-07, -2.980232238769531e-07, -8.195638656616211e-08, 1.341104507446289e-07, 3.501772880554199e-07, 5.662441253662109e-07, 7.82310962677002e-07, 9.98377799987793e-07, 1.214444637298584e-06, 1.430511474609375e-06, 1.646578311920166e-06, 1.862645149230957e-06, 2.078711986541748e-06, 2.294778823852539e-06, 2.51084566116333e-06, 2.726912498474121e-06, 2.942979335784912e-06, 3.159046173095703e-06, 3.375113010406494e-06, 3.591179847717285e-06, 3.807246685028076e-06, 4.023313522338867e-06, 4.239380359649658e-06, 4.455447196960449e-06, 4.67151403427124e-06, 4.887580871582031e-06, 5.103647708892822e-06, 5.319714546203613e-06, 5.535781383514404e-06, 5.751848220825195e-06, 5.967915058135986e-06, 6.183981895446777e-06, 6.400048732757568e-06, 6.616115570068359e-06]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 10.0, 0.0, 7.0, 0.0, 12.0, 13.0, 0.0, 13.0, 0.0, 26.0, 35.0, 0.0, 47.0, 58.0, 0.0, 42.0, 0.0, 66.0, 72.0, 0.0, 62.0, 0.0, 74.0, 75.0, 0.0, 64.0, 0.0, 74.0, 54.0, 0.0, 43.0, 0.0, 42.0, 27.0, 0.0, 31.0, 21.0, 0.0, 14.0, 0.0, 14.0, 3.0, 0.0, 6.0, 0.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0961666703224182e-06, -1.0598450899124146e-06, -1.0235235095024109e-06, -9.872019290924072e-07, -9.508803486824036e-07, -9.145587682723999e-07, -8.782371878623962e-07, -8.419156074523926e-07, -8.055940270423889e-07, -7.692724466323853e-07, -7.329508662223816e-07, -6.966292858123779e-07, -6.603077054023743e-07, -6.239861249923706e-07, -5.876645445823669e-07, -5.513429641723633e-07, -5.150213837623596e-07, -4.78699803352356e-07, -4.423782229423523e-07, -4.0605664253234863e-07, -3.6973506212234497e-07, -3.334134817123413e-07, -2.9709190130233765e-07, -2.60770320892334e-07, -2.2444874048233032e-07, -1.8812716007232666e-07, -1.51805579662323e-07, -1.1548399925231934e-07, -7.916241884231567e-08, -4.284083843231201e-08, -6.51925802230835e-09, 2.9802322387695312e-08, 6.612390279769897e-08, 1.0244548320770264e-07, 1.387670636177063e-07, 1.7508864402770996e-07, 2.1141022443771362e-07, 2.477318048477173e-07, 2.8405338525772095e-07, 3.203749656677246e-07, 3.5669654607772827e-07, 3.9301812648773193e-07, 4.293397068977356e-07, 4.6566128730773926e-07, 5.019828677177429e-07, 5.383044481277466e-07, 5.746260285377502e-07, 6.109476089477539e-07, 6.472691893577576e-07, 6.835907697677612e-07, 7.199123501777649e-07, 7.562339305877686e-07, 7.925555109977722e-07, 8.288770914077759e-07, 8.651986718177795e-07, 9.015202522277832e-07, 9.378418326377869e-07, 9.741634130477905e-07, 1.0104849934577942e-06, 1.0468065738677979e-06, 1.0831281542778015e-06, 1.1194497346878052e-06, 1.1557713150978088e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 10.0, 5.0, 7.0, 12.0, 24.0, 31.0, 38.0, 47.0, 98.0, 189.0, 427.0, 1148.0, 2746.0, 11604.0, 89425.0, 894158.0, 37694.0, 7290.0, 2050.0, 843.0, 332.0, 139.0, 91.0, 43.0, 22.0, 14.0, 9.0, 8.0, 14.0, 4.0, 4.0, 6.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609325408935547e-05, -1.5525147318840027e-05, -1.4957040548324585e-05, -1.4388933777809143e-05, -1.3820827007293701e-05, -1.325272023677826e-05, -1.2684613466262817e-05, -1.2116506695747375e-05, -1.1548399925231934e-05, -1.0980293154716492e-05, -1.041218638420105e-05, -9.844079613685608e-06, -9.275972843170166e-06, -8.707866072654724e-06, -8.139759302139282e-06, -7.57165253162384e-06, -7.0035457611083984e-06, -6.4354389905929565e-06, -5.867332220077515e-06, -5.299225449562073e-06, -4.731118679046631e-06, -4.163011908531189e-06, -3.594905138015747e-06, -3.026798367500305e-06, -2.4586915969848633e-06, -1.8905848264694214e-06, -1.3224780559539795e-06, -7.543712854385376e-07, -1.862645149230957e-07, 3.818422555923462e-07, 9.499490261077881e-07, 1.51805579662323e-06, 2.086162567138672e-06, 2.6542693376541138e-06, 3.2223761081695557e-06, 3.7904828786849976e-06, 4.3585896492004395e-06, 4.926696419715881e-06, 5.494803190231323e-06, 6.062909960746765e-06, 6.631016731262207e-06, 7.199123501777649e-06, 7.76723027229309e-06, 8.335337042808533e-06, 8.903443813323975e-06, 9.471550583839417e-06, 1.0039657354354858e-05, 1.06077641248703e-05, 1.1175870895385742e-05, 1.1743977665901184e-05, 1.2312084436416626e-05, 1.2880191206932068e-05, 1.344829797744751e-05, 1.4016404747962952e-05, 1.4584511518478394e-05, 1.5152618288993835e-05, 1.5720725059509277e-05, 1.628883183002472e-05, 1.685693860054016e-05, 1.7425045371055603e-05, 1.7993152141571045e-05, 1.8561258912086487e-05, 1.912936568260193e-05, 1.969747245311737e-05, 2.0265579223632812e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 10.0, 12.0, 14.0, 8.0, 14.0, 15.0, 36.0, 39.0, 46.0, 50.0, 75.0, 93.0, 103.0, 89.0, 76.0, 82.0, 49.0, 51.0, 27.0, 26.0, 15.0, 14.0, 5.0, 10.0, 9.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.794929504394531e-06, -6.557442247867584e-06, -6.319954991340637e-06, -6.08246773481369e-06, -5.844980478286743e-06, -5.607493221759796e-06, -5.370005965232849e-06, -5.132518708705902e-06, -4.895031452178955e-06, -4.657544195652008e-06, -4.420056939125061e-06, -4.182569682598114e-06, -3.945082426071167e-06, -3.70759516954422e-06, -3.470107913017273e-06, -3.232620656490326e-06, -2.995133399963379e-06, -2.757646143436432e-06, -2.520158886909485e-06, -2.282671630382538e-06, -2.045184373855591e-06, -1.8076971173286438e-06, -1.5702098608016968e-06, -1.3327226042747498e-06, -1.0952353477478027e-06, -8.577480912208557e-07, -6.202608346939087e-07, -3.8277357816696167e-07, -1.4528632164001465e-07, 9.220093488693237e-08, 3.296881914138794e-07, 5.671754479408264e-07, 8.046627044677734e-07, 1.0421499609947205e-06, 1.2796372175216675e-06, 1.5171244740486145e-06, 1.7546117305755615e-06, 1.9920989871025085e-06, 2.2295862436294556e-06, 2.4670735001564026e-06, 2.7045607566833496e-06, 2.9420480132102966e-06, 3.1795352697372437e-06, 3.4170225262641907e-06, 3.6545097827911377e-06, 3.891997039318085e-06, 4.129484295845032e-06, 4.366971552371979e-06, 4.604458808898926e-06, 4.841946065425873e-06, 5.07943332195282e-06, 5.316920578479767e-06, 5.554407835006714e-06, 5.791895091533661e-06, 6.029382348060608e-06, 6.266869604587555e-06, 6.504356861114502e-06, 6.741844117641449e-06, 6.979331374168396e-06, 7.216818630695343e-06, 7.45430588722229e-06, 7.691793143749237e-06, 7.929280400276184e-06, 8.166767656803131e-06, 8.404254913330078e-06]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 8.0, 7.0, 15.0, 14.0, 24.0, 30.0, 70.0, 75.0, 106.0, 201.0, 217.0, 117.0, 53.0, 22.0, 21.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004399352765176445, -0.00043153626029379666, -0.0004231372440699488, -0.0004147382278461009, -0.00040633921162225306, -0.0003979401953984052, -0.00038954117917455733, -0.00038114216295070946, -0.0003727431467268616, -0.00036434413050301373, -0.00035594511427916586, -0.000347546098055318, -0.00033914708183147013, -0.00033074806560762227, -0.0003223490493837744, -0.00031395003315992653, -0.0003055510460399091, -0.00029715202981606126, -0.0002887530135922134, -0.0002803539973683655, -0.00027195498114451766, -0.0002635559649206698, -0.00025515694869682193, -0.00024675793247297406, -0.0002383589162491262, -0.00022995990002527833, -0.00022156088380143046, -0.0002131618675775826, -0.00020476285135373473, -0.00019636383512988687, -0.000187964818906039, -0.00017956580268219113, -0.0001711667573545128, -0.00016276774113066494, -0.00015436872490681708, -0.0001459697086829692, -0.00013757069245912135, -0.00012917167623527348, -0.00012077266728738323, -0.00011237365106353536, -0.00010397464211564511, -9.557562589179724e-05, -8.717660966794938e-05, -7.877759344410151e-05, -7.037857722025365e-05, -6.197956099640578e-05, -5.358055204851553e-05, -4.518153582466766e-05, -3.6782519600819796e-05, -2.838350337697193e-05, -1.9984488972113468e-05, -1.1585474567255005e-05, -3.186458343407139e-06, 5.212557880440727e-06, 1.3611570466309786e-05, 2.2010586690157652e-05, 3.0409602914005518e-05, 3.8808619137853384e-05, 4.720763536170125e-05, 5.560664794757031e-05, 6.400566780939698e-05, 7.240468403324485e-05, 8.08036929811351e-05, 8.920270920498297e-05, 9.760172542883083e-05]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 5.0, 10.0, 8.0, 4.0, 12.0, 17.0, 17.0, 16.0, 13.0, 17.0, 28.0, 24.0, 23.0, 35.0, 38.0, 38.0, 35.0, 34.0, 43.0, 52.0, 49.0, 54.0, 31.0, 33.0, 46.0, 30.0, 37.0, 38.0, 23.0, 29.0, 19.0, 21.0, 10.0, 21.0, 13.0, 8.0, 8.0, 11.0, 8.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.608268737792969e-05, -9.329523891210556e-05, -9.050779044628143e-05, -8.77203419804573e-05, -8.493289351463318e-05, -8.214544504880905e-05, -7.935799658298492e-05, -7.65705481171608e-05, -7.378309965133667e-05, -7.099565118551254e-05, -6.820820271968842e-05, -6.542075425386429e-05, -6.263330578804016e-05, -5.9845857322216034e-05, -5.705840885639191e-05, -5.427096039056778e-05, -5.148351192474365e-05, -4.8696063458919525e-05, -4.59086149930954e-05, -4.312116652727127e-05, -4.0333718061447144e-05, -3.7546269595623016e-05, -3.475882112979889e-05, -3.197137266397476e-05, -2.9183924198150635e-05, -2.6396475732326508e-05, -2.360902726650238e-05, -2.0821578800678253e-05, -1.8034130334854126e-05, -1.5246681869029999e-05, -1.2459233403205872e-05, -9.671784937381744e-06, -6.884336471557617e-06, -4.09688800573349e-06, -1.3094395399093628e-06, 1.4780089259147644e-06, 4.265457391738892e-06, 7.052905857563019e-06, 9.840354323387146e-06, 1.2627802789211273e-05, 1.54152512550354e-05, 1.8202699720859528e-05, 2.0990148186683655e-05, 2.3777596652507782e-05, 2.656504511833191e-05, 2.9352493584156036e-05, 3.2139942049980164e-05, 3.492739051580429e-05, 3.771483898162842e-05, 4.0502287447452545e-05, 4.328973591327667e-05, 4.60771843791008e-05, 4.886463284492493e-05, 5.1652081310749054e-05, 5.443952977657318e-05, 5.722697824239731e-05, 6.0014426708221436e-05, 6.280187517404556e-05, 6.558932363986969e-05, 6.837677210569382e-05, 7.116422057151794e-05, 7.395166903734207e-05, 7.67391175031662e-05, 7.952656596899033e-05, 8.231401443481445e-05]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 6.0, 14.0, 10.0, 22.0, 24.0, 30.0, 43.0, 65.0, 120.0, 254.0, 134.0, 66.0, 57.0, 34.0, 25.0, 21.0, 9.0, 15.0, 13.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5974044799804688e-05, -1.5194527804851532e-05, -1.4415010809898376e-05, -1.3635493814945221e-05, -1.2855976819992065e-05, -1.207645982503891e-05, -1.1296942830085754e-05, -1.0517425835132599e-05, -9.737908840179443e-06, -8.958391845226288e-06, -8.178874850273132e-06, -7.399357855319977e-06, -6.619840860366821e-06, -5.840323865413666e-06, -5.06080687046051e-06, -4.281289875507355e-06, -3.5017728805541992e-06, -2.7222558856010437e-06, -1.942738890647888e-06, -1.1632218956947327e-06, -3.8370490074157715e-07, 3.9581209421157837e-07, 1.1753290891647339e-06, 1.9548460841178894e-06, 2.734363079071045e-06, 3.5138800740242004e-06, 4.293397068977356e-06, 5.0729140639305115e-06, 5.852431058883667e-06, 6.6319480538368225e-06, 7.411465048789978e-06, 8.190982043743134e-06, 8.970499038696289e-06, 9.750016033649445e-06, 1.05295330286026e-05, 1.1309050023555756e-05, 1.2088567018508911e-05, 1.2868084013462067e-05, 1.3647601008415222e-05, 1.4427118003368378e-05, 1.5206634998321533e-05, 1.598615199327469e-05, 1.6765668988227844e-05, 1.7545185983181e-05, 1.8324702978134155e-05, 1.910421997308731e-05, 1.9883736968040466e-05, 2.0663253962993622e-05, 2.1442770957946777e-05, 2.2222287952899933e-05, 2.300180494785309e-05, 2.3781321942806244e-05, 2.45608389377594e-05, 2.5340355932712555e-05, 2.611987292766571e-05, 2.6899389922618866e-05, 2.767890691757202e-05, 2.8458423912525177e-05, 2.9237940907478333e-05, 3.0017457902431488e-05, 3.0796974897384644e-05, 3.15764918923378e-05, 3.2356008887290955e-05, 3.313552588224411e-05, 3.3915042877197266e-05]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 0.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 31.0, 29.0, 53.0, 98.0, 155.0, 261.0, 499.0, 1157.0, 3081.0, 12597.0, 8172233.0, 185380.0, 8696.0, 2402.0, 920.0, 398.0, 218.0, 103.0, 64.0, 54.0, 25.0, 22.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.782462100498378e-05, -8.530747436452657e-05, -8.279032772406936e-05, -8.027317380765453e-05, -7.775602716719732e-05, -7.52388805267401e-05, -7.272172661032528e-05, -7.020457996986806e-05, -6.768743332941085e-05, -6.517028668895364e-05, -6.265314004849643e-05, -6.01359861320816e-05, -5.7618839491624385e-05, -5.510169285116717e-05, -5.258454257273115e-05, -5.006739229429513e-05, -4.755024565383792e-05, -4.5033099013380706e-05, -4.2515948734944686e-05, -3.9998798456508666e-05, -3.748165181605145e-05, -3.496450517559424e-05, -3.244735489715822e-05, -2.9930206437711604e-05, -2.7413057978264987e-05, -2.489590951881837e-05, -2.2378761059371755e-05, -1.9861612599925138e-05, -1.734446414047852e-05, -1.4827315681031905e-05, -1.2310167221585289e-05, -9.793018762138672e-06, -7.2758630267344415e-06, -4.758714567287825e-06, -2.2415661078412086e-06, 2.755823516054079e-07, 2.7927308110520244e-06, 5.309879270498641e-06, 7.827027729945257e-06, 1.0344176189391874e-05, 1.286132464883849e-05, 1.5378473108285107e-05, 1.7895621567731723e-05, 2.041277002717834e-05, 2.2929918486624956e-05, 2.5447066946071573e-05, 2.796421540551819e-05, 3.0481363864964806e-05, 3.299851232441142e-05, 3.5515658964868635e-05, 3.8032809243304655e-05, 4.0549959521740675e-05, 4.306710616219789e-05, 4.55842528026551e-05, 4.810140308109112e-05, 5.061855335952714e-05, 5.3135699999984354e-05, 5.565284664044157e-05, 5.816999691887759e-05, 6.068714719731361e-05, 6.320429383777082e-05, 6.572144047822803e-05, 6.823858711868525e-05, 7.075574103510007e-05, 7.327288767555729e-05]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 12.0, 3.0, 10.0, 5.0, 8.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03335392952431e-05, -5.793615127913654e-05, -5.553875962505117e-05, -5.314137160894461e-05, -5.074397995485924e-05, -4.834659193875268e-05, -4.594920028466731e-05, -4.355181226856075e-05, -4.115442425245419e-05, -3.875703623634763e-05, -3.635964458226226e-05, -3.39622565661557e-05, -3.1564864912070334e-05, -2.9167476895963773e-05, -2.677008706086781e-05, -2.4372697225771844e-05, -2.1975305571686476e-05, -1.9577915736590512e-05, -1.7180525901494548e-05, -1.4783136975893285e-05, -1.238574714079732e-05, -9.988357305701356e-06, -7.590968380100094e-06, -5.193578545004129e-06, -2.796188709908165e-06, -3.987991021858761e-07, 1.998590505536413e-06, 4.395979885885026e-06, 6.793369720980991e-06, 9.190759556076955e-06, 1.1588148481678218e-05, 1.3985538316774182e-05, 1.638292451389134e-05, 1.8780314348987304e-05, 2.1177704184083268e-05, 2.357509220018983e-05, 2.5972483854275197e-05, 2.8369871870381758e-05, 3.076725988648832e-05, 3.3164651540573686e-05, 3.5562043194659054e-05, 3.7959431210765615e-05, 4.035682286485098e-05, 4.2754210880957544e-05, 4.515160253504291e-05, 4.754899055114947e-05, 4.9946378567256033e-05, 5.23437702213414e-05, 5.474115823744796e-05, 5.713854625355452e-05, 5.953593790763989e-05, 6.193332956172526e-05, 6.433071393985301e-05, 6.672810559393838e-05, 6.912549724802375e-05, 7.15228816261515e-05, 7.392027328023687e-05, 7.631766493432224e-05, 7.871504931244999e-05, 8.111244096653536e-05, 8.350983262062073e-05, 8.59072242747061e-05, 8.830460865283385e-05, 9.070200030691922e-05, 9.309939196100459e-05]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 9.0, 9.0, 21.0, 24.0, 33.0, 40.0, 55.0, 44.0, 55.0, 76.0, 69.0, 68.0, 68.0, 69.0, 70.0, 60.0, 49.0, 36.0, 31.0, 25.0, 22.0, 16.0, 13.0, 8.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-06, -8.637085556983948e-06, -8.333474397659302e-06, -8.029863238334656e-06, -7.72625207901001e-06, -7.422640919685364e-06, -7.119029760360718e-06, -6.815418601036072e-06, -6.511807441711426e-06, -6.20819628238678e-06, -5.904585123062134e-06, -5.600973963737488e-06, -5.297362804412842e-06, -4.993751645088196e-06, -4.69014048576355e-06, -4.386529326438904e-06, -4.082918167114258e-06, -3.779307007789612e-06, -3.475695848464966e-06, -3.17208468914032e-06, -2.868473529815674e-06, -2.564862370491028e-06, -2.261251211166382e-06, -1.957640051841736e-06, -1.6540288925170898e-06, -1.3504177331924438e-06, -1.0468065738677979e-06, -7.431954145431519e-07, -4.3958425521850586e-07, -1.3597309589385986e-07, 1.6763806343078613e-07, 4.7124922275543213e-07, 7.748603820800781e-07, 1.0784715414047241e-06, 1.3820827007293701e-06, 1.6856938600540161e-06, 1.989305019378662e-06, 2.292916178703308e-06, 2.596527338027954e-06, 2.9001384973526e-06, 3.203749656677246e-06, 3.507360816001892e-06, 3.810971975326538e-06, 4.114583134651184e-06, 4.41819429397583e-06, 4.721805453300476e-06, 5.025416612625122e-06, 5.329027771949768e-06, 5.632638931274414e-06, 5.93625009059906e-06, 6.239861249923706e-06, 6.543472409248352e-06, 6.847083568572998e-06, 7.150694727897644e-06, 7.45430588722229e-06, 7.757917046546936e-06, 8.061528205871582e-06, 8.365139365196228e-06, 8.668750524520874e-06, 8.97236168384552e-06, 9.275972843170166e-06, 9.579584002494812e-06, 9.883195161819458e-06, 1.0186806321144104e-05, 1.049041748046875e-05]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 7.0, 8.0, 13.0, 20.0, 20.0, 52.0, 63.0, 130.0, 185.0, 320.0, 608.0, 1220.0, 2768.0, 7542.0, 27023.0, 207186.0, 235654.0, 28341.0, 7449.0, 2895.0, 1255.0, 620.0, 347.0, 194.0, 131.0, 69.0, 48.0, 33.0, 19.0, 12.0, 16.0, 1.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002351999282836914, -0.00022579915821552277, -0.00021639838814735413, -0.00020699761807918549, -0.00019759684801101685, -0.0001881960779428482, -0.00017879530787467957, -0.00016939453780651093, -0.00015999376773834229, -0.00015059299767017365, -0.000141192227602005, -0.00013179145753383636, -0.00012239068746566772, -0.00011298991739749908, -0.00010358914732933044, -9.41883772611618e-05, -8.478760719299316e-05, -7.538683712482452e-05, -6.598606705665588e-05, -5.6585296988487244e-05, -4.7184526920318604e-05, -3.778375685214996e-05, -2.8382986783981323e-05, -1.8982216715812683e-05, -9.581446647644043e-06, -1.8067657947540283e-07, 9.220093488693237e-06, 1.8620863556861877e-05, 2.8021633625030518e-05, 3.742240369319916e-05, 4.68231737613678e-05, 5.622394382953644e-05, 6.562471389770508e-05, 7.502548396587372e-05, 8.442625403404236e-05, 9.3827024102211e-05, 0.00010322779417037964, 0.00011262856423854828, 0.00012202933430671692, 0.00013143010437488556, 0.0001408308744430542, 0.00015023164451122284, 0.00015963241457939148, 0.00016903318464756012, 0.00017843395471572876, 0.0001878347247838974, 0.00019723549485206604, 0.00020663626492023468, 0.00021603703498840332, 0.00022543780505657196, 0.0002348385751247406, 0.00024423934519290924, 0.0002536401152610779, 0.0002630408853292465, 0.00027244165539741516, 0.0002818424254655838, 0.00029124319553375244, 0.0003006439656019211, 0.0003100447356700897, 0.00031944550573825836, 0.000328846275806427, 0.00033824704587459564, 0.0003476478159427643, 0.0003570485860109329, 0.00036644935607910156]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 10.0, 3.0, 12.0, 21.0, 29.0, 25.0, 40.0, 48.0, 41.0, 57.0, 56.0, 80.0, 72.0, 80.0, 69.0, 64.0, 49.0, 48.0, 43.0, 23.0, 24.0, 21.0, 18.0, 16.0, 5.0, 16.0, 9.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.390146255493164e-05, -2.3117288947105408e-05, -2.2333115339279175e-05, -2.1548941731452942e-05, -2.076476812362671e-05, -1.9980594515800476e-05, -1.9196420907974243e-05, -1.841224730014801e-05, -1.7628073692321777e-05, -1.6843900084495544e-05, -1.605972647666931e-05, -1.527555286884308e-05, -1.4491379261016846e-05, -1.3707205653190613e-05, -1.292303204536438e-05, -1.2138858437538147e-05, -1.1354684829711914e-05, -1.0570511221885681e-05, -9.786337614059448e-06, -9.002164006233215e-06, -8.217990398406982e-06, -7.4338167905807495e-06, -6.649643182754517e-06, -5.865469574928284e-06, -5.081295967102051e-06, -4.297122359275818e-06, -3.512948751449585e-06, -2.728775143623352e-06, -1.944601535797119e-06, -1.1604279279708862e-06, -3.762543201446533e-07, 4.079192876815796e-07, 1.1920928955078125e-06, 1.9762665033340454e-06, 2.7604401111602783e-06, 3.5446137189865112e-06, 4.328787326812744e-06, 5.112960934638977e-06, 5.89713454246521e-06, 6.681308150291443e-06, 7.465481758117676e-06, 8.249655365943909e-06, 9.033828973770142e-06, 9.818002581596375e-06, 1.0602176189422607e-05, 1.138634979724884e-05, 1.2170523405075073e-05, 1.2954697012901306e-05, 1.3738870620727539e-05, 1.4523044228553772e-05, 1.5307217836380005e-05, 1.6091391444206238e-05, 1.687556505203247e-05, 1.7659738659858704e-05, 1.8443912267684937e-05, 1.922808587551117e-05, 2.0012259483337402e-05, 2.0796433091163635e-05, 2.1580606698989868e-05, 2.23647803068161e-05, 2.3148953914642334e-05, 2.3933127522468567e-05, 2.47173011302948e-05, 2.5501474738121033e-05, 2.6285648345947266e-05]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 12.0, 15.0, 22.0, 26.0, 39.0, 58.0, 60.0, 66.0, 70.0, 30.0, 20.0, 16.0, 12.0, 3.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662511153379455e-05, -3.491153984214179e-05, -3.319796815048903e-05, -3.1484392820857465e-05, -2.9770821129204705e-05, -2.8057249437551945e-05, -2.6343675926909782e-05, -2.463010241626762e-05, -2.291653072461486e-05, -2.12029590329621e-05, -1.9489385522319935e-05, -1.7775812011677772e-05, -1.6062240320025012e-05, -1.434866771887755e-05, -1.2635095117730089e-05, -1.0921522516582627e-05, -9.207949915435165e-06, -7.4943773142877035e-06, -5.780804713140242e-06, -4.06723211199278e-06, -2.3536595108453184e-06, -6.400869096978568e-07, 1.073485691449605e-06, 2.7870582925970666e-06, 4.500630893744528e-06, 6.21420349489199e-06, 7.927776096039452e-06, 9.641348697186913e-06, 1.1354921298334375e-05, 1.3068493899481837e-05, 1.4782066500629298e-05, 1.6495640011271462e-05, 1.8209211702924222e-05, 1.992278339457698e-05, 2.1636356905219145e-05, 2.334993041586131e-05, 2.506350210751407e-05, 2.677707379916683e-05, 2.8490647309808992e-05, 3.0204220820451155e-05, 3.1917792512103915e-05, 3.3631364203756675e-05, 3.5344935895409435e-05, 3.7058511225041e-05, 3.877208291669376e-05, 4.048565460834652e-05, 4.219922993797809e-05, 4.391280162963085e-05, 4.562637332128361e-05, 4.733994501293637e-05, 4.905351670458913e-05, 5.0767092034220695e-05, 5.2480663725873455e-05, 5.4194235417526215e-05, 5.590781074715778e-05, 5.762138243881054e-05, 5.93349541304633e-05, 6.104852946009487e-05, 6.276209751376882e-05, 6.447567284340039e-05, 6.618924089707434e-05, 6.790281622670591e-05, 6.961639155633748e-05, 7.132995961001143e-05, 7.3043534939643e-05]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 10.0, 8.0, 8.0, 9.0, 6.0, 32.0, 55.0, 78.0, 63.0, 77.0, 32.0, 18.0, 11.0, 7.0, 11.0, 13.0, 7.0, 6.0, 8.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010335445404052734, -0.00010058097541332245, -9.780749678611755e-05, -9.503401815891266e-05, -9.226053953170776e-05, -8.948706090450287e-05, -8.671358227729797e-05, -8.394010365009308e-05, -8.116662502288818e-05, -7.839314639568329e-05, -7.56196677684784e-05, -7.28461891412735e-05, -7.00727105140686e-05, -6.729923188686371e-05, -6.452575325965881e-05, -6.175227463245392e-05, -5.8978796005249023e-05, -5.620531737804413e-05, -5.3431838750839233e-05, -5.065836012363434e-05, -4.788488149642944e-05, -4.511140286922455e-05, -4.233792424201965e-05, -3.956444561481476e-05, -3.679096698760986e-05, -3.401748836040497e-05, -3.124400973320007e-05, -2.8470531105995178e-05, -2.5697052478790283e-05, -2.2923573851585388e-05, -2.0150095224380493e-05, -1.7376616597175598e-05, -1.4603137969970703e-05, -1.1829659342765808e-05, -9.056180715560913e-06, -6.282702088356018e-06, -3.509223461151123e-06, -7.35744833946228e-07, 2.037733793258667e-06, 4.811212420463562e-06, 7.584691047668457e-06, 1.0358169674873352e-05, 1.3131648302078247e-05, 1.5905126929283142e-05, 1.8678605556488037e-05, 2.1452084183692932e-05, 2.4225562810897827e-05, 2.6999041438102722e-05, 2.9772520065307617e-05, 3.254599869251251e-05, 3.531947731971741e-05, 3.80929559469223e-05, 4.08664345741272e-05, 4.363991320133209e-05, 4.641339182853699e-05, 4.918687045574188e-05, 5.196034908294678e-05, 5.473382771015167e-05, 5.750730633735657e-05, 6.028078496456146e-05, 6.305426359176636e-05, 6.582774221897125e-05, 6.860122084617615e-05, 7.137469947338104e-05, 7.414817810058594e-05]}, "eval/loss": 16.721336364746094, "eval/bleu": 0.0, "eval/runtime": 3683.9491, "eval/samples_per_second": 4.007, "eval/steps_per_second": 1.002} \ No newline at end of file +{"train/loss": 4.673, "train/learning_rate": 0.0002719244724617255, "train/epoch": 0.77, "train/global_step": 5000, "_runtime": 53868, "_timestamp": 1651652316, "_step": 5009, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1022.0], "bins": [-358.7091979980469, -353.0705261230469, -347.4318542480469, -341.793212890625, -336.154541015625, -330.515869140625, -324.877197265625, -319.238525390625, -313.599853515625, -307.961181640625, -302.322509765625, -296.683837890625, -291.0451965332031, -285.4065246582031, -279.7678527832031, -274.1291809082031, -268.49053955078125, -262.85186767578125, -257.21319580078125, -251.5745391845703, -245.9358673095703, -240.29721069335938, -234.65853881835938, -229.01986694335938, -223.38119506835938, -217.74252319335938, -212.10386657714844, -206.46519470214844, -200.82652282714844, -195.1878662109375, -189.5491943359375, -183.9105224609375, -178.27188110351562, -172.63320922851562, -166.9945526123047, -161.3558807373047, -155.7172088623047, -150.07855224609375, -144.43988037109375, -138.80120849609375, -133.1625518798828, -127.52388763427734, -121.88521575927734, -116.24655151367188, -110.6078872680664, -104.96922302246094, -99.33055114746094, -93.69188690185547, -88.05321502685547, -82.41455078125, -76.77587890625, -71.13721466064453, -65.49855041503906, -59.85988235473633, -54.221214294433594, -48.582550048828125, -42.943878173828125, -37.30521011352539, -31.666545867919922, -26.027877807617188, -20.389211654663086, -14.750545501708984, -9.11187744140625, -3.4732131958007812, 2.165454387664795]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 0.0, 4.0, 7.0, 7.0, 8.0, 10.0, 19.0, 17.0, 22.0, 17.0, 26.0, 41.0, 52.0, 46.0, 53.0, 61.0, 50.0, 52.0, 52.0, 65.0, 46.0, 49.0, 53.0, 42.0, 43.0, 46.0, 26.0, 25.0, 19.0, 12.0, 9.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.737998962402344, -14.262447357177734, -13.786895751953125, -13.311344146728516, -12.835792541503906, -12.360240936279297, -11.884689331054688, -11.409137725830078, -10.933586120605469, -10.45803451538086, -9.98248291015625, -9.50693130493164, -9.031379699707031, -8.555828094482422, -8.080276489257812, -7.604724884033203, -7.129173755645752, -6.653622150421143, -6.178070545196533, -5.702518939971924, -5.2269673347473145, -4.751416206359863, -4.275864601135254, -3.8003127574920654, -3.324761152267456, -2.8492095470428467, -2.3736579418182373, -1.8981064558029175, -1.422554850578308, -0.9470033645629883, -0.4714517593383789, 0.004099845886230469, 0.47965145111083984, 0.9552030563354492, 1.4307546615600586, 1.9063061475753784, 2.3818578720092773, 2.8574092388153076, 3.332960844039917, 3.8085124492645264, 4.284064292907715, 4.759615898132324, 5.235167503356934, 5.710719108581543, 6.186270713806152, 6.661822319030762, 7.137373924255371, 7.6129255294799805, 8.088476181030273, 8.564027786254883, 9.039579391479492, 9.515130996704102, 9.990682601928711, 10.46623420715332, 10.94178581237793, 11.417337417602539, 11.892889022827148, 12.368440628051758, 12.843992233276367, 13.319543838500977, 13.795095443725586, 14.270647048950195, 14.746198654174805, 15.221750259399414, 15.697301864624023]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 11.0, 14.0, 28.0, 21.0, 36.0, 56.0, 63.0, 94.0, 116.0, 181.0, 204.0, 301.0, 435.0, 519.0, 824.0, 1148.0, 1894.0, 3690.0, 8863.0, 25768.0, 4107578.0, 24822.0, 8383.0, 3490.0, 1869.0, 1054.0, 733.0, 530.0, 388.0, 306.0, 205.0, 175.0, 106.0, 83.0, 63.0, 54.0, 40.0, 31.0, 28.0, 17.0, 11.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.8359375, -4.67724609375, -4.5185546875, -4.35986328125, -4.201171875, -4.04248046875, -3.8837890625, -3.72509765625, -3.56640625, -3.40771484375, -3.2490234375, -3.09033203125, -2.931640625, -2.77294921875, -2.6142578125, -2.45556640625, -2.296875, -2.13818359375, -1.9794921875, -1.82080078125, -1.662109375, -1.50341796875, -1.3447265625, -1.18603515625, -1.02734375, -0.86865234375, -0.7099609375, -0.55126953125, -0.392578125, -0.23388671875, -0.0751953125, 0.08349609375, 0.2421875, 0.40087890625, 0.5595703125, 0.71826171875, 0.876953125, 1.03564453125, 1.1943359375, 1.35302734375, 1.51171875, 1.67041015625, 1.8291015625, 1.98779296875, 2.146484375, 2.30517578125, 2.4638671875, 2.62255859375, 2.78125, 2.93994140625, 3.0986328125, 3.25732421875, 3.416015625, 3.57470703125, 3.7333984375, 3.89208984375, 4.05078125, 4.20947265625, 4.3681640625, 4.52685546875, 4.685546875, 4.84423828125, 5.0029296875, 5.16162109375, 5.3203125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 8.0, 8.0, 11.0, 16.0, 15.0, 16.0, 31.0, 38.0, 49.0, 48.0, 56.0, 67.0, 48.0, 60.0, 64.0, 86.0, 57.0, 50.0, 51.0, 50.0, 37.0, 29.0, 25.0, 22.0, 14.0, 13.0, 6.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2890625, -8.9915771484375, -8.694091796875, -8.3966064453125, -8.09912109375, -7.8016357421875, -7.504150390625, -7.2066650390625, -6.9091796875, -6.6116943359375, -6.314208984375, -6.0167236328125, -5.71923828125, -5.4217529296875, -5.124267578125, -4.8267822265625, -4.529296875, -4.2318115234375, -3.934326171875, -3.6368408203125, -3.33935546875, -3.0418701171875, -2.744384765625, -2.4468994140625, -2.1494140625, -1.8519287109375, -1.554443359375, -1.2569580078125, -0.95947265625, -0.6619873046875, -0.364501953125, -0.0670166015625, 0.23046875, 0.5279541015625, 0.825439453125, 1.1229248046875, 1.42041015625, 1.7178955078125, 2.015380859375, 2.3128662109375, 2.6103515625, 2.9078369140625, 3.205322265625, 3.5028076171875, 3.80029296875, 4.0977783203125, 4.395263671875, 4.6927490234375, 4.990234375, 5.2877197265625, 5.585205078125, 5.8826904296875, 6.18017578125, 6.4776611328125, 6.775146484375, 7.0726318359375, 7.3701171875, 7.6676025390625, 7.965087890625, 8.2625732421875, 8.56005859375, 8.8575439453125, 9.155029296875, 9.4525146484375, 9.75]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 13.0, 81.0, 4194068.0, 51.0, 14.0, 6.0, 5.0, 8.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-207.875, -200.314453125, -192.75390625, -185.193359375, -177.6328125, -170.072265625, -162.51171875, -154.951171875, -147.390625, -139.830078125, -132.26953125, -124.708984375, -117.1484375, -109.587890625, -102.02734375, -94.466796875, -86.90625, -79.345703125, -71.78515625, -64.224609375, -56.6640625, -49.103515625, -41.54296875, -33.982421875, -26.421875, -18.861328125, -11.30078125, -3.740234375, 3.8203125, 11.380859375, 18.94140625, 26.501953125, 34.0625, 41.623046875, 49.18359375, 56.744140625, 64.3046875, 71.865234375, 79.42578125, 86.986328125, 94.546875, 102.107421875, 109.66796875, 117.228515625, 124.7890625, 132.349609375, 139.91015625, 147.470703125, 155.03125, 162.591796875, 170.15234375, 177.712890625, 185.2734375, 192.833984375, 200.39453125, 207.955078125, 215.515625, 223.076171875, 230.63671875, 238.197265625, 245.7578125, 253.318359375, 260.87890625, 268.439453125, 276.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 28.0, 3808.0, 161.0, 13.0, 8.0, 4.0, 7.0, 8.0, 4.0, 1.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.654296875, -2.559326171875, -2.46435546875, -2.369384765625, -2.2744140625, -2.179443359375, -2.08447265625, -1.989501953125, -1.89453125, -1.799560546875, -1.70458984375, -1.609619140625, -1.5146484375, -1.419677734375, -1.32470703125, -1.229736328125, -1.134765625, -1.039794921875, -0.94482421875, -0.849853515625, -0.7548828125, -0.659912109375, -0.56494140625, -0.469970703125, -0.375, -0.280029296875, -0.18505859375, -0.090087890625, 0.0048828125, 0.099853515625, 0.19482421875, 0.289794921875, 0.384765625, 0.479736328125, 0.57470703125, 0.669677734375, 0.7646484375, 0.859619140625, 0.95458984375, 1.049560546875, 1.14453125, 1.239501953125, 1.33447265625, 1.429443359375, 1.5244140625, 1.619384765625, 1.71435546875, 1.809326171875, 1.904296875, 1.999267578125, 2.09423828125, 2.189208984375, 2.2841796875, 2.379150390625, 2.47412109375, 2.569091796875, 2.6640625, 2.759033203125, 2.85400390625, 2.948974609375, 3.0439453125, 3.138916015625, 3.23388671875, 3.328857421875, 3.423828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 43.0, 213.0, 652.0, 96.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.891059398651123, -6.073329925537109, -5.2555999755859375, -4.437870025634766, -3.620140552520752, -2.80241060256958, -1.9846811294555664, -1.1669516563415527, -0.34922170639038086, 0.4685080051422119, 1.2862377166748047, 2.1039674282073975, 2.9216971397399902, 3.739427089691162, 4.557156562805176, 5.3748860359191895, 6.192615985870361, 7.010345458984375, 7.828075408935547, 8.645805358886719, 9.46353530883789, 10.281265258789062, 11.098994255065918, 11.916723251342773, 12.734453201293945, 13.552183151245117, 14.369913101196289, 15.187642097473145, 16.00537109375, 16.823101043701172, 17.640830993652344, 18.458560943603516, 19.276290893554688, 20.09402084350586, 20.91175079345703, 21.729480743408203, 22.547210693359375, 23.364940643310547, 24.182668685913086, 25.000398635864258, 25.81812858581543, 26.6358585357666, 27.453588485717773, 28.271318435668945, 29.089046478271484, 29.906776428222656, 30.724506378173828, 31.542236328125, 32.35996627807617, 33.177696228027344, 33.995426177978516, 34.81315612792969, 35.63088607788086, 36.44861602783203, 37.2663459777832, 38.084075927734375, 38.90180206298828, 39.71953201293945, 40.537261962890625, 41.3549919128418, 42.17272186279297, 42.99045181274414, 43.80818176269531, 44.62590789794922, 45.443641662597656]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 1.0, 7.0, 7.0, 10.0, 6.0, 6.0, 13.0, 19.0, 22.0, 28.0, 22.0, 37.0, 45.0, 42.0, 48.0, 49.0, 61.0, 50.0, 53.0, 47.0, 57.0, 53.0, 52.0, 41.0, 50.0, 27.0, 33.0, 29.0, 18.0, 17.0, 12.0, 14.0, 13.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.765387535095215, -8.506000518798828, -8.246613502502441, -7.9872260093688965, -7.727838516235352, -7.468451499938965, -7.209064483642578, -6.949676990509033, -6.690289497375488, -6.430902481079102, -6.171514987945557, -5.91212797164917, -5.652740478515625, -5.393353462219238, -5.133966445922852, -4.874578952789307, -4.61519193649292, -4.355804920196533, -4.096417427062988, -3.8370304107666016, -3.5776429176330566, -3.31825590133667, -3.058868646621704, -2.7994813919067383, -2.5400941371917725, -2.2807068824768066, -2.021319627761841, -1.7619324922561646, -1.5025452375411987, -1.243157982826233, -0.9837708473205566, -0.7243835926055908, -0.464996337890625, -0.20560911297798157, 0.053778111934661865, 0.3131653070449829, 0.5725525617599487, 0.8319398164749146, 1.0913269519805908, 1.3507142066955566, 1.6101014614105225, 1.8694887161254883, 2.128875970840454, 2.38826322555542, 2.6476502418518066, 2.9070377349853516, 3.1664247512817383, 3.425812005996704, 3.68519926071167, 3.9445865154266357, 4.203973770141602, 4.463360786437988, 4.722748279571533, 4.98213529586792, 5.241522789001465, 5.500909805297852, 5.760296821594238, 6.019683837890625, 6.27907133102417, 6.538458347320557, 6.797845840454102, 7.057232856750488, 7.316619873046875, 7.57600736618042, 7.835394859313965]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 5.0, 12.0, 4.0, 10.0, 13.0, 17.0, 30.0, 30.0, 59.0, 73.0, 103.0, 142.0, 255.0, 398.0, 609.0, 1102.0, 1918.0, 3680.0, 7986.0, 24569.0, 757908.0, 216116.0, 18928.0, 7063.0, 3308.0, 1605.0, 959.0, 558.0, 362.0, 226.0, 146.0, 105.0, 66.0, 47.0, 39.0, 20.0, 20.0, 20.0, 6.0, 7.0, 9.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99560546875, -0.9623184204101562, -0.9290313720703125, -0.8957443237304688, -0.862457275390625, -0.8291702270507812, -0.7958831787109375, -0.7625961303710938, -0.72930908203125, -0.6960220336914062, -0.6627349853515625, -0.6294479370117188, -0.596160888671875, -0.5628738403320312, -0.5295867919921875, -0.49629974365234375, -0.4630126953125, -0.42972564697265625, -0.3964385986328125, -0.36315155029296875, -0.329864501953125, -0.29657745361328125, -0.2632904052734375, -0.23000335693359375, -0.19671630859375, -0.16342926025390625, -0.1301422119140625, -0.09685516357421875, -0.063568115234375, -0.03028106689453125, 0.0030059814453125, 0.03629302978515625, 0.069580078125, 0.10286712646484375, 0.1361541748046875, 0.16944122314453125, 0.202728271484375, 0.23601531982421875, 0.2693023681640625, 0.30258941650390625, 0.33587646484375, 0.36916351318359375, 0.4024505615234375, 0.43573760986328125, 0.469024658203125, 0.5023117065429688, 0.5355987548828125, 0.5688858032226562, 0.6021728515625, 0.6354598999023438, 0.6687469482421875, 0.7020339965820312, 0.735321044921875, 0.7686080932617188, 0.8018951416015625, 0.8351821899414062, 0.86846923828125, 0.9017562866210938, 0.9350433349609375, 0.9683303833007812, 1.001617431640625, 1.0349044799804688, 1.0681915283203125, 1.1014785766601562, 1.134765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 10.0, 6.0, 13.0, 10.0, 13.0, 20.0, 29.0, 32.0, 47.0, 57.0, 49.0, 68.0, 76.0, 65.0, 86.0, 65.0, 71.0, 55.0, 44.0, 54.0, 33.0, 29.0, 20.0, 14.0, 13.0, 5.0, 3.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.21484375, -4.090240478515625, -3.96563720703125, -3.841033935546875, -3.7164306640625, -3.591827392578125, -3.46722412109375, -3.342620849609375, -3.218017578125, -3.093414306640625, -2.96881103515625, -2.844207763671875, -2.7196044921875, -2.595001220703125, -2.47039794921875, -2.345794677734375, -2.22119140625, -2.096588134765625, -1.97198486328125, -1.847381591796875, -1.7227783203125, -1.598175048828125, -1.47357177734375, -1.348968505859375, -1.224365234375, -1.099761962890625, -0.97515869140625, -0.850555419921875, -0.7259521484375, -0.601348876953125, -0.47674560546875, -0.352142333984375, -0.2275390625, -0.102935791015625, 0.02166748046875, 0.146270751953125, 0.2708740234375, 0.395477294921875, 0.52008056640625, 0.644683837890625, 0.769287109375, 0.893890380859375, 1.01849365234375, 1.143096923828125, 1.2677001953125, 1.392303466796875, 1.51690673828125, 1.641510009765625, 1.76611328125, 1.890716552734375, 2.01531982421875, 2.139923095703125, 2.2645263671875, 2.389129638671875, 2.51373291015625, 2.638336181640625, 2.762939453125, 2.887542724609375, 3.01214599609375, 3.136749267578125, 3.2613525390625, 3.385955810546875, 3.51055908203125, 3.635162353515625, 3.759765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 9.0, 3.0, 14.0, 14.0, 12.0, 11.0, 23.0, 30.0, 39.0, 55.0, 55.0, 70.0, 73.0, 111.0, 154.0, 222.0, 481.0, 1517.0, 5852.0, 38663.0, 798905.0, 181952.0, 15306.0, 2996.0, 867.0, 365.0, 182.0, 137.0, 95.0, 72.0, 71.0, 37.0, 46.0, 23.0, 23.0, 19.0, 14.0, 9.0, 12.0, 7.0, 4.0, 2.0, 1.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.1594219207763672, -0.15368270874023438, -0.14794349670410156, -0.14220428466796875, -0.13646507263183594, -0.13072586059570312, -0.12498664855957031, -0.1192474365234375, -0.11350822448730469, -0.10776901245117188, -0.10202980041503906, -0.09629058837890625, -0.09055137634277344, -0.08481216430664062, -0.07907295227050781, -0.073333740234375, -0.06759452819824219, -0.061855316162109375, -0.05611610412597656, -0.05037689208984375, -0.04463768005371094, -0.038898468017578125, -0.03315925598144531, -0.0274200439453125, -0.021680831909179688, -0.015941619873046875, -0.010202407836914062, -0.00446319580078125, 0.0012760162353515625, 0.007015228271484375, 0.012754440307617188, 0.01849365234375, 0.024232864379882812, 0.029972076416015625, 0.03571128845214844, 0.04145050048828125, 0.04718971252441406, 0.052928924560546875, 0.05866813659667969, 0.0644073486328125, 0.07014656066894531, 0.07588577270507812, 0.08162498474121094, 0.08736419677734375, 0.09310340881347656, 0.09884262084960938, 0.10458183288574219, 0.110321044921875, 0.11606025695800781, 0.12179946899414062, 0.12753868103027344, 0.13327789306640625, 0.13901710510253906, 0.14475631713867188, 0.1504955291748047, 0.1562347412109375, 0.1619739532470703, 0.16771316528320312, 0.17345237731933594, 0.17919158935546875, 0.18493080139160156, 0.19067001342773438, 0.1964092254638672, 0.2021484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 11.0, 10.0, 9.0, 12.0, 10.0, 14.0, 13.0, 23.0, 28.0, 28.0, 25.0, 28.0, 23.0, 45.0, 35.0, 45.0, 33.0, 47.0, 62.0, 51.0, 41.0, 39.0, 44.0, 45.0, 41.0, 30.0, 33.0, 28.0, 30.0, 18.0, 20.0, 9.0, 17.0, 12.0, 7.0, 5.0, 10.0, 5.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.32421875, -4.1739501953125, -4.023681640625, -3.8734130859375, -3.72314453125, -3.5728759765625, -3.422607421875, -3.2723388671875, -3.1220703125, -2.9718017578125, -2.821533203125, -2.6712646484375, -2.52099609375, -2.3707275390625, -2.220458984375, -2.0701904296875, -1.919921875, -1.7696533203125, -1.619384765625, -1.4691162109375, -1.31884765625, -1.1685791015625, -1.018310546875, -0.8680419921875, -0.7177734375, -0.5675048828125, -0.417236328125, -0.2669677734375, -0.11669921875, 0.0335693359375, 0.183837890625, 0.3341064453125, 0.484375, 0.6346435546875, 0.784912109375, 0.9351806640625, 1.08544921875, 1.2357177734375, 1.385986328125, 1.5362548828125, 1.6865234375, 1.8367919921875, 1.987060546875, 2.1373291015625, 2.28759765625, 2.4378662109375, 2.588134765625, 2.7384033203125, 2.888671875, 3.0389404296875, 3.189208984375, 3.3394775390625, 3.48974609375, 3.6400146484375, 3.790283203125, 3.9405517578125, 4.0908203125, 4.2410888671875, 4.391357421875, 4.5416259765625, 4.69189453125, 4.8421630859375, 4.992431640625, 5.1427001953125, 5.29296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 2.0, 11.0, 12.0, 15.0, 20.0, 14.0, 20.0, 52.0, 42.0, 69.0, 80.0, 128.0, 233.0, 379.0, 809.0, 1694.0, 4239.0, 11897.0, 43736.0, 495883.0, 427450.0, 42264.0, 11658.0, 4167.0, 1785.0, 795.0, 410.0, 213.0, 140.0, 97.0, 60.0, 33.0, 32.0, 32.0, 20.0, 17.0, 9.0, 11.0, 3.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003025531768798828, -0.000293094664812088, -0.0002836361527442932, -0.0002741776406764984, -0.0002647191286087036, -0.0002552606165409088, -0.000245802104473114, -0.00023634359240531921, -0.00022688508033752441, -0.00021742656826972961, -0.00020796805620193481, -0.00019850954413414001, -0.00018905103206634521, -0.00017959251999855042, -0.00017013400793075562, -0.00016067549586296082, -0.00015121698379516602, -0.00014175847172737122, -0.00013229995965957642, -0.00012284144759178162, -0.00011338293552398682, -0.00010392442345619202, -9.446591138839722e-05, -8.500739932060242e-05, -7.554888725280762e-05, -6.609037518501282e-05, -5.663186311721802e-05, -4.717335104942322e-05, -3.771483898162842e-05, -2.8256326913833618e-05, -1.879781484603882e-05, -9.339302778244019e-06, 1.1920928955078125e-07, 9.577721357345581e-06, 1.903623342514038e-05, 2.849474549293518e-05, 3.795325756072998e-05, 4.741176962852478e-05, 5.687028169631958e-05, 6.632879376411438e-05, 7.578730583190918e-05, 8.524581789970398e-05, 9.470432996749878e-05, 0.00010416284203529358, 0.00011362135410308838, 0.00012307986617088318, 0.00013253837823867798, 0.00014199689030647278, 0.00015145540237426758, 0.00016091391444206238, 0.00017037242650985718, 0.00017983093857765198, 0.00018928945064544678, 0.00019874796271324158, 0.00020820647478103638, 0.00021766498684883118, 0.00022712349891662598, 0.00023658201098442078, 0.0002460405230522156, 0.0002554990351200104, 0.0002649575471878052, 0.0002744160592556, 0.0002838745713233948, 0.0002933330833911896, 0.0003027915954589844]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 7.0, 2.0, 8.0, 11.0, 15.0, 18.0, 20.0, 37.0, 62.0, 103.0, 227.0, 199.0, 115.0, 53.0, 31.0, 17.0, 28.0, 7.0, 9.0, 8.0, 10.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.546476364135742e-05, -3.3686868846416473e-05, -3.1908974051475525e-05, -3.0131079256534576e-05, -2.8353184461593628e-05, -2.657528966665268e-05, -2.479739487171173e-05, -2.3019500076770782e-05, -2.1241605281829834e-05, -1.9463710486888885e-05, -1.7685815691947937e-05, -1.590792089700699e-05, -1.413002610206604e-05, -1.2352131307125092e-05, -1.0574236512184143e-05, -8.796341717243195e-06, -7.018446922302246e-06, -5.240552127361298e-06, -3.462657332420349e-06, -1.6847625374794006e-06, 9.313225746154785e-08, 1.8710270524024963e-06, 3.648921847343445e-06, 5.426816642284393e-06, 7.204711437225342e-06, 8.98260623216629e-06, 1.0760501027107239e-05, 1.2538395822048187e-05, 1.4316290616989136e-05, 1.6094185411930084e-05, 1.7872080206871033e-05, 1.964997500181198e-05, 2.142786979675293e-05, 2.3205764591693878e-05, 2.4983659386634827e-05, 2.6761554181575775e-05, 2.8539448976516724e-05, 3.0317343771457672e-05, 3.209523856639862e-05, 3.387313336133957e-05, 3.565102815628052e-05, 3.7428922951221466e-05, 3.9206817746162415e-05, 4.098471254110336e-05, 4.276260733604431e-05, 4.454050213098526e-05, 4.631839692592621e-05, 4.809629172086716e-05, 4.9874186515808105e-05, 5.1652081310749054e-05, 5.342997610569e-05, 5.520787090063095e-05, 5.69857656955719e-05, 5.876366049051285e-05, 6.0541555285453796e-05, 6.231945008039474e-05, 6.40973448753357e-05, 6.587523967027664e-05, 6.765313446521759e-05, 6.943102926015854e-05, 7.120892405509949e-05, 7.298681885004044e-05, 7.476471364498138e-05, 7.654260843992233e-05, 7.832050323486328e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 13.0, 15.0, 14.0, 21.0, 36.0, 51.0, 183.0, 1045565.0, 2426.0, 84.0, 49.0, 25.0, 19.0, 9.0, 11.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00421142578125, -0.004096895456314087, -0.003982365131378174, -0.0038678348064422607, -0.0037533044815063477, -0.0036387741565704346, -0.0035242438316345215, -0.0034097135066986084, -0.0032951831817626953, -0.0031806528568267822, -0.003066122531890869, -0.002951592206954956, -0.002837061882019043, -0.00272253155708313, -0.002608001232147217, -0.0024934709072113037, -0.0023789405822753906, -0.0022644102573394775, -0.0021498799324035645, -0.0020353496074676514, -0.0019208192825317383, -0.0018062889575958252, -0.0016917586326599121, -0.001577228307723999, -0.001462697982788086, -0.0013481676578521729, -0.0012336373329162598, -0.0011191070079803467, -0.0010045766830444336, -0.0008900463581085205, -0.0007755160331726074, -0.0006609857082366943, -0.0005464553833007812, -0.00043192505836486816, -0.0003173947334289551, -0.000202864408493042, -8.83340835571289e-05, 2.619624137878418e-05, 0.00014072656631469727, 0.00025525689125061035, 0.00036978721618652344, 0.0004843175411224365, 0.0005988478660583496, 0.0007133781909942627, 0.0008279085159301758, 0.0009424388408660889, 0.001056969165802002, 0.001171499490737915, 0.0012860298156738281, 0.0014005601406097412, 0.0015150904655456543, 0.0016296207904815674, 0.0017441511154174805, 0.0018586814403533936, 0.0019732117652893066, 0.0020877420902252197, 0.002202272415161133, 0.002316802740097046, 0.002431333065032959, 0.002545863389968872, 0.002660393714904785, 0.0027749240398406982, 0.0028894543647766113, 0.0030039846897125244, 0.0031185150146484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 11.0, 11.0, 12.0, 22.0, 31.0, 56.0, 137.0, 405.0, 147.0, 61.0, 36.0, 26.0, 14.0, 9.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014829635620117188, -0.0001442432403564453, -0.00014019012451171875, -0.0001361370086669922, -0.00013208389282226562, -0.00012803077697753906, -0.0001239776611328125, -0.00011992454528808594, -0.00011587142944335938, -0.00011181831359863281, -0.00010776519775390625, -0.00010371208190917969, -9.965896606445312e-05, -9.560585021972656e-05, -9.1552734375e-05, -8.749961853027344e-05, -8.344650268554688e-05, -7.939338684082031e-05, -7.534027099609375e-05, -7.128715515136719e-05, -6.723403930664062e-05, -6.318092346191406e-05, -5.91278076171875e-05, -5.507469177246094e-05, -5.1021575927734375e-05, -4.696846008300781e-05, -4.291534423828125e-05, -3.886222839355469e-05, -3.4809112548828125e-05, -3.075599670410156e-05, -2.6702880859375e-05, -2.2649765014648438e-05, -1.8596649169921875e-05, -1.4543533325195312e-05, -1.049041748046875e-05, -6.4373016357421875e-06, -2.384185791015625e-06, 1.6689300537109375e-06, 5.7220458984375e-06, 9.775161743164062e-06, 1.3828277587890625e-05, 1.7881393432617188e-05, 2.193450927734375e-05, 2.5987625122070312e-05, 3.0040740966796875e-05, 3.409385681152344e-05, 3.814697265625e-05, 4.220008850097656e-05, 4.6253204345703125e-05, 5.030632019042969e-05, 5.435943603515625e-05, 5.841255187988281e-05, 6.246566772460938e-05, 6.651878356933594e-05, 7.05718994140625e-05, 7.462501525878906e-05, 7.867813110351562e-05, 8.273124694824219e-05, 8.678436279296875e-05, 9.083747863769531e-05, 9.489059448242188e-05, 9.894371032714844e-05, 0.000102996826171875, 0.00010704994201660156, 0.00011110305786132812]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 10.0, 42.0, 536.0, 418.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.748734951019287, -4.930497169494629, -4.112259387969971, -3.2940213680267334, -2.475783586502075, -1.657545566558838, -0.8393077850341797, -0.021070003509521484, 0.7971677780151367, 1.615405559539795, 2.433643341064453, 3.2518813610076904, 4.0701189041137695, 4.888357162475586, 5.706594944000244, 6.524832725524902, 7.3430705070495605, 8.161308288574219, 8.979546546936035, 9.797783851623535, 10.616022109985352, 11.434259414672852, 12.252497673034668, 13.070735931396484, 13.888973236083984, 14.7072114944458, 15.5254487991333, 16.343687057495117, 17.161924362182617, 17.98016357421875, 18.79840087890625, 19.61663818359375, 20.434877395629883, 21.253114700317383, 22.071353912353516, 22.889591217041016, 23.707828521728516, 24.526065826416016, 25.34430503845215, 26.16254234313965, 26.98077964782715, 27.79901695251465, 28.61725616455078, 29.43549346923828, 30.25373077392578, 31.07196807861328, 31.890207290649414, 32.70844268798828, 33.52668380737305, 34.34492111206055, 35.16315841674805, 35.98139572143555, 36.79963684082031, 37.61787414550781, 38.43611145019531, 39.25434875488281, 40.07258605957031, 40.89082336425781, 41.70906066894531, 42.52729797363281, 43.34553909301758, 44.16377639770508, 44.98201370239258, 45.80025100708008, 46.61848831176758]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 10.0, 8.0, 12.0, 13.0, 17.0, 31.0, 41.0, 43.0, 47.0, 61.0, 69.0, 73.0, 64.0, 64.0, 78.0, 54.0, 66.0, 61.0, 41.0, 29.0, 34.0, 20.0, 18.0, 13.0, 10.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.346042156219482, -4.228121280670166, -4.11020040512085, -3.992279529571533, -3.874358654022217, -3.7564377784729004, -3.638517141342163, -3.5205962657928467, -3.4026753902435303, -3.284754514694214, -3.1668336391448975, -3.048912763595581, -2.9309921264648438, -2.8130712509155273, -2.695150375366211, -2.5772294998168945, -2.459308624267578, -2.3413877487182617, -2.2234668731689453, -2.105545997619629, -1.987625241279602, -1.8697043657302856, -1.7517836093902588, -1.6338627338409424, -1.515941858291626, -1.3980209827423096, -1.2801001071929932, -1.1621793508529663, -1.04425847530365, -0.9263375997543335, -0.8084167838096619, -0.6904959678649902, -0.5725748538970947, -0.4546540081501007, -0.3367331624031067, -0.21881231665611267, -0.10089147090911865, 0.017029404640197754, 0.13495022058486938, 0.252871036529541, 0.3707919120788574, 0.48871275782585144, 0.6066336035728455, 0.7245544195175171, 0.8424752950668335, 0.9603961706161499, 1.0783169269561768, 1.1962378025054932, 1.3141586780548096, 1.432079553604126, 1.5500004291534424, 1.6679211854934692, 1.7858420610427856, 1.903762936592102, 2.021683692932129, 2.1396045684814453, 2.2575254440307617, 2.375446319580078, 2.4933671951293945, 2.611288070678711, 2.7292089462280273, 2.8471298217773438, 2.965050458908081, 3.0829713344573975, 3.200892210006714]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 4.0, 12.0, 16.0, 58.0, 88.0, 186.0, 438.0, 1361.0, 7268.0, 292156.0, 733491.0, 10812.0, 1729.0, 475.0, 212.0, 111.0, 50.0, 22.0, 23.0, 12.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.7733154296875, -8.554443359375, -8.3355712890625, -8.11669921875, -7.8978271484375, -7.678955078125, -7.4600830078125, -7.2412109375, -7.0223388671875, -6.803466796875, -6.5845947265625, -6.36572265625, -6.1468505859375, -5.927978515625, -5.7091064453125, -5.490234375, -5.2713623046875, -5.052490234375, -4.8336181640625, -4.61474609375, -4.3958740234375, -4.177001953125, -3.9581298828125, -3.7392578125, -3.5203857421875, -3.301513671875, -3.0826416015625, -2.86376953125, -2.6448974609375, -2.426025390625, -2.2071533203125, -1.98828125, -1.7694091796875, -1.550537109375, -1.3316650390625, -1.11279296875, -0.8939208984375, -0.675048828125, -0.4561767578125, -0.2373046875, -0.0184326171875, 0.200439453125, 0.4193115234375, 0.63818359375, 0.8570556640625, 1.075927734375, 1.2947998046875, 1.513671875, 1.7325439453125, 1.951416015625, 2.1702880859375, 2.38916015625, 2.6080322265625, 2.826904296875, 3.0457763671875, 3.2646484375, 3.4835205078125, 3.702392578125, 3.9212646484375, 4.14013671875, 4.3590087890625, 4.577880859375, 4.7967529296875, 5.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 4.0, 20.0, 26.0, 36.0, 57.0, 65.0, 67.0, 92.0, 103.0, 101.0, 99.0, 78.0, 72.0, 53.0, 34.0, 34.0, 29.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.408203125, -3.321258544921875, -3.23431396484375, -3.147369384765625, -3.0604248046875, -2.973480224609375, -2.88653564453125, -2.799591064453125, -2.712646484375, -2.625701904296875, -2.53875732421875, -2.451812744140625, -2.3648681640625, -2.277923583984375, -2.19097900390625, -2.104034423828125, -2.01708984375, -1.930145263671875, -1.84320068359375, -1.756256103515625, -1.6693115234375, -1.582366943359375, -1.49542236328125, -1.408477783203125, -1.321533203125, -1.234588623046875, -1.14764404296875, -1.060699462890625, -0.9737548828125, -0.886810302734375, -0.79986572265625, -0.712921142578125, -0.6259765625, -0.539031982421875, -0.45208740234375, -0.365142822265625, -0.2781982421875, -0.191253662109375, -0.10430908203125, -0.017364501953125, 0.069580078125, 0.156524658203125, 0.24346923828125, 0.330413818359375, 0.4173583984375, 0.504302978515625, 0.59124755859375, 0.678192138671875, 0.76513671875, 0.852081298828125, 0.93902587890625, 1.025970458984375, 1.1129150390625, 1.199859619140625, 1.28680419921875, 1.373748779296875, 1.460693359375, 1.547637939453125, 1.63458251953125, 1.721527099609375, 1.8084716796875, 1.895416259765625, 1.98236083984375, 2.069305419921875, 2.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 6.0, 9.0, 4.0, 8.0, 12.0, 19.0, 19.0, 25.0, 28.0, 41.0, 63.0, 84.0, 149.0, 487.0, 1044654.0, 2319.0, 197.0, 112.0, 58.0, 53.0, 34.0, 22.0, 28.0, 21.0, 10.0, 11.0, 5.0, 7.0, 9.0, 4.0, 3.0, 7.0, 6.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-30.1875, -29.171875, -28.15625, -27.140625, -26.125, -25.109375, -24.09375, -23.078125, -22.0625, -21.046875, -20.03125, -19.015625, -18.0, -16.984375, -15.96875, -14.953125, -13.9375, -12.921875, -11.90625, -10.890625, -9.875, -8.859375, -7.84375, -6.828125, -5.8125, -4.796875, -3.78125, -2.765625, -1.75, -0.734375, 0.28125, 1.296875, 2.3125, 3.328125, 4.34375, 5.359375, 6.375, 7.390625, 8.40625, 9.421875, 10.4375, 11.453125, 12.46875, 13.484375, 14.5, 15.515625, 16.53125, 17.546875, 18.5625, 19.578125, 20.59375, 21.609375, 22.625, 23.640625, 24.65625, 25.671875, 26.6875, 27.703125, 28.71875, 29.734375, 30.75, 31.765625, 32.78125, 33.796875, 34.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 4.0, 10.0, 17.0, 17.0, 17.0, 22.0, 28.0, 34.0, 27.0, 37.0, 54.0, 40.0, 53.0, 32.0, 46.0, 56.0, 57.0, 49.0, 41.0, 58.0, 45.0, 39.0, 31.0, 29.0, 14.0, 17.0, 23.0, 20.0, 16.0, 5.0, 2.0, 9.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.119140625, -2.048828125, -1.978515625, -1.908203125, -1.837890625, -1.767578125, -1.697265625, -1.626953125, -1.556640625, -1.486328125, -1.416015625, -1.345703125, -1.275390625, -1.205078125, -1.134765625, -1.064453125, -0.994140625, -0.923828125, -0.853515625, -0.783203125, -0.712890625, -0.642578125, -0.572265625, -0.501953125, -0.431640625, -0.361328125, -0.291015625, -0.220703125, -0.150390625, -0.080078125, -0.009765625, 0.060546875, 0.130859375, 0.201171875, 0.271484375, 0.341796875, 0.412109375, 0.482421875, 0.552734375, 0.623046875, 0.693359375, 0.763671875, 0.833984375, 0.904296875, 0.974609375, 1.044921875, 1.115234375, 1.185546875, 1.255859375, 1.326171875, 1.396484375, 1.466796875, 1.537109375, 1.607421875, 1.677734375, 1.748046875, 1.818359375, 1.888671875, 1.958984375, 2.029296875, 2.099609375, 2.169921875, 2.240234375, 2.310546875, 2.380859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 8.0, 6.0, 16.0, 27.0, 103.0, 1047670.0, 622.0, 42.0, 18.0, 14.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.03125, -49.6787109375, -48.326171875, -46.9736328125, -45.62109375, -44.2685546875, -42.916015625, -41.5634765625, -40.2109375, -38.8583984375, -37.505859375, -36.1533203125, -34.80078125, -33.4482421875, -32.095703125, -30.7431640625, -29.390625, -28.0380859375, -26.685546875, -25.3330078125, -23.98046875, -22.6279296875, -21.275390625, -19.9228515625, -18.5703125, -17.2177734375, -15.865234375, -14.5126953125, -13.16015625, -11.8076171875, -10.455078125, -9.1025390625, -7.75, -6.3974609375, -5.044921875, -3.6923828125, -2.33984375, -0.9873046875, 0.365234375, 1.7177734375, 3.0703125, 4.4228515625, 5.775390625, 7.1279296875, 8.48046875, 9.8330078125, 11.185546875, 12.5380859375, 13.890625, 15.2431640625, 16.595703125, 17.9482421875, 19.30078125, 20.6533203125, 22.005859375, 23.3583984375, 24.7109375, 26.0634765625, 27.416015625, 28.7685546875, 30.12109375, 31.4736328125, 32.826171875, 34.1787109375, 35.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 21.0, 32.0, 190.0, 685.0, 39.0, 25.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00054931640625, -0.0004998445510864258, -0.00045037269592285156, -0.00040090084075927734, -0.0003514289855957031, -0.0003019571304321289, -0.0002524852752685547, -0.00020301342010498047, -0.00015354156494140625, -0.00010406970977783203, -5.459785461425781e-05, -5.125999450683594e-06, 4.4345855712890625e-05, 9.381771087646484e-05, 0.00014328956604003906, 0.00019276142120361328, 0.0002422332763671875, 0.0002917051315307617, 0.00034117698669433594, 0.00039064884185791016, 0.0004401206970214844, 0.0004895925521850586, 0.0005390644073486328, 0.000588536262512207, 0.0006380081176757812, 0.0006874799728393555, 0.0007369518280029297, 0.0007864236831665039, 0.0008358955383300781, 0.0008853673934936523, 0.0009348392486572266, 0.0009843111038208008, 0.001033782958984375, 0.0010832548141479492, 0.0011327266693115234, 0.0011821985244750977, 0.0012316703796386719, 0.001281142234802246, 0.0013306140899658203, 0.0013800859451293945, 0.0014295578002929688, 0.001479029655456543, 0.0015285015106201172, 0.0015779733657836914, 0.0016274452209472656, 0.0016769170761108398, 0.001726388931274414, 0.0017758607864379883, 0.0018253326416015625, 0.0018748044967651367, 0.001924276351928711, 0.001973748207092285, 0.0020232200622558594, 0.0020726919174194336, 0.002122163772583008, 0.002171635627746582, 0.0022211074829101562, 0.0022705793380737305, 0.0023200511932373047, 0.002369523048400879, 0.002418994903564453, 0.0024684667587280273, 0.0025179386138916016, 0.0025674104690551758, 0.00261688232421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 10.0, 18.0, 21.0, 115.0, 1048240.0, 86.0, 19.0, 25.0, 12.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.6875, -68.2880859375, -65.888671875, -63.4892578125, -61.08984375, -58.6904296875, -56.291015625, -53.8916015625, -51.4921875, -49.0927734375, -46.693359375, -44.2939453125, -41.89453125, -39.4951171875, -37.095703125, -34.6962890625, -32.296875, -29.8974609375, -27.498046875, -25.0986328125, -22.69921875, -20.2998046875, -17.900390625, -15.5009765625, -13.1015625, -10.7021484375, -8.302734375, -5.9033203125, -3.50390625, -1.1044921875, 1.294921875, 3.6943359375, 6.09375, 8.4931640625, 10.892578125, 13.2919921875, 15.69140625, 18.0908203125, 20.490234375, 22.8896484375, 25.2890625, 27.6884765625, 30.087890625, 32.4873046875, 34.88671875, 37.2861328125, 39.685546875, 42.0849609375, 44.484375, 46.8837890625, 49.283203125, 51.6826171875, 54.08203125, 56.4814453125, 58.880859375, 61.2802734375, 63.6796875, 66.0791015625, 68.478515625, 70.8779296875, 73.27734375, 75.6767578125, 78.076171875, 80.4755859375, 82.875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 13.0, 22.0, 40.0, 714.0, 127.0, 28.0, 19.0, 15.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.929931640625, -2.82861328125, -2.727294921875, -2.6259765625, -2.524658203125, -2.42333984375, -2.322021484375, -2.220703125, -2.119384765625, -2.01806640625, -1.916748046875, -1.8154296875, -1.714111328125, -1.61279296875, -1.511474609375, -1.41015625, -1.308837890625, -1.20751953125, -1.106201171875, -1.0048828125, -0.903564453125, -0.80224609375, -0.700927734375, -0.599609375, -0.498291015625, -0.39697265625, -0.295654296875, -0.1943359375, -0.093017578125, 0.00830078125, 0.109619140625, 0.2109375, 0.312255859375, 0.41357421875, 0.514892578125, 0.6162109375, 0.717529296875, 0.81884765625, 0.920166015625, 1.021484375, 1.122802734375, 1.22412109375, 1.325439453125, 1.4267578125, 1.528076171875, 1.62939453125, 1.730712890625, 1.83203125, 1.933349609375, 2.03466796875, 2.135986328125, 2.2373046875, 2.338623046875, 2.43994140625, 2.541259765625, 2.642578125, 2.743896484375, 2.84521484375, 2.946533203125, 3.0478515625, 3.149169921875, 3.25048828125, 3.351806640625, 3.453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1020.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5012686252593994, 2.1786506175994873, 6.858570098876953, 11.53848934173584, 16.218408584594727, 20.89832878112793, 25.5782470703125, 30.25816535949707, 34.93808364868164, 39.618003845214844, 44.29792022705078, 48.977840423583984, 53.65776062011719, 58.33768081665039, 63.017601013183594, 67.69751739501953, 72.37744140625, 77.05735778808594, 81.7372817993164, 86.41719818115234, 91.09712219238281, 95.77703857421875, 100.45695495605469, 105.13687133789062, 109.8167953491211, 114.49671173095703, 119.1766357421875, 123.85655212402344, 128.53646850585938, 133.21640014648438, 137.8963165283203, 142.57623291015625, 147.25613403320312, 151.93605041503906, 156.615966796875, 161.2958984375, 165.97581481933594, 170.65573120117188, 175.3356475830078, 180.01556396484375, 184.69549560546875, 189.3754119873047, 194.05532836914062, 198.73526000976562, 203.41517639160156, 208.0950927734375, 212.77500915527344, 217.45492553710938, 222.1348419189453, 226.81475830078125, 231.4946746826172, 236.1746063232422, 240.85452270507812, 245.53443908691406, 250.21435546875, 254.89427185058594, 259.5741882324219, 264.2541198730469, 268.93402099609375, 273.61395263671875, 278.2938537597656, 282.9737854003906, 287.6537170410156, 292.3336181640625, 297.0135498046875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 12.0, 24.0, 41.0, 68.0, 82.0, 115.0, 123.0, 119.0, 116.0, 101.0, 70.0, 66.0, 27.0, 22.0, 14.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2097671031951904, -2.9125418663024902, -2.615316867828369, -2.318091630935669, -2.0208663940429688, -1.7236413955688477, -1.4264161586761475, -1.1291911602020264, -0.8319659233093262, -0.5347408056259155, -0.2375156283378601, 0.05970954895019531, 0.35693466663360596, 0.6541597843170166, 0.9513850212097168, 1.248610019683838, 1.545835256576538, 1.8430603742599487, 2.1402854919433594, 2.4375107288360596, 2.7347359657287598, 3.031960964202881, 3.329186201095581, 3.626411199569702, 3.9236364364624023, 4.220861434936523, 4.518086910247803, 4.815311908721924, 5.112536907196045, 5.409762382507324, 5.706987380981445, 6.004212379455566, 6.301438331604004, 6.598663330078125, 6.895888805389404, 7.193113803863525, 7.4903388023376465, 7.787564277648926, 8.084789276123047, 8.382014274597168, 8.679239273071289, 8.97646427154541, 9.273689270019531, 9.570915222167969, 9.86814022064209, 10.165365219116211, 10.462590217590332, 10.759815216064453, 11.05704116821289, 11.354266166687012, 11.651491165161133, 11.94871711730957, 12.245942115783691, 12.543167114257812, 12.840392112731934, 13.137617111206055, 13.434842109680176, 13.732067108154297, 14.029292106628418, 14.326517105102539, 14.623743057250977, 14.920968055725098, 15.218193054199219, 15.51541805267334, 15.812643051147461]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 17.0, 17.0, 34.0, 98.0, 199.0, 431.0, 1520.0, 4186231.0, 4532.0, 662.0, 297.0, 131.0, 63.0, 26.0, 15.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.03125, -31.3592529296875, -30.687255859375, -30.0152587890625, -29.34326171875, -28.6712646484375, -27.999267578125, -27.3272705078125, -26.6552734375, -25.9832763671875, -25.311279296875, -24.6392822265625, -23.96728515625, -23.2952880859375, -22.623291015625, -21.9512939453125, -21.279296875, -20.6072998046875, -19.935302734375, -19.2633056640625, -18.59130859375, -17.9193115234375, -17.247314453125, -16.5753173828125, -15.9033203125, -15.2313232421875, -14.559326171875, -13.8873291015625, -13.21533203125, -12.5433349609375, -11.871337890625, -11.1993408203125, -10.52734375, -9.8553466796875, -9.183349609375, -8.5113525390625, -7.83935546875, -7.1673583984375, -6.495361328125, -5.8233642578125, -5.1513671875, -4.4793701171875, -3.807373046875, -3.1353759765625, -2.46337890625, -1.7913818359375, -1.119384765625, -0.4473876953125, 0.224609375, 0.8966064453125, 1.568603515625, 2.2406005859375, 2.91259765625, 3.5845947265625, 4.256591796875, 4.9285888671875, 5.6005859375, 6.2725830078125, 6.944580078125, 7.6165771484375, 8.28857421875, 8.9605712890625, 9.632568359375, 10.3045654296875, 10.9765625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 11.0, 42.0, 88.0, 139.0, 158.0, 187.0, 175.0, 98.0, 59.0, 23.0, 15.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.826171875, -2.7479248046875, -2.669677734375, -2.5914306640625, -2.51318359375, -2.4349365234375, -2.356689453125, -2.2784423828125, -2.2001953125, -2.1219482421875, -2.043701171875, -1.9654541015625, -1.88720703125, -1.8089599609375, -1.730712890625, -1.6524658203125, -1.57421875, -1.4959716796875, -1.417724609375, -1.3394775390625, -1.26123046875, -1.1829833984375, -1.104736328125, -1.0264892578125, -0.9482421875, -0.8699951171875, -0.791748046875, -0.7135009765625, -0.63525390625, -0.5570068359375, -0.478759765625, -0.4005126953125, -0.322265625, -0.2440185546875, -0.165771484375, -0.0875244140625, -0.00927734375, 0.0689697265625, 0.147216796875, 0.2254638671875, 0.3037109375, 0.3819580078125, 0.460205078125, 0.5384521484375, 0.61669921875, 0.6949462890625, 0.773193359375, 0.8514404296875, 0.9296875, 1.0079345703125, 1.086181640625, 1.1644287109375, 1.24267578125, 1.3209228515625, 1.399169921875, 1.4774169921875, 1.5556640625, 1.6339111328125, 1.712158203125, 1.7904052734375, 1.86865234375, 1.9468994140625, 2.025146484375, 2.1033935546875, 2.181640625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 15.0, 66.0, 4190758.0, 3313.0, 43.0, 12.0, 13.0, 13.0, 7.0, 4.0, 5.0, 1.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-69.3125, -67.3251953125, -65.337890625, -63.3505859375, -61.36328125, -59.3759765625, -57.388671875, -55.4013671875, -53.4140625, -51.4267578125, -49.439453125, -47.4521484375, -45.46484375, -43.4775390625, -41.490234375, -39.5029296875, -37.515625, -35.5283203125, -33.541015625, -31.5537109375, -29.56640625, -27.5791015625, -25.591796875, -23.6044921875, -21.6171875, -19.6298828125, -17.642578125, -15.6552734375, -13.66796875, -11.6806640625, -9.693359375, -7.7060546875, -5.71875, -3.7314453125, -1.744140625, 0.2431640625, 2.23046875, 4.2177734375, 6.205078125, 8.1923828125, 10.1796875, 12.1669921875, 14.154296875, 16.1416015625, 18.12890625, 20.1162109375, 22.103515625, 24.0908203125, 26.078125, 28.0654296875, 30.052734375, 32.0400390625, 34.02734375, 36.0146484375, 38.001953125, 39.9892578125, 41.9765625, 43.9638671875, 45.951171875, 47.9384765625, 49.92578125, 51.9130859375, 53.900390625, 55.8876953125, 57.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 314.0, 3673.0, 19.0, 17.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5009765625, -1.458221435546875, -1.41546630859375, -1.372711181640625, -1.3299560546875, -1.287200927734375, -1.24444580078125, -1.201690673828125, -1.158935546875, -1.116180419921875, -1.07342529296875, -1.030670166015625, -0.9879150390625, -0.945159912109375, -0.90240478515625, -0.859649658203125, -0.81689453125, -0.774139404296875, -0.73138427734375, -0.688629150390625, -0.6458740234375, -0.603118896484375, -0.56036376953125, -0.517608642578125, -0.474853515625, -0.432098388671875, -0.38934326171875, -0.346588134765625, -0.3038330078125, -0.261077880859375, -0.21832275390625, -0.175567626953125, -0.1328125, -0.090057373046875, -0.04730224609375, -0.004547119140625, 0.0382080078125, 0.080963134765625, 0.12371826171875, 0.166473388671875, 0.209228515625, 0.251983642578125, 0.29473876953125, 0.337493896484375, 0.3802490234375, 0.423004150390625, 0.46575927734375, 0.508514404296875, 0.55126953125, 0.594024658203125, 0.63677978515625, 0.679534912109375, 0.7222900390625, 0.765045166015625, 0.80780029296875, 0.850555419921875, 0.893310546875, 0.936065673828125, 0.97882080078125, 1.021575927734375, 1.0643310546875, 1.107086181640625, 1.14984130859375, 1.192596435546875, 1.2353515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 6.0, 10.0, 15.0, 23.0, 44.0, 66.0, 110.0, 133.0, 189.0, 164.0, 88.0, 69.0, 32.0, 23.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1287455558776855, -1.054998755455017, -0.9812518358230591, -0.9075050354003906, -0.8337581157684326, -0.7600113153457642, -0.6862644553184509, -0.6125175952911377, -0.5387707352638245, -0.46502387523651123, -0.391277015209198, -0.31753018498420715, -0.24378332495689392, -0.1700364649295807, -0.09628963470458984, -0.02254277467727661, 0.05120408535003662, 0.12495093792676926, 0.1986977905035019, 0.27244463562965393, 0.34619149565696716, 0.4199383556842804, 0.49368518590927124, 0.5674320459365845, 0.6411789059638977, 0.7149257659912109, 0.7886726260185242, 0.8624194860458374, 0.9361662864685059, 1.0099132061004639, 1.0836600065231323, 1.1574068069458008, 1.2311537265777588, 1.3049005270004272, 1.3786474466323853, 1.4523942470550537, 1.5261411666870117, 1.5998879671096802, 1.6736347675323486, 1.7473816871643066, 1.8211286067962646, 1.894875407218933, 1.9686223268508911, 2.0423691272735596, 2.1161160469055176, 2.1898629665374756, 2.2636096477508545, 2.3373565673828125, 2.4111032485961914, 2.4848501682281494, 2.5585968494415283, 2.6323437690734863, 2.7060906887054443, 2.7798376083374023, 2.8535842895507812, 2.9273312091827393, 3.0010781288146973, 3.0748250484466553, 3.148571729660034, 3.222318649291992, 3.29606556892395, 3.369812488555908, 3.443559169769287, 3.517306089401245, 3.591053009033203]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 8.0, 15.0, 19.0, 29.0, 34.0, 59.0, 49.0, 64.0, 70.0, 84.0, 75.0, 110.0, 63.0, 69.0, 54.0, 34.0, 49.0, 32.0, 38.0, 15.0, 12.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.7328779697418213, -2.6718125343322754, -2.6107470989227295, -2.5496816635131836, -2.4886162281036377, -2.427550792694092, -2.366485357284546, -2.305419921875, -2.244354486465454, -2.183289051055908, -2.1222236156463623, -2.0611581802368164, -2.0000927448272705, -1.9390273094177246, -1.8779618740081787, -1.8168964385986328, -1.755831003189087, -1.694765567779541, -1.6337001323699951, -1.5726346969604492, -1.5115692615509033, -1.4505038261413574, -1.3894383907318115, -1.3283729553222656, -1.2673074007034302, -1.2062419652938843, -1.1451765298843384, -1.0841110944747925, -1.0230456590652466, -0.9619802236557007, -0.9009147882461548, -0.8398493528366089, -0.778783917427063, -0.7177184820175171, -0.6566530466079712, -0.5955876111984253, -0.5345221757888794, -0.4734567105770111, -0.4123912751674652, -0.3513258397579193, -0.2902604043483734, -0.22919496893882751, -0.16812953352928162, -0.10706408321857452, -0.045998647809028625, 0.015066802501678467, 0.07613223791122437, 0.13719767332077026, 0.19826310873031616, 0.25932854413986206, 0.32039397954940796, 0.38145941495895386, 0.44252485036849976, 0.5035903453826904, 0.5646557807922363, 0.6257212162017822, 0.6867866516113281, 0.747852087020874, 0.8089175224304199, 0.8699829578399658, 0.9310483932495117, 0.9921138286590576, 1.0531792640686035, 1.1142446994781494, 1.1753101348876953]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 11.0, 16.0, 22.0, 33.0, 59.0, 239.0, 737.0, 3144.0, 57078.0, 977582.0, 7683.0, 1354.0, 357.0, 106.0, 53.0, 19.0, 13.0, 6.0, 3.0, 5.0, 3.0, 9.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9873046875, -0.9546356201171875, -0.921966552734375, -0.8892974853515625, -0.85662841796875, -0.8239593505859375, -0.791290283203125, -0.7586212158203125, -0.7259521484375, -0.6932830810546875, -0.660614013671875, -0.6279449462890625, -0.59527587890625, -0.5626068115234375, -0.529937744140625, -0.4972686767578125, -0.464599609375, -0.4319305419921875, -0.399261474609375, -0.3665924072265625, -0.33392333984375, -0.3012542724609375, -0.268585205078125, -0.2359161376953125, -0.2032470703125, -0.1705780029296875, -0.137908935546875, -0.1052398681640625, -0.07257080078125, -0.0399017333984375, -0.007232666015625, 0.0254364013671875, 0.05810546875, 0.0907745361328125, 0.123443603515625, 0.1561126708984375, 0.18878173828125, 0.2214508056640625, 0.254119873046875, 0.2867889404296875, 0.3194580078125, 0.3521270751953125, 0.384796142578125, 0.4174652099609375, 0.45013427734375, 0.4828033447265625, 0.515472412109375, 0.5481414794921875, 0.580810546875, 0.6134796142578125, 0.646148681640625, 0.6788177490234375, 0.71148681640625, 0.7441558837890625, 0.776824951171875, 0.8094940185546875, 0.8421630859375, 0.8748321533203125, 0.907501220703125, 0.9401702880859375, 0.97283935546875, 1.0055084228515625, 1.038177490234375, 1.0708465576171875, 1.103515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 13.0, 25.0, 45.0, 101.0, 142.0, 184.0, 180.0, 138.0, 93.0, 49.0, 24.0, 9.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6826171875, -1.6023712158203125, -1.522125244140625, -1.4418792724609375, -1.36163330078125, -1.2813873291015625, -1.201141357421875, -1.1208953857421875, -1.0406494140625, -0.9604034423828125, -0.880157470703125, -0.7999114990234375, -0.71966552734375, -0.6394195556640625, -0.559173583984375, -0.4789276123046875, -0.398681640625, -0.3184356689453125, -0.238189697265625, -0.1579437255859375, -0.07769775390625, 0.0025482177734375, 0.082794189453125, 0.1630401611328125, 0.2432861328125, 0.3235321044921875, 0.403778076171875, 0.4840240478515625, 0.56427001953125, 0.6445159912109375, 0.724761962890625, 0.8050079345703125, 0.88525390625, 0.9654998779296875, 1.045745849609375, 1.1259918212890625, 1.20623779296875, 1.2864837646484375, 1.366729736328125, 1.4469757080078125, 1.5272216796875, 1.6074676513671875, 1.687713623046875, 1.7679595947265625, 1.84820556640625, 1.9284515380859375, 2.008697509765625, 2.0889434814453125, 2.169189453125, 2.2494354248046875, 2.329681396484375, 2.4099273681640625, 2.49017333984375, 2.5704193115234375, 2.650665283203125, 2.7309112548828125, 2.8111572265625, 2.8914031982421875, 2.971649169921875, 3.0518951416015625, 3.13214111328125, 3.2123870849609375, 3.292633056640625, 3.3728790283203125, 3.453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 13.0, 17.0, 21.0, 30.0, 39.0, 64.0, 64.0, 99.0, 144.0, 188.0, 330.0, 833.0, 3540.0, 27723.0, 825544.0, 176072.0, 10602.0, 1883.0, 505.0, 256.0, 139.0, 120.0, 65.0, 69.0, 58.0, 34.0, 24.0, 18.0, 16.0, 15.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.085693359375, -0.08315753936767578, -0.08062171936035156, -0.07808589935302734, -0.07555007934570312, -0.0730142593383789, -0.07047843933105469, -0.06794261932373047, -0.06540679931640625, -0.06287097930908203, -0.06033515930175781, -0.057799339294433594, -0.055263519287109375, -0.052727699279785156, -0.05019187927246094, -0.04765605926513672, -0.0451202392578125, -0.04258441925048828, -0.04004859924316406, -0.037512779235839844, -0.034976959228515625, -0.032441139221191406, -0.029905319213867188, -0.02736949920654297, -0.02483367919921875, -0.02229785919189453, -0.019762039184570312, -0.017226219177246094, -0.014690399169921875, -0.012154579162597656, -0.009618759155273438, -0.007082939147949219, -0.004547119140625, -0.0020112991333007812, 0.0005245208740234375, 0.0030603408813476562, 0.005596160888671875, 0.008131980895996094, 0.010667800903320312, 0.013203620910644531, 0.01573944091796875, 0.01827526092529297, 0.020811080932617188, 0.023346900939941406, 0.025882720947265625, 0.028418540954589844, 0.030954360961914062, 0.03349018096923828, 0.0360260009765625, 0.03856182098388672, 0.04109764099121094, 0.043633460998535156, 0.046169281005859375, 0.048705101013183594, 0.05124092102050781, 0.05377674102783203, 0.05631256103515625, 0.05884838104248047, 0.06138420104980469, 0.0639200210571289, 0.06645584106445312, 0.06899166107177734, 0.07152748107910156, 0.07406330108642578, 0.07659912109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 11.0, 13.0, 17.0, 21.0, 28.0, 31.0, 32.0, 39.0, 44.0, 55.0, 45.0, 46.0, 61.0, 51.0, 50.0, 54.0, 39.0, 69.0, 51.0, 26.0, 44.0, 20.0, 32.0, 21.0, 20.0, 15.0, 11.0, 12.0, 14.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.248046875, -2.1815185546875, -2.114990234375, -2.0484619140625, -1.98193359375, -1.9154052734375, -1.848876953125, -1.7823486328125, -1.7158203125, -1.6492919921875, -1.582763671875, -1.5162353515625, -1.44970703125, -1.3831787109375, -1.316650390625, -1.2501220703125, -1.18359375, -1.1170654296875, -1.050537109375, -0.9840087890625, -0.91748046875, -0.8509521484375, -0.784423828125, -0.7178955078125, -0.6513671875, -0.5848388671875, -0.518310546875, -0.4517822265625, -0.38525390625, -0.3187255859375, -0.252197265625, -0.1856689453125, -0.119140625, -0.0526123046875, 0.013916015625, 0.0804443359375, 0.14697265625, 0.2135009765625, 0.280029296875, 0.3465576171875, 0.4130859375, 0.4796142578125, 0.546142578125, 0.6126708984375, 0.67919921875, 0.7457275390625, 0.812255859375, 0.8787841796875, 0.9453125, 1.0118408203125, 1.078369140625, 1.1448974609375, 1.21142578125, 1.2779541015625, 1.344482421875, 1.4110107421875, 1.4775390625, 1.5440673828125, 1.610595703125, 1.6771240234375, 1.74365234375, 1.8101806640625, 1.876708984375, 1.9432373046875, 2.009765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 13.0, 12.0, 13.0, 9.0, 25.0, 51.0, 61.0, 97.0, 149.0, 206.0, 280.0, 495.0, 692.0, 1115.0, 1911.0, 3203.0, 5604.0, 10396.0, 20983.0, 46439.0, 125360.0, 541671.0, 175863.0, 60594.0, 25087.0, 12222.0, 6430.0, 3669.0, 2127.0, 1333.0, 819.0, 503.0, 349.0, 257.0, 175.0, 100.0, 89.0, 48.0, 38.0, 21.0, 19.0, 8.0, 5.0, 11.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002467632293701172, -0.00023870915174484253, -0.00023065507411956787, -0.0002226009964942932, -0.00021454691886901855, -0.0002064928412437439, -0.00019843876361846924, -0.00019038468599319458, -0.00018233060836791992, -0.00017427653074264526, -0.0001662224531173706, -0.00015816837549209595, -0.0001501142978668213, -0.00014206022024154663, -0.00013400614261627197, -0.00012595206499099731, -0.00011789798736572266, -0.000109843909740448, -0.00010178983211517334, -9.373575448989868e-05, -8.568167686462402e-05, -7.762759923934937e-05, -6.957352161407471e-05, -6.151944398880005e-05, -5.346536636352539e-05, -4.541128873825073e-05, -3.7357211112976074e-05, -2.9303133487701416e-05, -2.1249055862426758e-05, -1.31949782371521e-05, -5.140900611877441e-06, 2.913177013397217e-06, 1.0967254638671875e-05, 1.9021332263946533e-05, 2.707540988922119e-05, 3.512948751449585e-05, 4.318356513977051e-05, 5.1237642765045166e-05, 5.9291720390319824e-05, 6.734579801559448e-05, 7.539987564086914e-05, 8.34539532661438e-05, 9.150803089141846e-05, 9.956210851669312e-05, 0.00010761618614196777, 0.00011567026376724243, 0.0001237243413925171, 0.00013177841901779175, 0.0001398324966430664, 0.00014788657426834106, 0.00015594065189361572, 0.00016399472951889038, 0.00017204880714416504, 0.0001801028847694397, 0.00018815696239471436, 0.00019621104001998901, 0.00020426511764526367, 0.00021231919527053833, 0.000220373272895813, 0.00022842735052108765, 0.0002364814281463623, 0.00024453550577163696, 0.0002525895833969116, 0.0002606436610221863, 0.00026869773864746094]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 8.0, 2.0, 5.0, 5.0, 7.0, 12.0, 14.0, 18.0, 28.0, 55.0, 111.0, 215.0, 276.0, 84.0, 56.0, 29.0, 17.0, 22.0, 10.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000179290771484375, -0.00017431378364562988, -0.00016933679580688477, -0.00016435980796813965, -0.00015938282012939453, -0.00015440583229064941, -0.0001494288444519043, -0.00014445185661315918, -0.00013947486877441406, -0.00013449788093566895, -0.00012952089309692383, -0.0001245439052581787, -0.0001195669174194336, -0.00011458992958068848, -0.00010961294174194336, -0.00010463595390319824, -9.965896606445312e-05, -9.468197822570801e-05, -8.970499038696289e-05, -8.472800254821777e-05, -7.975101470947266e-05, -7.477402687072754e-05, -6.979703903198242e-05, -6.48200511932373e-05, -5.984306335449219e-05, -5.486607551574707e-05, -4.988908767700195e-05, -4.4912099838256836e-05, -3.993511199951172e-05, -3.49581241607666e-05, -2.9981136322021484e-05, -2.5004148483276367e-05, -2.002716064453125e-05, -1.5050172805786133e-05, -1.0073184967041016e-05, -5.0961971282958984e-06, -1.1920928955078125e-07, 4.857778549194336e-06, 9.834766387939453e-06, 1.481175422668457e-05, 1.9788742065429688e-05, 2.4765729904174805e-05, 2.9742717742919922e-05, 3.471970558166504e-05, 3.9696693420410156e-05, 4.4673681259155273e-05, 4.965066909790039e-05, 5.462765693664551e-05, 5.9604644775390625e-05, 6.458163261413574e-05, 6.955862045288086e-05, 7.453560829162598e-05, 7.95125961303711e-05, 8.448958396911621e-05, 8.946657180786133e-05, 9.444355964660645e-05, 9.942054748535156e-05, 0.00010439753532409668, 0.0001093745231628418, 0.00011435151100158691, 0.00011932849884033203, 0.00012430548667907715, 0.00012928247451782227, 0.00013425946235656738, 0.0001392364501953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 4.0, 3.0, 5.0, 8.0, 10.0, 9.0, 14.0, 28.0, 20.0, 41.0, 56.0, 114.0, 295.0, 748.0, 2562.0, 14401.0, 740926.0, 275262.0, 10654.0, 2154.0, 629.0, 269.0, 112.0, 62.0, 36.0, 31.0, 18.0, 21.0, 10.0, 6.0, 6.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005135536193847656, -0.0004988498985767365, -0.0004841461777687073, -0.0004694424569606781, -0.0004547387361526489, -0.00044003501534461975, -0.0004253312945365906, -0.0004106275737285614, -0.0003959238529205322, -0.00038122013211250305, -0.0003665164113044739, -0.0003518126904964447, -0.00033710896968841553, -0.00032240524888038635, -0.0003077015280723572, -0.000292997807264328, -0.00027829408645629883, -0.00026359036564826965, -0.0002488866448402405, -0.0002341829240322113, -0.00021947920322418213, -0.00020477548241615295, -0.00019007176160812378, -0.0001753680408000946, -0.00016066431999206543, -0.00014596059918403625, -0.00013125687837600708, -0.0001165531575679779, -0.00010184943675994873, -8.714571595191956e-05, -7.244199514389038e-05, -5.7738274335861206e-05, -4.303455352783203e-05, -2.8330832719802856e-05, -1.3627111911773682e-05, 1.0766088962554932e-06, 1.5780329704284668e-05, 3.0484050512313843e-05, 4.518777132034302e-05, 5.989149212837219e-05, 7.459521293640137e-05, 8.929893374443054e-05, 0.00010400265455245972, 0.00011870637536048889, 0.00013341009616851807, 0.00014811381697654724, 0.00016281753778457642, 0.0001775212585926056, 0.00019222497940063477, 0.00020692870020866394, 0.00022163242101669312, 0.0002363361418247223, 0.00025103986263275146, 0.00026574358344078064, 0.0002804473042488098, 0.000295151025056839, 0.00030985474586486816, 0.00032455846667289734, 0.0003392621874809265, 0.0003539659082889557, 0.00036866962909698486, 0.00038337334990501404, 0.0003980770707130432, 0.0004127807915210724, 0.00042748451232910156]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 0.0, 7.0, 8.0, 5.0, 12.0, 10.0, 25.0, 20.0, 19.0, 39.0, 60.0, 64.0, 101.0, 145.0, 114.0, 90.0, 57.0, 46.0, 39.0, 22.0, 19.0, 18.0, 15.0, 10.0, 5.0, 8.0, 4.0, 7.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5359134674072266e-05, -4.4022686779499054e-05, -4.268623888492584e-05, -4.134979099035263e-05, -4.001334309577942e-05, -3.867689520120621e-05, -3.7340447306632996e-05, -3.6003999412059784e-05, -3.466755151748657e-05, -3.333110362291336e-05, -3.199465572834015e-05, -3.065820783376694e-05, -2.9321759939193726e-05, -2.7985312044620514e-05, -2.6648864150047302e-05, -2.531241625547409e-05, -2.397596836090088e-05, -2.2639520466327667e-05, -2.1303072571754456e-05, -1.9966624677181244e-05, -1.8630176782608032e-05, -1.729372888803482e-05, -1.595728099346161e-05, -1.4620833098888397e-05, -1.3284385204315186e-05, -1.1947937309741974e-05, -1.0611489415168762e-05, -9.27504152059555e-06, -7.938593626022339e-06, -6.602145731449127e-06, -5.2656978368759155e-06, -3.929249942302704e-06, -2.592802047729492e-06, -1.2563541531562805e-06, 8.009374141693115e-08, 1.4165416359901428e-06, 2.7529895305633545e-06, 4.089437425136566e-06, 5.425885319709778e-06, 6.7623332142829895e-06, 8.098781108856201e-06, 9.435229003429413e-06, 1.0771676898002625e-05, 1.2108124792575836e-05, 1.3444572687149048e-05, 1.478102058172226e-05, 1.611746847629547e-05, 1.7453916370868683e-05, 1.8790364265441895e-05, 2.0126812160015106e-05, 2.1463260054588318e-05, 2.279970794916153e-05, 2.413615584373474e-05, 2.5472603738307953e-05, 2.6809051632881165e-05, 2.8145499527454376e-05, 2.9481947422027588e-05, 3.08183953166008e-05, 3.215484321117401e-05, 3.349129110574722e-05, 3.4827739000320435e-05, 3.6164186894893646e-05, 3.750063478946686e-05, 3.883708268404007e-05, 4.017353057861328e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 15.0, 21.0, 34.0, 63.0, 125.0, 241.0, 274.0, 120.0, 60.0, 26.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9748425483703613, -0.9103848934173584, -0.8459272384643555, -0.7814695835113525, -0.7170119285583496, -0.6525542736053467, -0.5880966186523438, -0.5236389636993408, -0.4591813087463379, -0.39472365379333496, -0.33026599884033203, -0.2658083438873291, -0.20135068893432617, -0.13689303398132324, -0.07243537902832031, -0.007977724075317383, 0.05647993087768555, 0.12093758583068848, 0.1853952407836914, 0.24985289573669434, 0.31431055068969727, 0.3787682056427002, 0.4432258605957031, 0.507683515548706, 0.572141170501709, 0.6365988254547119, 0.7010564804077148, 0.7655141353607178, 0.8299717903137207, 0.8944294452667236, 0.9588871002197266, 1.0233447551727295, 1.0878026485443115, 1.1522603034973145, 1.2167179584503174, 1.2811756134033203, 1.3456332683563232, 1.4100909233093262, 1.474548578262329, 1.539006233215332, 1.603463888168335, 1.667921543121338, 1.7323791980743408, 1.7968368530273438, 1.8612945079803467, 1.9257521629333496, 1.9902098178863525, 2.0546674728393555, 2.1191251277923584, 2.1835827827453613, 2.2480404376983643, 2.312498092651367, 2.37695574760437, 2.441413402557373, 2.505871057510376, 2.570328712463379, 2.634786367416382, 2.6992440223693848, 2.7637016773223877, 2.8281593322753906, 2.8926169872283936, 2.9570746421813965, 3.0215322971343994, 3.0859899520874023, 3.1504476070404053]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 29.0, 32.0, 52.0, 107.0, 94.0, 124.0, 155.0, 119.0, 91.0, 69.0, 54.0, 36.0, 16.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9960737228393555, -1.9409973621368408, -1.8859211206436157, -1.8308448791503906, -1.775768518447876, -1.7206921577453613, -1.6656159162521362, -1.6105396747589111, -1.5554633140563965, -1.5003869533538818, -1.4453107118606567, -1.3902344703674316, -1.335158109664917, -1.2800817489624023, -1.2250055074691772, -1.1699292659759521, -1.1148529052734375, -1.0597765445709229, -1.0047003030776978, -0.9496240019798279, -0.894547700881958, -0.8394713997840881, -0.7843950986862183, -0.7293187975883484, -0.6742424964904785, -0.6191661953926086, -0.5640898942947388, -0.5090135931968689, -0.453937292098999, -0.39886099100112915, -0.3437846899032593, -0.2887083888053894, -0.23363196849822998, -0.1785556674003601, -0.12347936630249023, -0.06840306520462036, -0.013326764106750488, 0.041749536991119385, 0.09682583808898926, 0.15190213918685913, 0.206978440284729, 0.2620547413825989, 0.31713104248046875, 0.3722073435783386, 0.4272836446762085, 0.48235994577407837, 0.5374362468719482, 0.5925125479698181, 0.647588849067688, 0.7026651501655579, 0.7577414512634277, 0.8128177523612976, 0.8678940534591675, 0.9229703545570374, 0.9780466556549072, 1.0331230163574219, 1.088199257850647, 1.143275499343872, 1.1983518600463867, 1.2534282207489014, 1.3085044622421265, 1.3635807037353516, 1.4186570644378662, 1.4737334251403809, 1.528809666633606]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 11.0, 7.0, 18.0, 10.0, 21.0, 26.0, 42.0, 61.0, 127.0, 262.0, 644.0, 1768.0, 5312.0, 21424.0, 139679.0, 753658.0, 101232.0, 17103.0, 4542.0, 1482.0, 565.0, 248.0, 128.0, 53.0, 41.0, 20.0, 15.0, 11.0, 6.0, 13.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1669921875, -1.122833251953125, -1.07867431640625, -1.034515380859375, -0.9903564453125, -0.946197509765625, -0.90203857421875, -0.857879638671875, -0.813720703125, -0.769561767578125, -0.72540283203125, -0.681243896484375, -0.6370849609375, -0.592926025390625, -0.54876708984375, -0.504608154296875, -0.46044921875, -0.416290283203125, -0.37213134765625, -0.327972412109375, -0.2838134765625, -0.239654541015625, -0.19549560546875, -0.151336669921875, -0.107177734375, -0.063018798828125, -0.01885986328125, 0.025299072265625, 0.0694580078125, 0.113616943359375, 0.15777587890625, 0.201934814453125, 0.24609375, 0.290252685546875, 0.33441162109375, 0.378570556640625, 0.4227294921875, 0.466888427734375, 0.51104736328125, 0.555206298828125, 0.599365234375, 0.643524169921875, 0.68768310546875, 0.731842041015625, 0.7760009765625, 0.820159912109375, 0.86431884765625, 0.908477783203125, 0.95263671875, 0.996795654296875, 1.04095458984375, 1.085113525390625, 1.1292724609375, 1.173431396484375, 1.21759033203125, 1.261749267578125, 1.305908203125, 1.350067138671875, 1.39422607421875, 1.438385009765625, 1.4825439453125, 1.526702880859375, 1.57086181640625, 1.615020751953125, 1.6591796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 8.0, 10.0, 22.0, 17.0, 25.0, 29.0, 33.0, 40.0, 42.0, 39.0, 40.0, 42.0, 55.0, 54.0, 49.0, 46.0, 46.0, 42.0, 49.0, 47.0, 34.0, 34.0, 34.0, 35.0, 26.0, 11.0, 13.0, 11.0, 12.0, 8.0, 6.0, 15.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1995849609375, -0.194122314453125, -0.18865966796875, -0.183197021484375, -0.177734375, -0.172271728515625, -0.16680908203125, -0.161346435546875, -0.1558837890625, -0.150421142578125, -0.14495849609375, -0.139495849609375, -0.134033203125, -0.128570556640625, -0.12310791015625, -0.117645263671875, -0.1121826171875, -0.106719970703125, -0.10125732421875, -0.095794677734375, -0.09033203125, -0.084869384765625, -0.07940673828125, -0.073944091796875, -0.0684814453125, -0.063018798828125, -0.05755615234375, -0.052093505859375, -0.046630859375, -0.041168212890625, -0.03570556640625, -0.030242919921875, -0.0247802734375, -0.019317626953125, -0.01385498046875, -0.008392333984375, -0.0029296875, 0.002532958984375, 0.00799560546875, 0.013458251953125, 0.0189208984375, 0.024383544921875, 0.02984619140625, 0.035308837890625, 0.040771484375, 0.046234130859375, 0.05169677734375, 0.057159423828125, 0.0626220703125, 0.068084716796875, 0.07354736328125, 0.079010009765625, 0.08447265625, 0.089935302734375, 0.09539794921875, 0.100860595703125, 0.1063232421875, 0.111785888671875, 0.11724853515625, 0.122711181640625, 0.128173828125, 0.133636474609375, 0.13909912109375, 0.144561767578125, 0.1500244140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 12.0, 7.0, 4.0, 25.0, 21.0, 36.0, 30.0, 56.0, 53.0, 68.0, 98.0, 123.0, 293.0, 2124.0, 166791.0, 873986.0, 3908.0, 356.0, 136.0, 89.0, 77.0, 48.0, 45.0, 45.0, 27.0, 17.0, 18.0, 21.0, 9.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.93890380859375, -4.7801513671875, -4.62139892578125, -4.462646484375, -4.30389404296875, -4.1451416015625, -3.98638916015625, -3.82763671875, -3.66888427734375, -3.5101318359375, -3.35137939453125, -3.192626953125, -3.03387451171875, -2.8751220703125, -2.71636962890625, -2.5576171875, -2.39886474609375, -2.2401123046875, -2.08135986328125, -1.922607421875, -1.76385498046875, -1.6051025390625, -1.44635009765625, -1.28759765625, -1.12884521484375, -0.9700927734375, -0.81134033203125, -0.652587890625, -0.49383544921875, -0.3350830078125, -0.17633056640625, -0.017578125, 0.14117431640625, 0.2999267578125, 0.45867919921875, 0.617431640625, 0.77618408203125, 0.9349365234375, 1.09368896484375, 1.25244140625, 1.41119384765625, 1.5699462890625, 1.72869873046875, 1.887451171875, 2.04620361328125, 2.2049560546875, 2.36370849609375, 2.5224609375, 2.68121337890625, 2.8399658203125, 2.99871826171875, 3.157470703125, 3.31622314453125, 3.4749755859375, 3.63372802734375, 3.79248046875, 3.95123291015625, 4.1099853515625, 4.26873779296875, 4.427490234375, 4.58624267578125, 4.7449951171875, 4.90374755859375, 5.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 0.0, 12.0, 12.0, 14.0, 23.0, 10.0, 17.0, 24.0, 36.0, 28.0, 47.0, 52.0, 66.0, 61.0, 85.0, 68.0, 79.0, 64.0, 52.0, 44.0, 31.0, 29.0, 22.0, 20.0, 19.0, 13.0, 5.0, 14.0, 9.0, 11.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6972427368164062, -0.6747589111328125, -0.6522750854492188, -0.629791259765625, -0.6073074340820312, -0.5848236083984375, -0.5623397827148438, -0.53985595703125, -0.5173721313476562, -0.4948883056640625, -0.47240447998046875, -0.449920654296875, -0.42743682861328125, -0.4049530029296875, -0.38246917724609375, -0.3599853515625, -0.33750152587890625, -0.3150177001953125, -0.29253387451171875, -0.270050048828125, -0.24756622314453125, -0.2250823974609375, -0.20259857177734375, -0.18011474609375, -0.15763092041015625, -0.1351470947265625, -0.11266326904296875, -0.090179443359375, -0.06769561767578125, -0.0452117919921875, -0.02272796630859375, -0.000244140625, 0.02223968505859375, 0.0447235107421875, 0.06720733642578125, 0.089691162109375, 0.11217498779296875, 0.1346588134765625, 0.15714263916015625, 0.17962646484375, 0.20211029052734375, 0.2245941162109375, 0.24707794189453125, 0.269561767578125, 0.29204559326171875, 0.3145294189453125, 0.33701324462890625, 0.3594970703125, 0.38198089599609375, 0.4044647216796875, 0.42694854736328125, 0.449432373046875, 0.47191619873046875, 0.4944000244140625, 0.5168838500976562, 0.53936767578125, 0.5618515014648438, 0.5843353271484375, 0.6068191528320312, 0.629302978515625, 0.6517868041992188, 0.6742706298828125, 0.6967544555664062, 0.71923828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 4.0, 9.0, 3.0, 4.0, 10.0, 5.0, 9.0, 16.0, 23.0, 32.0, 43.0, 68.0, 86.0, 135.0, 294.0, 519.0, 932.0, 1866.0, 4217.0, 11892.0, 84154.0, 899470.0, 31138.0, 7443.0, 2958.0, 1414.0, 755.0, 386.0, 227.0, 152.0, 79.0, 49.0, 31.0, 22.0, 14.0, 22.0, 13.0, 13.0, 5.0, 1.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.33984375, -0.32932281494140625, -0.3188018798828125, -0.30828094482421875, -0.297760009765625, -0.28723907470703125, -0.2767181396484375, -0.26619720458984375, -0.25567626953125, -0.24515533447265625, -0.2346343994140625, -0.22411346435546875, -0.213592529296875, -0.20307159423828125, -0.1925506591796875, -0.18202972412109375, -0.1715087890625, -0.16098785400390625, -0.1504669189453125, -0.13994598388671875, -0.129425048828125, -0.11890411376953125, -0.1083831787109375, -0.09786224365234375, -0.08734130859375, -0.07682037353515625, -0.0662994384765625, -0.05577850341796875, -0.045257568359375, -0.03473663330078125, -0.0242156982421875, -0.01369476318359375, -0.003173828125, 0.00734710693359375, 0.0178680419921875, 0.02838897705078125, 0.038909912109375, 0.04943084716796875, 0.0599517822265625, 0.07047271728515625, 0.08099365234375, 0.09151458740234375, 0.1020355224609375, 0.11255645751953125, 0.123077392578125, 0.13359832763671875, 0.1441192626953125, 0.15464019775390625, 0.1651611328125, 0.17568206787109375, 0.1862030029296875, 0.19672393798828125, 0.207244873046875, 0.21776580810546875, 0.2282867431640625, 0.23880767822265625, 0.24932861328125, 0.25984954833984375, 0.2703704833984375, 0.28089141845703125, 0.291412353515625, 0.30193328857421875, 0.3124542236328125, 0.32297515869140625, 0.33349609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 3.0, 0.0, 8.0, 2.0, 11.0, 26.0, 84.0, 729.0, 70.0, 33.0, 14.0, 3.0, 7.0, 0.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018334388732910156, -0.00017666444182395935, -0.00016998499631881714, -0.00016330555081367493, -0.00015662610530853271, -0.0001499466598033905, -0.0001432672142982483, -0.00013658776879310608, -0.00012990832328796387, -0.00012322887778282166, -0.00011654943227767944, -0.00010986998677253723, -0.00010319054126739502, -9.651109576225281e-05, -8.98316502571106e-05, -8.315220475196838e-05, -7.647275924682617e-05, -6.979331374168396e-05, -6.311386823654175e-05, -5.6434422731399536e-05, -4.9754977226257324e-05, -4.307553172111511e-05, -3.63960862159729e-05, -2.971664071083069e-05, -2.3037195205688477e-05, -1.6357749700546265e-05, -9.678304195404053e-06, -2.998858690261841e-06, 3.680586814880371e-06, 1.0360032320022583e-05, 1.7039477825164795e-05, 2.3718923330307007e-05, 3.039836883544922e-05, 3.707781434059143e-05, 4.375725984573364e-05, 5.0436705350875854e-05, 5.7116150856018066e-05, 6.379559636116028e-05, 7.047504186630249e-05, 7.71544873714447e-05, 8.383393287658691e-05, 9.051337838172913e-05, 9.719282388687134e-05, 0.00010387226939201355, 0.00011055171489715576, 0.00011723116040229797, 0.00012391060590744019, 0.0001305900514125824, 0.0001372694969177246, 0.00014394894242286682, 0.00015062838792800903, 0.00015730783343315125, 0.00016398727893829346, 0.00017066672444343567, 0.00017734616994857788, 0.0001840256154537201, 0.0001907050609588623, 0.00019738450646400452, 0.00020406395196914673, 0.00021074339747428894, 0.00021742284297943115, 0.00022410228848457336, 0.00023078173398971558, 0.0002374611794948578, 0.000244140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 4.0, 3.0, 4.0, 2.0, 6.0, 5.0, 7.0, 11.0, 4.0, 5.0, 10.0, 28.0, 41.0, 76.0, 205.0, 720.0, 3531.0, 48272.0, 986394.0, 7314.0, 1246.0, 323.0, 141.0, 47.0, 33.0, 21.0, 20.0, 15.0, 15.0, 9.0, 7.0, 7.0, 7.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.427001953125, -0.4137306213378906, -0.40045928955078125, -0.3871879577636719, -0.3739166259765625, -0.3606452941894531, -0.34737396240234375, -0.3341026306152344, -0.320831298828125, -0.3075599670410156, -0.29428863525390625, -0.2810173034667969, -0.2677459716796875, -0.2544746398925781, -0.24120330810546875, -0.22793197631835938, -0.21466064453125, -0.20138931274414062, -0.18811798095703125, -0.17484664916992188, -0.1615753173828125, -0.14830398559570312, -0.13503265380859375, -0.12176132202148438, -0.108489990234375, -0.09521865844726562, -0.08194732666015625, -0.06867599487304688, -0.0554046630859375, -0.042133331298828125, -0.02886199951171875, -0.015590667724609375, -0.0023193359375, 0.010951995849609375, 0.02422332763671875, 0.037494659423828125, 0.0507659912109375, 0.06403732299804688, 0.07730865478515625, 0.09057998657226562, 0.103851318359375, 0.11712265014648438, 0.13039398193359375, 0.14366531372070312, 0.1569366455078125, 0.17020797729492188, 0.18347930908203125, 0.19675064086914062, 0.21002197265625, 0.22329330444335938, 0.23656463623046875, 0.24983596801757812, 0.2631072998046875, 0.2763786315917969, 0.28964996337890625, 0.3029212951660156, 0.316192626953125, 0.3294639587402344, 0.34273529052734375, 0.3560066223144531, 0.3692779541015625, 0.3825492858886719, 0.39582061767578125, 0.4090919494628906, 0.42236328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 15.0, 8.0, 24.0, 22.0, 115.0, 513.0, 118.0, 50.0, 10.0, 13.0, 11.0, 10.0, 9.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06494140625, -0.0626668930053711, -0.06039237976074219, -0.05811786651611328, -0.055843353271484375, -0.05356884002685547, -0.05129432678222656, -0.049019813537597656, -0.04674530029296875, -0.044470787048339844, -0.04219627380371094, -0.03992176055908203, -0.037647247314453125, -0.03537273406982422, -0.03309822082519531, -0.030823707580566406, -0.0285491943359375, -0.026274681091308594, -0.024000167846679688, -0.02172565460205078, -0.019451141357421875, -0.01717662811279297, -0.014902114868164062, -0.012627601623535156, -0.01035308837890625, -0.008078575134277344, -0.0058040618896484375, -0.0035295486450195312, -0.001255035400390625, 0.0010194778442382812, 0.0032939910888671875, 0.005568504333496094, 0.007843017578125, 0.010117530822753906, 0.012392044067382812, 0.014666557312011719, 0.016941070556640625, 0.01921558380126953, 0.021490097045898438, 0.023764610290527344, 0.02603912353515625, 0.028313636779785156, 0.030588150024414062, 0.03286266326904297, 0.035137176513671875, 0.03741168975830078, 0.03968620300292969, 0.041960716247558594, 0.0442352294921875, 0.046509742736816406, 0.04878425598144531, 0.05105876922607422, 0.053333282470703125, 0.05560779571533203, 0.05788230895996094, 0.060156822204589844, 0.06243133544921875, 0.06470584869384766, 0.06698036193847656, 0.06925487518310547, 0.07152938842773438, 0.07380390167236328, 0.07607841491699219, 0.0783529281616211, 0.08062744140625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 9.0, 15.0, 21.0, 51.0, 90.0, 141.0, 191.0, 167.0, 132.0, 70.0, 56.0, 19.0, 17.0, 11.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.971177577972412, -1.9078834056854248, -1.8445892333984375, -1.7812949419021606, -1.7180007696151733, -1.654706597328186, -1.5914123058319092, -1.5281181335449219, -1.4648239612579346, -1.4015297889709473, -1.33823561668396, -1.274941325187683, -1.2116471529006958, -1.1483529806137085, -1.0850586891174316, -1.0217645168304443, -0.958470344543457, -0.8951761722564697, -0.8318819403648376, -0.7685877084732056, -0.7052935361862183, -0.641999363899231, -0.5787051320075989, -0.5154109001159668, -0.4521167278289795, -0.3888225257396698, -0.3255283236503601, -0.2622341215610504, -0.19893991947174072, -0.13564571738243103, -0.07235151529312134, -0.009057313203811646, 0.05423688888549805, 0.11753109097480774, 0.18082529306411743, 0.24411949515342712, 0.3074136972427368, 0.3707078993320465, 0.4340021014213562, 0.4972963035106659, 0.5605905055999756, 0.6238846778869629, 0.687178909778595, 0.750473141670227, 0.8137673139572144, 0.8770614862442017, 0.9403557181358337, 1.0036499500274658, 1.0669441223144531, 1.1302382946014404, 1.1935324668884277, 1.2568267583847046, 1.320120930671692, 1.3834151029586792, 1.446709394454956, 1.5100035667419434, 1.5732977390289307, 1.636591911315918, 1.6998860836029053, 1.7631803750991821, 1.8264745473861694, 1.8897687196731567, 1.9530630111694336, 2.016357183456421, 2.079651355743408]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 5.0, 6.0, 13.0, 12.0, 14.0, 10.0, 24.0, 24.0, 29.0, 37.0, 26.0, 43.0, 28.0, 27.0, 49.0, 41.0, 36.0, 44.0, 47.0, 54.0, 41.0, 40.0, 48.0, 40.0, 36.0, 28.0, 32.0, 22.0, 30.0, 17.0, 22.0, 11.0, 13.0, 14.0, 10.0, 5.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9781044721603394, -0.9401484727859497, -0.9021924734115601, -0.8642364740371704, -0.8262804746627808, -0.7883244752883911, -0.7503684759140015, -0.7124124765396118, -0.6744564771652222, -0.6365004777908325, -0.5985444784164429, -0.5605884790420532, -0.5226324796676636, -0.4846764802932739, -0.4467204809188843, -0.40876448154449463, -0.370808482170105, -0.33285248279571533, -0.2948964834213257, -0.25694048404693604, -0.2189844846725464, -0.18102848529815674, -0.1430724859237671, -0.10511648654937744, -0.06716048717498779, -0.029204487800598145, 0.008751511573791504, 0.04670751094818115, 0.0846635103225708, 0.12261950969696045, 0.1605755090713501, 0.19853150844573975, 0.23648738861083984, 0.2744433879852295, 0.31239938735961914, 0.3503553867340088, 0.38831138610839844, 0.4262673854827881, 0.46422338485717773, 0.5021793842315674, 0.540135383605957, 0.5780913829803467, 0.6160473823547363, 0.654003381729126, 0.6919593811035156, 0.7299153804779053, 0.7678713798522949, 0.8058273792266846, 0.8437833786010742, 0.8817393779754639, 0.9196953773498535, 0.9576513767242432, 0.9956073760986328, 1.0335633754730225, 1.071519374847412, 1.1094753742218018, 1.1474313735961914, 1.185387372970581, 1.2233433723449707, 1.2612993717193604, 1.29925537109375, 1.3372113704681396, 1.3751673698425293, 1.413123369216919, 1.4510793685913086]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 12.0, 15.0, 31.0, 54.0, 82.0, 98.0, 107.0, 179.0, 261.0, 387.0, 544.0, 823.0, 1188.0, 1815.0, 2693.0, 5997.0, 4166315.0, 5372.0, 2660.0, 1768.0, 1169.0, 835.0, 576.0, 392.0, 275.0, 174.0, 136.0, 87.0, 57.0, 35.0, 41.0, 22.0, 16.0, 15.0, 12.0, 12.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.748199462890625, -3.61163330078125, -3.475067138671875, -3.3385009765625, -3.201934814453125, -3.06536865234375, -2.928802490234375, -2.792236328125, -2.655670166015625, -2.51910400390625, -2.382537841796875, -2.2459716796875, -2.109405517578125, -1.97283935546875, -1.836273193359375, -1.69970703125, -1.563140869140625, -1.42657470703125, -1.290008544921875, -1.1534423828125, -1.016876220703125, -0.88031005859375, -0.743743896484375, -0.607177734375, -0.470611572265625, -0.33404541015625, -0.197479248046875, -0.0609130859375, 0.075653076171875, 0.21221923828125, 0.348785400390625, 0.4853515625, 0.621917724609375, 0.75848388671875, 0.895050048828125, 1.0316162109375, 1.168182373046875, 1.30474853515625, 1.441314697265625, 1.577880859375, 1.714447021484375, 1.85101318359375, 1.987579345703125, 2.1241455078125, 2.260711669921875, 2.39727783203125, 2.533843994140625, 2.67041015625, 2.806976318359375, 2.94354248046875, 3.080108642578125, 3.2166748046875, 3.353240966796875, 3.48980712890625, 3.626373291015625, 3.762939453125, 3.899505615234375, 4.03607177734375, 4.172637939453125, 4.3092041015625, 4.445770263671875, 4.58233642578125, 4.718902587890625, 4.85546875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 4.0, 4.0, 9.0, 9.0, 7.0, 8.0, 16.0, 12.0, 22.0, 27.0, 26.0, 31.0, 31.0, 35.0, 23.0, 46.0, 57.0, 46.0, 45.0, 40.0, 41.0, 46.0, 30.0, 44.0, 45.0, 35.0, 39.0, 29.0, 33.0, 24.0, 26.0, 18.0, 15.0, 11.0, 11.0, 11.0, 12.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14892578125, -0.1442394256591797, -0.13955307006835938, -0.13486671447753906, -0.13018035888671875, -0.12549400329589844, -0.12080764770507812, -0.11612129211425781, -0.1114349365234375, -0.10674858093261719, -0.10206222534179688, -0.09737586975097656, -0.09268951416015625, -0.08800315856933594, -0.08331680297851562, -0.07863044738769531, -0.073944091796875, -0.06925773620605469, -0.06457138061523438, -0.05988502502441406, -0.05519866943359375, -0.05051231384277344, -0.045825958251953125, -0.04113960266113281, -0.0364532470703125, -0.03176689147949219, -0.027080535888671875, -0.022394180297851562, -0.01770782470703125, -0.013021469116210938, -0.008335113525390625, -0.0036487579345703125, 0.00103759765625, 0.0057239532470703125, 0.010410308837890625, 0.015096664428710938, 0.01978302001953125, 0.024469375610351562, 0.029155731201171875, 0.03384208679199219, 0.0385284423828125, 0.04321479797363281, 0.047901153564453125, 0.05258750915527344, 0.05727386474609375, 0.06196022033691406, 0.06664657592773438, 0.07133293151855469, 0.076019287109375, 0.08070564270019531, 0.08539199829101562, 0.09007835388183594, 0.09476470947265625, 0.09945106506347656, 0.10413742065429688, 0.10882377624511719, 0.1135101318359375, 0.11819648742675781, 0.12288284301757812, 0.12756919860839844, 0.13225555419921875, 0.13694190979003906, 0.14162826538085938, 0.1463146209716797, 0.1510009765625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 16.0, 89.0, 1711.0, 4191644.0, 750.0, 42.0, 15.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.90625, -28.921875, -27.9375, -26.953125, -25.96875, -24.984375, -24.0, -23.015625, -22.03125, -21.046875, -20.0625, -19.078125, -18.09375, -17.109375, -16.125, -15.140625, -14.15625, -13.171875, -12.1875, -11.203125, -10.21875, -9.234375, -8.25, -7.265625, -6.28125, -5.296875, -4.3125, -3.328125, -2.34375, -1.359375, -0.375, 0.609375, 1.59375, 2.578125, 3.5625, 4.546875, 5.53125, 6.515625, 7.5, 8.484375, 9.46875, 10.453125, 11.4375, 12.421875, 13.40625, 14.390625, 15.375, 16.359375, 17.34375, 18.328125, 19.3125, 20.296875, 21.28125, 22.265625, 23.25, 24.234375, 25.21875, 26.203125, 27.1875, 28.171875, 29.15625, 30.140625, 31.125, 32.109375, 33.09375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 3995.0, 48.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9137344360351562, -0.8767852783203125, -0.8398361206054688, -0.802886962890625, -0.7659378051757812, -0.7289886474609375, -0.6920394897460938, -0.65509033203125, -0.6181411743164062, -0.5811920166015625, -0.5442428588867188, -0.507293701171875, -0.47034454345703125, -0.4333953857421875, -0.39644622802734375, -0.3594970703125, -0.32254791259765625, -0.2855987548828125, -0.24864959716796875, -0.211700439453125, -0.17475128173828125, -0.1378021240234375, -0.10085296630859375, -0.06390380859375, -0.02695465087890625, 0.0099945068359375, 0.04694366455078125, 0.083892822265625, 0.12084197998046875, 0.1577911376953125, 0.19474029541015625, 0.231689453125, 0.26863861083984375, 0.3055877685546875, 0.34253692626953125, 0.379486083984375, 0.41643524169921875, 0.4533843994140625, 0.49033355712890625, 0.52728271484375, 0.5642318725585938, 0.6011810302734375, 0.6381301879882812, 0.675079345703125, 0.7120285034179688, 0.7489776611328125, 0.7859268188476562, 0.8228759765625, 0.8598251342773438, 0.8967742919921875, 0.9337234497070312, 0.970672607421875, 1.0076217651367188, 1.0445709228515625, 1.0815200805664062, 1.11846923828125, 1.1554183959960938, 1.1923675537109375, 1.2293167114257812, 1.266265869140625, 1.3032150268554688, 1.3401641845703125, 1.3771133422851562, 1.4140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 14.0, 12.0, 24.0, 38.0, 57.0, 94.0, 158.0, 242.0, 144.0, 83.0, 41.0, 28.0, 16.0, 6.0, 5.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4417426586151123, -1.40015709400177, -1.3585715293884277, -1.3169859647750854, -1.2754004001617432, -1.2338148355484009, -1.1922292709350586, -1.1506435871124268, -1.109058141708374, -1.0674725770950317, -1.0258870124816895, -0.9843014478683472, -0.9427158832550049, -0.9011303186416626, -0.8595446944236755, -0.8179591298103333, -0.7763735055923462, -0.7347879409790039, -0.6932023763656616, -0.6516168117523193, -0.610031247138977, -0.5684456825256348, -0.5268600583076477, -0.4852744936943054, -0.44368892908096313, -0.40210336446762085, -0.36051779985427856, -0.3189322054386139, -0.2773466408252716, -0.23576107621192932, -0.19417549669742584, -0.15258991718292236, -0.11100435256958008, -0.0694187805056572, -0.027833208441734314, 0.013752363622188568, 0.05533793568611145, 0.09692350029945374, 0.13850907981395721, 0.1800946593284607, 0.22168022394180298, 0.26326578855514526, 0.30485135316848755, 0.3464369475841522, 0.3880225121974945, 0.4296080768108368, 0.47119367122650146, 0.5127792358398438, 0.554364800453186, 0.5959503650665283, 0.6375359296798706, 0.6791214942932129, 0.7207070589065552, 0.7622926235198975, 0.8038782477378845, 0.8454638123512268, 0.8870493769645691, 0.9286349415779114, 0.9702205061912537, 1.0118061304092407, 1.053391695022583, 1.0949772596359253, 1.1365628242492676, 1.1781483888626099, 1.2197339534759521]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 6.0, 4.0, 4.0, 4.0, 8.0, 7.0, 9.0, 12.0, 11.0, 26.0, 15.0, 28.0, 25.0, 39.0, 35.0, 24.0, 37.0, 39.0, 32.0, 35.0, 44.0, 53.0, 41.0, 33.0, 41.0, 53.0, 39.0, 34.0, 38.0, 36.0, 27.0, 27.0, 23.0, 16.0, 20.0, 16.0, 7.0, 5.0, 10.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39157435297966003, -0.3793319761753082, -0.3670895993709564, -0.3548472225666046, -0.3426048457622528, -0.330362468957901, -0.3181200623512268, -0.305877685546875, -0.2936353087425232, -0.2813929319381714, -0.2691505551338196, -0.2569081783294678, -0.24466580152511597, -0.23242342472076416, -0.22018103301525116, -0.20793865621089935, -0.19569629430770874, -0.18345391750335693, -0.17121154069900513, -0.15896916389465332, -0.1467267870903015, -0.1344844102859497, -0.1222420185804367, -0.1099996417760849, -0.0977572649717331, -0.08551488816738129, -0.07327251136302948, -0.061030127108097076, -0.04878775030374527, -0.03654537349939346, -0.02430298924446106, -0.012060612440109253, 0.00018173456192016602, 0.012424113228917122, 0.024666491895914078, 0.03690887242555618, 0.04915124922990799, 0.061393626034259796, 0.0736360102891922, 0.085878387093544, 0.09812076389789581, 0.11036314070224762, 0.12260551750659943, 0.13484790921211243, 0.14709028601646423, 0.15933266282081604, 0.17157503962516785, 0.18381741642951965, 0.19605979323387146, 0.20830217003822327, 0.22054454684257507, 0.23278692364692688, 0.2450293004512787, 0.2572716772556305, 0.2695140838623047, 0.2817564606666565, 0.2939988374710083, 0.3062412142753601, 0.3184835910797119, 0.3307259678840637, 0.3429683446884155, 0.35521072149276733, 0.36745309829711914, 0.37969547510147095, 0.39193785190582275]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 13.0, 18.0, 16.0, 52.0, 121.0, 898.0, 92718.0, 953115.0, 1334.0, 147.0, 45.0, 23.0, 10.0, 12.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.964019775390625, -0.93487548828125, -0.905731201171875, -0.8765869140625, -0.847442626953125, -0.81829833984375, -0.789154052734375, -0.760009765625, -0.730865478515625, -0.70172119140625, -0.672576904296875, -0.6434326171875, -0.614288330078125, -0.58514404296875, -0.555999755859375, -0.52685546875, -0.497711181640625, -0.46856689453125, -0.439422607421875, -0.4102783203125, -0.381134033203125, -0.35198974609375, -0.322845458984375, -0.293701171875, -0.264556884765625, -0.23541259765625, -0.206268310546875, -0.1771240234375, -0.147979736328125, -0.11883544921875, -0.089691162109375, -0.060546875, -0.031402587890625, -0.00225830078125, 0.026885986328125, 0.0560302734375, 0.085174560546875, 0.11431884765625, 0.143463134765625, 0.172607421875, 0.201751708984375, 0.23089599609375, 0.260040283203125, 0.2891845703125, 0.318328857421875, 0.34747314453125, 0.376617431640625, 0.40576171875, 0.434906005859375, 0.46405029296875, 0.493194580078125, 0.5223388671875, 0.551483154296875, 0.58062744140625, 0.609771728515625, 0.638916015625, 0.668060302734375, 0.69720458984375, 0.726348876953125, 0.7554931640625, 0.784637451171875, 0.81378173828125, 0.842926025390625, 0.8720703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [6.0, 9.0, 19.0, 45.0, 132.0, 226.0, 276.0, 173.0, 90.0, 29.0, 10.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.24217987060546875, -0.1967620849609375, -0.15134429931640625, -0.105926513671875, -0.06050872802734375, -0.0150909423828125, 0.03032684326171875, 0.07574462890625, 0.12116241455078125, 0.1665802001953125, 0.21199798583984375, 0.257415771484375, 0.30283355712890625, 0.3482513427734375, 0.39366912841796875, 0.4390869140625, 0.48450469970703125, 0.5299224853515625, 0.5753402709960938, 0.620758056640625, 0.6661758422851562, 0.7115936279296875, 0.7570114135742188, 0.80242919921875, 0.8478469848632812, 0.8932647705078125, 0.9386825561523438, 0.984100341796875, 1.0295181274414062, 1.0749359130859375, 1.1203536987304688, 1.165771484375, 1.2111892700195312, 1.2566070556640625, 1.3020248413085938, 1.347442626953125, 1.3928604125976562, 1.4382781982421875, 1.4836959838867188, 1.52911376953125, 1.5745315551757812, 1.6199493408203125, 1.6653671264648438, 1.710784912109375, 1.7562026977539062, 1.8016204833984375, 1.8470382690429688, 1.8924560546875, 1.9378738403320312, 1.9832916259765625, 2.0287094116210938, 2.074127197265625, 2.1195449829101562, 2.1649627685546875, 2.2103805541992188, 2.25579833984375, 2.3012161254882812, 2.3466339111328125, 2.3920516967773438, 2.437469482421875, 2.4828872680664062, 2.5283050537109375, 2.5737228393554688, 2.619140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 7.0, 10.0, 15.0, 21.0, 32.0, 32.0, 42.0, 60.0, 62.0, 77.0, 115.0, 129.0, 185.0, 419.0, 1118.0, 4241.0, 25219.0, 700597.0, 294041.0, 17291.0, 2966.0, 854.0, 327.0, 191.0, 132.0, 80.0, 62.0, 58.0, 45.0, 19.0, 18.0, 16.0, 20.0, 15.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.025078296661376953, -0.024338722229003906, -0.02359914779663086, -0.022859573364257812, -0.022119998931884766, -0.02138042449951172, -0.020640850067138672, -0.019901275634765625, -0.019161701202392578, -0.01842212677001953, -0.017682552337646484, -0.016942977905273438, -0.01620340347290039, -0.015463829040527344, -0.014724254608154297, -0.01398468017578125, -0.013245105743408203, -0.012505531311035156, -0.01176595687866211, -0.011026382446289062, -0.010286808013916016, -0.009547233581542969, -0.008807659149169922, -0.008068084716796875, -0.007328510284423828, -0.006588935852050781, -0.005849361419677734, -0.0051097869873046875, -0.004370212554931641, -0.0036306381225585938, -0.002891063690185547, -0.0021514892578125, -0.0014119148254394531, -0.0006723403930664062, 6.723403930664062e-05, 0.0008068084716796875, 0.0015463829040527344, 0.0022859573364257812, 0.003025531768798828, 0.003765106201171875, 0.004504680633544922, 0.005244255065917969, 0.005983829498291016, 0.0067234039306640625, 0.007462978363037109, 0.008202552795410156, 0.008942127227783203, 0.00968170166015625, 0.010421276092529297, 0.011160850524902344, 0.01190042495727539, 0.012639999389648438, 0.013379573822021484, 0.014119148254394531, 0.014858722686767578, 0.015598297119140625, 0.016337871551513672, 0.01707744598388672, 0.017817020416259766, 0.018556594848632812, 0.01929616928100586, 0.020035743713378906, 0.020775318145751953, 0.021514892578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 7.0, 2.0, 13.0, 15.0, 14.0, 18.0, 19.0, 26.0, 27.0, 19.0, 29.0, 26.0, 38.0, 49.0, 54.0, 44.0, 53.0, 49.0, 55.0, 55.0, 44.0, 49.0, 34.0, 41.0, 40.0, 30.0, 24.0, 28.0, 21.0, 13.0, 12.0, 9.0, 11.0, 9.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68359375, -0.6640701293945312, -0.6445465087890625, -0.6250228881835938, -0.605499267578125, -0.5859756469726562, -0.5664520263671875, -0.5469284057617188, -0.52740478515625, -0.5078811645507812, -0.4883575439453125, -0.46883392333984375, -0.449310302734375, -0.42978668212890625, -0.4102630615234375, -0.39073944091796875, -0.3712158203125, -0.35169219970703125, -0.3321685791015625, -0.31264495849609375, -0.293121337890625, -0.27359771728515625, -0.2540740966796875, -0.23455047607421875, -0.21502685546875, -0.19550323486328125, -0.1759796142578125, -0.15645599365234375, -0.136932373046875, -0.11740875244140625, -0.0978851318359375, -0.07836151123046875, -0.058837890625, -0.03931427001953125, -0.0197906494140625, -0.00026702880859375, 0.019256591796875, 0.03878021240234375, 0.0583038330078125, 0.07782745361328125, 0.09735107421875, 0.11687469482421875, 0.1363983154296875, 0.15592193603515625, 0.175445556640625, 0.19496917724609375, 0.2144927978515625, 0.23401641845703125, 0.2535400390625, 0.27306365966796875, 0.2925872802734375, 0.31211090087890625, 0.331634521484375, 0.35115814208984375, 0.3706817626953125, 0.39020538330078125, 0.40972900390625, 0.42925262451171875, 0.4487762451171875, 0.46829986572265625, 0.487823486328125, 0.5073471069335938, 0.5268707275390625, 0.5463943481445312, 0.56591796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 12.0, 19.0, 18.0, 31.0, 40.0, 57.0, 84.0, 127.0, 154.0, 230.0, 319.0, 473.0, 678.0, 972.0, 1470.0, 2292.0, 3674.0, 6585.0, 13201.0, 31474.0, 823311.0, 116963.0, 21702.0, 9984.0, 5410.0, 3137.0, 1941.0, 1315.0, 854.0, 602.0, 418.0, 295.0, 235.0, 142.0, 95.0, 65.0, 54.0, 44.0, 23.0, 19.0, 8.0, 6.0, 9.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009636878967285156, -0.0009324178099632263, -0.000901147723197937, -0.0008698776364326477, -0.0008386075496673584, -0.0008073374629020691, -0.0007760673761367798, -0.0007447972893714905, -0.0007135272026062012, -0.0006822571158409119, -0.0006509870290756226, -0.0006197169423103333, -0.0005884468555450439, -0.0005571767687797546, -0.0005259066820144653, -0.000494636595249176, -0.0004633665084838867, -0.0004320964217185974, -0.0004008263349533081, -0.0003695562481880188, -0.0003382861614227295, -0.0003070160746574402, -0.0002757459878921509, -0.00024447590112686157, -0.00021320581436157227, -0.00018193572759628296, -0.00015066564083099365, -0.00011939555406570435, -8.812546730041504e-05, -5.685538053512573e-05, -2.5585293769836426e-05, 5.684792995452881e-06, 3.695487976074219e-05, 6.82249665260315e-05, 9.94950532913208e-05, 0.0001307651400566101, 0.00016203522682189941, 0.00019330531358718872, 0.00022457540035247803, 0.00025584548711776733, 0.00028711557388305664, 0.00031838566064834595, 0.00034965574741363525, 0.00038092583417892456, 0.00041219592094421387, 0.0004434660077095032, 0.0004747360944747925, 0.0005060061812400818, 0.0005372762680053711, 0.0005685463547706604, 0.0005998164415359497, 0.000631086528301239, 0.0006623566150665283, 0.0006936267018318176, 0.0007248967885971069, 0.0007561668753623962, 0.0007874369621276855, 0.0008187070488929749, 0.0008499771356582642, 0.0008812472224235535, 0.0009125173091888428, 0.0009437873959541321, 0.0009750574827194214, 0.0010063275694847107, 0.00103759765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 11.0, 9.0, 20.0, 62.0, 433.0, 347.0, 48.0, 17.0, 15.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020694732666015625, -0.0002018958330154419, -0.00019684433937072754, -0.00019179284572601318, -0.00018674135208129883, -0.00018168985843658447, -0.00017663836479187012, -0.00017158687114715576, -0.0001665353775024414, -0.00016148388385772705, -0.0001564323902130127, -0.00015138089656829834, -0.00014632940292358398, -0.00014127790927886963, -0.00013622641563415527, -0.00013117492198944092, -0.00012612342834472656, -0.00012107193470001221, -0.00011602044105529785, -0.0001109689474105835, -0.00010591745376586914, -0.00010086596012115479, -9.581446647644043e-05, -9.076297283172607e-05, -8.571147918701172e-05, -8.065998554229736e-05, -7.560849189758301e-05, -7.055699825286865e-05, -6.55055046081543e-05, -6.045401096343994e-05, -5.5402517318725586e-05, -5.035102367401123e-05, -4.5299530029296875e-05, -4.024803638458252e-05, -3.5196542739868164e-05, -3.014504909515381e-05, -2.5093555450439453e-05, -2.0042061805725098e-05, -1.4990568161010742e-05, -9.939074516296387e-06, -4.887580871582031e-06, 1.6391277313232422e-07, 5.21540641784668e-06, 1.0266900062561035e-05, 1.531839370727539e-05, 2.0369887351989746e-05, 2.54213809967041e-05, 3.0472874641418457e-05, 3.552436828613281e-05, 4.057586193084717e-05, 4.5627355575561523e-05, 5.067884922027588e-05, 5.5730342864990234e-05, 6.078183650970459e-05, 6.583333015441895e-05, 7.08848237991333e-05, 7.593631744384766e-05, 8.098781108856201e-05, 8.603930473327637e-05, 9.109079837799072e-05, 9.614229202270508e-05, 0.00010119378566741943, 0.00010624527931213379, 0.00011129677295684814, 0.0001163482666015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 2.0, 6.0, 8.0, 16.0, 29.0, 28.0, 45.0, 49.0, 77.0, 125.0, 194.0, 298.0, 428.0, 712.0, 1091.0, 1712.0, 2877.0, 4837.0, 8957.0, 22674.0, 787448.0, 179026.0, 18418.0, 8097.0, 4406.0, 2600.0, 1589.0, 952.0, 610.0, 432.0, 255.0, 165.0, 113.0, 70.0, 68.0, 43.0, 33.0, 22.0, 12.0, 8.0, 7.0, 2.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004401206970214844, -0.000424899160861969, -0.0004096776247024536, -0.00039445608854293823, -0.00037923455238342285, -0.00036401301622390747, -0.0003487914800643921, -0.0003335699439048767, -0.00031834840774536133, -0.00030312687158584595, -0.00028790533542633057, -0.0002726837992668152, -0.0002574622631072998, -0.00024224072694778442, -0.00022701919078826904, -0.00021179765462875366, -0.00019657611846923828, -0.0001813545823097229, -0.00016613304615020752, -0.00015091150999069214, -0.00013568997383117676, -0.00012046843767166138, -0.000105246901512146, -9.002536535263062e-05, -7.480382919311523e-05, -5.9582293033599854e-05, -4.436075687408447e-05, -2.9139220714569092e-05, -1.3917684555053711e-05, 1.30385160446167e-06, 1.652538776397705e-05, 3.174692392349243e-05, 4.696846008300781e-05, 6.21899962425232e-05, 7.741153240203857e-05, 9.263306856155396e-05, 0.00010785460472106934, 0.00012307614088058472, 0.0001382976770401001, 0.00015351921319961548, 0.00016874074935913086, 0.00018396228551864624, 0.00019918382167816162, 0.000214405357837677, 0.00022962689399719238, 0.00024484843015670776, 0.00026006996631622314, 0.0002752915024757385, 0.0002905130386352539, 0.0003057345747947693, 0.00032095611095428467, 0.00033617764711380005, 0.00035139918327331543, 0.0003666207194328308, 0.0003818422555923462, 0.00039706379175186157, 0.00041228532791137695, 0.00042750686407089233, 0.0004427284002304077, 0.0004579499363899231, 0.0004731714725494385, 0.0004883930087089539, 0.0005036145448684692, 0.0005188360810279846, 0.0005340576171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 3.0, 2.0, 5.0, 6.0, 3.0, 10.0, 12.0, 17.0, 33.0, 60.0, 329.0, 309.0, 87.0, 34.0, 10.0, 11.0, 9.0, 1.0, 5.0, 2.0, 5.0, 2.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010412931442260742, -0.00010040868073701859, -9.668804705142975e-05, -9.296741336584091e-05, -8.924677968025208e-05, -8.552614599466324e-05, -8.18055123090744e-05, -7.808487862348557e-05, -7.436424493789673e-05, -7.064361125230789e-05, -6.692297756671906e-05, -6.320234388113022e-05, -5.948171019554138e-05, -5.5761076509952545e-05, -5.204044282436371e-05, -4.831980913877487e-05, -4.4599175453186035e-05, -4.08785417675972e-05, -3.715790808200836e-05, -3.3437274396419525e-05, -2.971664071083069e-05, -2.5996007025241852e-05, -2.2275373339653015e-05, -1.855473965406418e-05, -1.4834105968475342e-05, -1.1113472282886505e-05, -7.3928385972976685e-06, -3.6722049117088318e-06, 4.842877388000488e-08, 3.7690624594688416e-06, 7.489696145057678e-06, 1.1210329830646515e-05, 1.4930963516235352e-05, 1.8651597201824188e-05, 2.2372230887413025e-05, 2.609286457300186e-05, 2.9813498258590698e-05, 3.3534131944179535e-05, 3.725476562976837e-05, 4.097539931535721e-05, 4.4696033000946045e-05, 4.841666668653488e-05, 5.213730037212372e-05, 5.5857934057712555e-05, 5.957856774330139e-05, 6.329920142889023e-05, 6.701983511447906e-05, 7.07404688000679e-05, 7.446110248565674e-05, 7.818173617124557e-05, 8.190236985683441e-05, 8.562300354242325e-05, 8.934363722801208e-05, 9.306427091360092e-05, 9.678490459918976e-05, 0.0001005055382847786, 0.00010422617197036743, 0.00010794680565595627, 0.0001116674393415451, 0.00011538807302713394, 0.00011910870671272278, 0.00012282934039831161, 0.00012654997408390045, 0.0001302706077694893, 0.00013399124145507812]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 13.0, 36.0, 483.0, 430.0, 38.0, 11.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9797057509422302, -0.8714054226875305, -0.7631050944328308, -0.6548048257827759, -0.5465044975280762, -0.43820416927337646, -0.32990384101867676, -0.22160351276397705, -0.11330318450927734, -0.005002863705158234, 0.10329745709896088, 0.2115977704524994, 0.3198980987071991, 0.4281983971595764, 0.5364987254142761, 0.6447990536689758, 0.7530993819236755, 0.8613997101783752, 0.969700038433075, 1.0780003070831299, 1.1863006353378296, 1.2946009635925293, 1.402901291847229, 1.5112016201019287, 1.6195019483566284, 1.7278022766113281, 1.8361026048660278, 1.9444029331207275, 2.0527031421661377, 2.161003589630127, 2.269303798675537, 2.3776042461395264, 2.4859044551849365, 2.5942046642303467, 2.702505111694336, 2.810805320739746, 2.9191057682037354, 3.0274059772491455, 3.1357064247131348, 3.244006633758545, 3.352307081222534, 3.4606072902679443, 3.5689077377319336, 3.6772079467773438, 3.785508394241333, 3.893808603286743, 4.002109050750732, 4.110409259796143, 4.218709468841553, 4.327009677886963, 4.435309886932373, 4.543610572814941, 4.651910781860352, 4.760210990905762, 4.868511199951172, 4.97681188583374, 5.08511209487915, 5.1934123039245605, 5.301712512969971, 5.410013198852539, 5.518313407897949, 5.626613616943359, 5.7349138259887695, 5.843214511871338, 5.951514720916748]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 12.0, 30.0, 114.0, 243.0, 323.0, 196.0, 75.0, 20.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23198917508125305, -0.1888667792081833, -0.14574438333511353, -0.10262197256088257, -0.059499576687812805, -0.016377180814743042, 0.026745229959487915, 0.06986761093139648, 0.11299002170562744, 0.1561124175786972, 0.19923481345176697, 0.24235722422599792, 0.2854796051979065, 0.32860201597213745, 0.3717244267463684, 0.414846807718277, 0.45796921849250793, 0.5010915994644165, 0.5442140102386475, 0.5873364210128784, 0.6304588317871094, 0.6735812425613403, 0.7167036533355713, 0.7598260045051575, 0.8029484152793884, 0.8460708260536194, 0.8891932368278503, 0.9323155879974365, 0.9754379987716675, 1.0185604095458984, 1.0616828203201294, 1.1048052310943604, 1.1479276418685913, 1.1910500526428223, 1.2341724634170532, 1.2772948741912842, 1.3204172849655151, 1.363539695739746, 1.4066619873046875, 1.4497843980789185, 1.4929068088531494, 1.5360292196273804, 1.5791516304016113, 1.6222740411758423, 1.6653964519500732, 1.7085187435150146, 1.7516412734985352, 1.7947635650634766, 1.837886095046997, 1.881008505821228, 1.924130916595459, 1.96725332736969, 2.010375738143921, 2.0534980297088623, 2.096620559692383, 2.139742851257324, 2.1828651428222656, 2.225987434387207, 2.2691099643707275, 2.312232255935669, 2.3553547859191895, 2.398477077484131, 2.4415996074676514, 2.4847218990325928, 2.5278444290161133]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 9.0, 2.0, 7.0, 5.0, 7.0, 9.0, 11.0, 14.0, 9.0, 8.0, 8.0, 12.0, 10.0, 16.0, 10.0, 11.0, 18.0, 40.0, 68.0, 208.0, 2317.0, 30306.0, 959793.0, 51242.0, 3794.0, 339.0, 68.0, 34.0, 23.0, 16.0, 15.0, 7.0, 11.0, 6.0, 7.0, 7.0, 7.0, 14.0, 8.0, 12.0, 7.0, 7.0, 2.0, 5.0, 5.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.2451171875, -1.2080535888671875, -1.170989990234375, -1.1339263916015625, -1.09686279296875, -1.0597991943359375, -1.022735595703125, -0.9856719970703125, -0.9486083984375, -0.9115447998046875, -0.874481201171875, -0.8374176025390625, -0.80035400390625, -0.7632904052734375, -0.726226806640625, -0.6891632080078125, -0.652099609375, -0.6150360107421875, -0.577972412109375, -0.5409088134765625, -0.50384521484375, -0.4667816162109375, -0.429718017578125, -0.3926544189453125, -0.3555908203125, -0.3185272216796875, -0.281463623046875, -0.2444000244140625, -0.20733642578125, -0.1702728271484375, -0.133209228515625, -0.0961456298828125, -0.05908203125, -0.0220184326171875, 0.015045166015625, 0.0521087646484375, 0.08917236328125, 0.1262359619140625, 0.163299560546875, 0.2003631591796875, 0.2374267578125, 0.2744903564453125, 0.311553955078125, 0.3486175537109375, 0.38568115234375, 0.4227447509765625, 0.459808349609375, 0.4968719482421875, 0.533935546875, 0.5709991455078125, 0.608062744140625, 0.6451263427734375, 0.68218994140625, 0.7192535400390625, 0.756317138671875, 0.7933807373046875, 0.8304443359375, 0.8675079345703125, 0.904571533203125, 0.9416351318359375, 0.97869873046875, 1.0157623291015625, 1.052825927734375, 1.0898895263671875, 1.126953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 13.0, 26.0, 80.0, 205.0, 308.0, 239.0, 100.0, 35.0, 13.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0259857177734375, -0.02297234535217285, -0.019958972930908203, -0.016945600509643555, -0.013932228088378906, -0.010918855667114258, -0.00790548324584961, -0.004892110824584961, -0.0018787384033203125, 0.001134634017944336, 0.004148006439208984, 0.007161378860473633, 0.010174751281738281, 0.01318812370300293, 0.016201496124267578, 0.019214868545532227, 0.022228240966796875, 0.025241613388061523, 0.028254985809326172, 0.03126835823059082, 0.03428173065185547, 0.03729510307312012, 0.040308475494384766, 0.043321847915649414, 0.04633522033691406, 0.04934859275817871, 0.05236196517944336, 0.05537533760070801, 0.058388710021972656, 0.061402082443237305, 0.06441545486450195, 0.0674288272857666, 0.07044219970703125, 0.0734555721282959, 0.07646894454956055, 0.0794823169708252, 0.08249568939208984, 0.08550906181335449, 0.08852243423461914, 0.09153580665588379, 0.09454917907714844, 0.09756255149841309, 0.10057592391967773, 0.10358929634094238, 0.10660266876220703, 0.10961604118347168, 0.11262941360473633, 0.11564278602600098, 0.11865615844726562, 0.12166953086853027, 0.12468290328979492, 0.12769627571105957, 0.13070964813232422, 0.13372302055358887, 0.13673639297485352, 0.13974976539611816, 0.1427631378173828, 0.14577651023864746, 0.1487898826599121, 0.15180325508117676, 0.1548166275024414, 0.15782999992370605, 0.1608433723449707, 0.16385674476623535, 0.1668701171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 3.0, 6.0, 15.0, 18.0, 20.0, 34.0, 39.0, 52.0, 71.0, 126.0, 182.0, 220.0, 341.0, 602.0, 793.0, 1338.0, 2226.0, 3771.0, 6947.0, 13071.0, 28188.0, 77277.0, 465530.0, 328847.0, 65741.0, 25432.0, 12024.0, 6452.0, 3441.0, 2115.0, 1297.0, 750.0, 496.0, 325.0, 234.0, 163.0, 104.0, 71.0, 58.0, 38.0, 26.0, 26.0, 16.0, 9.0, 9.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.11561203002929688, -0.11147308349609375, -0.10733413696289062, -0.1031951904296875, -0.09905624389648438, -0.09491729736328125, -0.09077835083007812, -0.086639404296875, -0.08250045776367188, -0.07836151123046875, -0.07422256469726562, -0.0700836181640625, -0.06594467163085938, -0.06180572509765625, -0.057666778564453125, -0.05352783203125, -0.049388885498046875, -0.04524993896484375, -0.041110992431640625, -0.0369720458984375, -0.032833099365234375, -0.02869415283203125, -0.024555206298828125, -0.020416259765625, -0.016277313232421875, -0.01213836669921875, -0.007999420166015625, -0.0038604736328125, 0.000278472900390625, 0.00441741943359375, 0.008556365966796875, 0.0126953125, 0.016834259033203125, 0.02097320556640625, 0.025112152099609375, 0.0292510986328125, 0.033390045166015625, 0.03752899169921875, 0.041667938232421875, 0.045806884765625, 0.049945831298828125, 0.05408477783203125, 0.058223724365234375, 0.0623626708984375, 0.06650161743164062, 0.07064056396484375, 0.07477951049804688, 0.07891845703125, 0.08305740356445312, 0.08719635009765625, 0.09133529663085938, 0.0954742431640625, 0.09961318969726562, 0.10375213623046875, 0.10789108276367188, 0.112030029296875, 0.11616897583007812, 0.12030792236328125, 0.12444686889648438, 0.1285858154296875, 0.13272476196289062, 0.13686370849609375, 0.14100265502929688, 0.1451416015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 9.0, 7.0, 6.0, 4.0, 9.0, 8.0, 12.0, 12.0, 17.0, 16.0, 19.0, 20.0, 22.0, 27.0, 32.0, 47.0, 60.0, 58.0, 61.0, 69.0, 78.0, 65.0, 54.0, 57.0, 35.0, 31.0, 22.0, 13.0, 14.0, 21.0, 14.0, 11.0, 8.0, 6.0, 12.0, 8.0, 7.0, 9.0, 8.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.047821044921875, -0.04630231857299805, -0.044783592224121094, -0.04326486587524414, -0.04174613952636719, -0.040227413177490234, -0.03870868682861328, -0.03718996047973633, -0.035671234130859375, -0.03415250778198242, -0.03263378143310547, -0.031115055084228516, -0.029596328735351562, -0.02807760238647461, -0.026558876037597656, -0.025040149688720703, -0.02352142333984375, -0.022002696990966797, -0.020483970642089844, -0.01896524429321289, -0.017446517944335938, -0.015927791595458984, -0.014409065246582031, -0.012890338897705078, -0.011371612548828125, -0.009852886199951172, -0.008334159851074219, -0.006815433502197266, -0.0052967071533203125, -0.0037779808044433594, -0.0022592544555664062, -0.0007405281066894531, 0.0007781982421875, 0.002296924591064453, 0.0038156509399414062, 0.005334377288818359, 0.0068531036376953125, 0.008371829986572266, 0.009890556335449219, 0.011409282684326172, 0.012928009033203125, 0.014446735382080078, 0.01596546173095703, 0.017484188079833984, 0.019002914428710938, 0.02052164077758789, 0.022040367126464844, 0.023559093475341797, 0.02507781982421875, 0.026596546173095703, 0.028115272521972656, 0.02963399887084961, 0.031152725219726562, 0.032671451568603516, 0.03419017791748047, 0.03570890426635742, 0.037227630615234375, 0.03874635696411133, 0.04026508331298828, 0.041783809661865234, 0.04330253601074219, 0.04482126235961914, 0.046339988708496094, 0.04785871505737305, 0.04937744140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 10.0, 11.0, 13.0, 24.0, 40.0, 54.0, 95.0, 146.0, 219.0, 386.0, 638.0, 1135.0, 2445.0, 8824.0, 990912.0, 35087.0, 4642.0, 1706.0, 818.0, 473.0, 284.0, 191.0, 119.0, 84.0, 54.0, 43.0, 31.0, 10.0, 15.0, 11.0, 8.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.32672119140625, -4.1651611328125, -4.00360107421875, -3.842041015625, -3.68048095703125, -3.5189208984375, -3.35736083984375, -3.19580078125, -3.03424072265625, -2.8726806640625, -2.71112060546875, -2.549560546875, -2.38800048828125, -2.2264404296875, -2.06488037109375, -1.9033203125, -1.74176025390625, -1.5802001953125, -1.41864013671875, -1.257080078125, -1.09552001953125, -0.9339599609375, -0.77239990234375, -0.61083984375, -0.44927978515625, -0.2877197265625, -0.12615966796875, 0.035400390625, 0.19696044921875, 0.3585205078125, 0.52008056640625, 0.681640625, 0.84320068359375, 1.0047607421875, 1.16632080078125, 1.327880859375, 1.48944091796875, 1.6510009765625, 1.81256103515625, 1.97412109375, 2.13568115234375, 2.2972412109375, 2.45880126953125, 2.620361328125, 2.78192138671875, 2.9434814453125, 3.10504150390625, 3.2666015625, 3.42816162109375, 3.5897216796875, 3.75128173828125, 3.912841796875, 4.07440185546875, 4.2359619140625, 4.39752197265625, 4.55908203125, 4.72064208984375, 4.8822021484375, 5.04376220703125, 5.205322265625, 5.36688232421875, 5.5284423828125, 5.69000244140625, 5.8515625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 19.0, 663.0, 253.0, 21.0, 8.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001811981201171875, -0.001753494143486023, -0.001695007085800171, -0.0016365200281143188, -0.0015780329704284668, -0.0015195459127426147, -0.0014610588550567627, -0.0014025717973709106, -0.0013440847396850586, -0.0012855976819992065, -0.0012271106243133545, -0.0011686235666275024, -0.0011101365089416504, -0.0010516494512557983, -0.0009931623935699463, -0.0009346753358840942, -0.0008761882781982422, -0.0008177012205123901, -0.0007592141628265381, -0.000700727105140686, -0.000642240047454834, -0.0005837529897689819, -0.0005252659320831299, -0.00046677887439727783, -0.0004082918167114258, -0.00034980475902557373, -0.0002913177013397217, -0.00023283064365386963, -0.00017434358596801758, -0.00011585652828216553, -5.7369470596313477e-05, 1.1175870895385742e-06, 5.9604644775390625e-05, 0.00011809170246124268, 0.00017657876014709473, 0.00023506581783294678, 0.00029355287551879883, 0.0003520399332046509, 0.00041052699089050293, 0.000469014048576355, 0.000527501106262207, 0.0005859881639480591, 0.0006444752216339111, 0.0007029622793197632, 0.0007614493370056152, 0.0008199363946914673, 0.0008784234523773193, 0.0009369105100631714, 0.0009953975677490234, 0.0010538846254348755, 0.0011123716831207275, 0.0011708587408065796, 0.0012293457984924316, 0.0012878328561782837, 0.0013463199138641357, 0.0014048069715499878, 0.0014632940292358398, 0.001521781086921692, 0.001580268144607544, 0.001638755202293396, 0.001697242259979248, 0.0017557293176651, 0.0018142163753509521, 0.0018727034330368042, 0.0019311904907226562]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 15.0, 12.0, 24.0, 34.0, 27.0, 42.0, 63.0, 66.0, 106.0, 140.0, 192.0, 271.0, 405.0, 563.0, 863.0, 1501.0, 2665.0, 5683.0, 15651.0, 779582.0, 213525.0, 14828.0, 5590.0, 2567.0, 1378.0, 838.0, 568.0, 387.0, 264.0, 198.0, 122.0, 88.0, 75.0, 51.0, 41.0, 31.0, 29.0, 18.0, 13.0, 11.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.78369140625, -0.759185791015625, -0.73468017578125, -0.710174560546875, -0.6856689453125, -0.661163330078125, -0.63665771484375, -0.612152099609375, -0.587646484375, -0.563140869140625, -0.53863525390625, -0.514129638671875, -0.4896240234375, -0.465118408203125, -0.44061279296875, -0.416107177734375, -0.3916015625, -0.367095947265625, -0.34259033203125, -0.318084716796875, -0.2935791015625, -0.269073486328125, -0.24456787109375, -0.220062255859375, -0.195556640625, -0.171051025390625, -0.14654541015625, -0.122039794921875, -0.0975341796875, -0.073028564453125, -0.04852294921875, -0.024017333984375, 0.00048828125, 0.024993896484375, 0.04949951171875, 0.074005126953125, 0.0985107421875, 0.123016357421875, 0.14752197265625, 0.172027587890625, 0.196533203125, 0.221038818359375, 0.24554443359375, 0.270050048828125, 0.2945556640625, 0.319061279296875, 0.34356689453125, 0.368072509765625, 0.392578125, 0.417083740234375, 0.44158935546875, 0.466094970703125, 0.4906005859375, 0.515106201171875, 0.53961181640625, 0.564117431640625, 0.588623046875, 0.613128662109375, 0.63763427734375, 0.662139892578125, 0.6866455078125, 0.711151123046875, 0.73565673828125, 0.760162353515625, 0.78466796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 11.0, 14.0, 13.0, 33.0, 397.0, 416.0, 22.0, 21.0, 6.0, 10.0, 13.0, 9.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.417236328125, -0.40419769287109375, -0.3911590576171875, -0.37812042236328125, -0.365081787109375, -0.35204315185546875, -0.3390045166015625, -0.32596588134765625, -0.31292724609375, -0.29988861083984375, -0.2868499755859375, -0.27381134033203125, -0.260772705078125, -0.24773406982421875, -0.2346954345703125, -0.22165679931640625, -0.2086181640625, -0.19557952880859375, -0.1825408935546875, -0.16950225830078125, -0.156463623046875, -0.14342498779296875, -0.1303863525390625, -0.11734771728515625, -0.10430908203125, -0.09127044677734375, -0.0782318115234375, -0.06519317626953125, -0.052154541015625, -0.03911590576171875, -0.0260772705078125, -0.01303863525390625, 0.0, 0.01303863525390625, 0.0260772705078125, 0.03911590576171875, 0.052154541015625, 0.06519317626953125, 0.0782318115234375, 0.09127044677734375, 0.10430908203125, 0.11734771728515625, 0.1303863525390625, 0.14342498779296875, 0.156463623046875, 0.16950225830078125, 0.1825408935546875, 0.19557952880859375, 0.2086181640625, 0.22165679931640625, 0.2346954345703125, 0.24773406982421875, 0.260772705078125, 0.27381134033203125, 0.2868499755859375, 0.29988861083984375, 0.31292724609375, 0.32596588134765625, 0.3390045166015625, 0.35204315185546875, 0.365081787109375, 0.37812042236328125, 0.3911590576171875, 0.40419769287109375, 0.417236328125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 14.0, 21.0, 36.0, 102.0, 437.0, 252.0, 60.0, 30.0, 16.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.341251373291016, -17.941007614135742, -17.540761947631836, -17.140518188476562, -16.740272521972656, -16.340028762817383, -15.939783096313477, -15.539538383483887, -15.139293670654297, -14.739048957824707, -14.338804244995117, -13.938559532165527, -13.538314819335938, -13.138070106506348, -12.737825393676758, -12.337580680847168, -11.937335968017578, -11.537091255187988, -11.136846542358398, -10.736601829528809, -10.336357116699219, -9.936112403869629, -9.535867691040039, -9.13562297821045, -8.735379219055176, -8.335134506225586, -7.934889793395996, -7.534645080566406, -7.134400367736816, -6.734155654907227, -6.333910942077637, -5.933666229248047, -5.533421516418457, -5.133176803588867, -4.732932090759277, -4.3326873779296875, -3.9324426651000977, -3.532198190689087, -3.131953477859497, -2.7317087650299072, -2.3314640522003174, -1.9312193393707275, -1.5309746265411377, -1.1307300329208374, -0.7304853200912476, -0.33024072647094727, 0.07000398635864258, 0.4702486991882324, 0.8704934120178223, 1.270738124847412, 1.670982837677002, 2.071227550506592, 2.4714722633361816, 2.8717167377471924, 3.2719614505767822, 3.672206163406372, 4.072450637817383, 4.472695350646973, 4.8729400634765625, 5.273184776306152, 5.673429489135742, 6.073674201965332, 6.473918914794922, 6.874163627624512, 7.274408340454102]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 9.0, 9.0, 5.0, 7.0, 11.0, 15.0, 12.0, 21.0, 21.0, 21.0, 21.0, 28.0, 36.0, 34.0, 38.0, 40.0, 47.0, 36.0, 24.0, 47.0, 47.0, 45.0, 40.0, 36.0, 34.0, 36.0, 37.0, 24.0, 39.0, 20.0, 33.0, 14.0, 25.0, 17.0, 13.0, 11.0, 12.0, 4.0, 7.0, 6.0, 1.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3505553603172302, -0.33817169070243835, -0.32578805088996887, -0.313404381275177, -0.3010207414627075, -0.28863707184791565, -0.2762534022331238, -0.2638697624206543, -0.2514861226081848, -0.23910246789455414, -0.22671881318092346, -0.2143351435661316, -0.2019515037536621, -0.18956783413887024, -0.17718417942523956, -0.1648005247116089, -0.15241685509681702, -0.14003320038318634, -0.12764954566955566, -0.11526588350534439, -0.10288222879171371, -0.09049857407808304, -0.07811491191387177, -0.06573125720024109, -0.05334760248661041, -0.040963947772979736, -0.02858028933405876, -0.016196630895137787, -0.0038129761815071106, 0.008570678532123566, 0.02095434069633484, 0.033337995409965515, 0.04572165012359619, 0.05810530483722687, 0.07048895955085754, 0.08287262171506882, 0.0952562764286995, 0.10763993114233017, 0.12002359330654144, 0.13240724802017212, 0.1447909027338028, 0.15717455744743347, 0.16955821216106415, 0.18194186687469482, 0.1943255364894867, 0.20670917630195618, 0.21909284591674805, 0.23147650063037872, 0.2438601553440094, 0.25624382495880127, 0.26862746477127075, 0.2810111343860626, 0.2933947741985321, 0.305778443813324, 0.31816208362579346, 0.3305457532405853, 0.3429294228553772, 0.35531309247016907, 0.36769673228263855, 0.3800804018974304, 0.3924640417098999, 0.4048477113246918, 0.41723138093948364, 0.4296150207519531, 0.4419986605644226]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 11.0, 8.0, 15.0, 24.0, 24.0, 18.0, 45.0, 78.0, 98.0, 174.0, 250.0, 419.0, 724.0, 1283.0, 2635.0, 5334.0, 12789.0, 36660.0, 4010987.0, 88688.0, 19793.0, 7372.0, 3248.0, 1552.0, 817.0, 453.0, 308.0, 156.0, 114.0, 64.0, 49.0, 24.0, 18.0, 16.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.9827880859375, -3.844482421875, -3.7061767578125, -3.56787109375, -3.4295654296875, -3.291259765625, -3.1529541015625, -3.0146484375, -2.8763427734375, -2.738037109375, -2.5997314453125, -2.46142578125, -2.3231201171875, -2.184814453125, -2.0465087890625, -1.908203125, -1.7698974609375, -1.631591796875, -1.4932861328125, -1.35498046875, -1.2166748046875, -1.078369140625, -0.9400634765625, -0.8017578125, -0.6634521484375, -0.525146484375, -0.3868408203125, -0.24853515625, -0.1102294921875, 0.028076171875, 0.1663818359375, 0.3046875, 0.4429931640625, 0.581298828125, 0.7196044921875, 0.85791015625, 0.9962158203125, 1.134521484375, 1.2728271484375, 1.4111328125, 1.5494384765625, 1.687744140625, 1.8260498046875, 1.96435546875, 2.1026611328125, 2.240966796875, 2.3792724609375, 2.517578125, 2.6558837890625, 2.794189453125, 2.9324951171875, 3.07080078125, 3.2091064453125, 3.347412109375, 3.4857177734375, 3.6240234375, 3.7623291015625, 3.900634765625, 4.0389404296875, 4.17724609375, 4.3155517578125, 4.453857421875, 4.5921630859375, 4.73046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 10.0, 15.0, 15.0, 27.0, 25.0, 27.0, 40.0, 74.0, 125.0, 232.0, 177.0, 62.0, 34.0, 30.0, 32.0, 17.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.214111328125, -0.20908164978027344, -0.20405197143554688, -0.1990222930908203, -0.19399261474609375, -0.1889629364013672, -0.18393325805664062, -0.17890357971191406, -0.1738739013671875, -0.16884422302246094, -0.16381454467773438, -0.1587848663330078, -0.15375518798828125, -0.1487255096435547, -0.14369583129882812, -0.13866615295410156, -0.133636474609375, -0.12860679626464844, -0.12357711791992188, -0.11854743957519531, -0.11351776123046875, -0.10848808288574219, -0.10345840454101562, -0.09842872619628906, -0.0933990478515625, -0.08836936950683594, -0.08333969116210938, -0.07831001281738281, -0.07328033447265625, -0.06825065612792969, -0.06322097778320312, -0.05819129943847656, -0.05316162109375, -0.04813194274902344, -0.043102264404296875, -0.03807258605957031, -0.03304290771484375, -0.028013229370117188, -0.022983551025390625, -0.017953872680664062, -0.0129241943359375, -0.007894515991210938, -0.002864837646484375, 0.0021648406982421875, 0.00719451904296875, 0.012224197387695312, 0.017253875732421875, 0.022283554077148438, 0.027313232421875, 0.03234291076660156, 0.037372589111328125, 0.04240226745605469, 0.04743194580078125, 0.05246162414550781, 0.057491302490234375, 0.06252098083496094, 0.0675506591796875, 0.07258033752441406, 0.07761001586914062, 0.08263969421386719, 0.08766937255859375, 0.09269905090332031, 0.09772872924804688, 0.10275840759277344, 0.1077880859375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 10.0, 11.0, 14.0, 27.0, 38.0, 44.0, 76.0, 125.0, 230.0, 379.0, 711.0, 1366.0, 2873.0, 6802.0, 17946.0, 64879.0, 3980195.0, 83479.0, 20928.0, 7563.0, 3277.0, 1507.0, 752.0, 419.0, 241.0, 150.0, 91.0, 42.0, 37.0, 19.0, 15.0, 6.0, 4.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.779296875, -1.7191162109375, -1.658935546875, -1.5987548828125, -1.53857421875, -1.4783935546875, -1.418212890625, -1.3580322265625, -1.2978515625, -1.2376708984375, -1.177490234375, -1.1173095703125, -1.05712890625, -0.9969482421875, -0.936767578125, -0.8765869140625, -0.81640625, -0.7562255859375, -0.696044921875, -0.6358642578125, -0.57568359375, -0.5155029296875, -0.455322265625, -0.3951416015625, -0.3349609375, -0.2747802734375, -0.214599609375, -0.1544189453125, -0.09423828125, -0.0340576171875, 0.026123046875, 0.0863037109375, 0.146484375, 0.2066650390625, 0.266845703125, 0.3270263671875, 0.38720703125, 0.4473876953125, 0.507568359375, 0.5677490234375, 0.6279296875, 0.6881103515625, 0.748291015625, 0.8084716796875, 0.86865234375, 0.9288330078125, 0.989013671875, 1.0491943359375, 1.109375, 1.1695556640625, 1.229736328125, 1.2899169921875, 1.35009765625, 1.4102783203125, 1.470458984375, 1.5306396484375, 1.5908203125, 1.6510009765625, 1.711181640625, 1.7713623046875, 1.83154296875, 1.8917236328125, 1.951904296875, 2.0120849609375, 2.072265625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 12.0, 10.0, 6.0, 16.0, 12.0, 29.0, 46.0, 79.0, 2671.0, 993.0, 64.0, 25.0, 24.0, 11.0, 10.0, 8.0, 9.0, 4.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4501953125, -0.43350982666015625, -0.4168243408203125, -0.40013885498046875, -0.383453369140625, -0.36676788330078125, -0.3500823974609375, -0.33339691162109375, -0.31671142578125, -0.30002593994140625, -0.2833404541015625, -0.26665496826171875, -0.249969482421875, -0.23328399658203125, -0.2165985107421875, -0.19991302490234375, -0.1832275390625, -0.16654205322265625, -0.1498565673828125, -0.13317108154296875, -0.116485595703125, -0.09980010986328125, -0.0831146240234375, -0.06642913818359375, -0.04974365234375, -0.03305816650390625, -0.0163726806640625, 0.00031280517578125, 0.016998291015625, 0.03368377685546875, 0.0503692626953125, 0.06705474853515625, 0.083740234375, 0.10042572021484375, 0.1171112060546875, 0.13379669189453125, 0.150482177734375, 0.16716766357421875, 0.1838531494140625, 0.20053863525390625, 0.21722412109375, 0.23390960693359375, 0.2505950927734375, 0.26728057861328125, 0.283966064453125, 0.30065155029296875, 0.3173370361328125, 0.33402252197265625, 0.3507080078125, 0.36739349365234375, 0.3840789794921875, 0.40076446533203125, 0.417449951171875, 0.43413543701171875, 0.4508209228515625, 0.46750640869140625, 0.48419189453125, 0.5008773803710938, 0.5175628662109375, 0.5342483520507812, 0.550933837890625, 0.5676193237304688, 0.5843048095703125, 0.6009902954101562, 0.61767578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 20.0, 18.0, 22.0, 48.0, 80.0, 163.0, 231.0, 165.0, 94.0, 59.0, 23.0, 18.0, 21.0, 7.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2225303649902344, -2.1544642448425293, -2.086397886276245, -2.01833176612854, -1.950265645980835, -1.8821994066238403, -1.8141331672668457, -1.7460670471191406, -1.678000807762146, -1.6099345684051514, -1.5418684482574463, -1.4738022089004517, -1.405735969543457, -1.337669849395752, -1.2696036100387573, -1.2015373706817627, -1.1334712505340576, -1.065405011177063, -0.9973388910293579, -0.9292726516723633, -0.8612064719200134, -0.7931402921676636, -0.725074052810669, -0.6570078730583191, -0.5889416933059692, -0.5208755135536194, -0.45280930399894714, -0.3847430944442749, -0.31667691469192505, -0.2486107349395752, -0.18054452538490295, -0.11247831583023071, -0.04441237449645996, 0.023653820157051086, 0.09172001481056213, 0.15978620946407318, 0.22785240411758423, 0.2959185838699341, 0.3639847934246063, 0.43205100297927856, 0.5001171827316284, 0.5681833624839783, 0.6362495422363281, 0.7043157815933228, 0.7723819613456726, 0.8404481410980225, 0.9085143804550171, 0.9765805602073669, 1.0446467399597168, 1.1127129793167114, 1.1807790994644165, 1.2488453388214111, 1.3169114589691162, 1.3849776983261108, 1.4530439376831055, 1.5211100578308105, 1.5891762971878052, 1.6572425365447998, 1.7253086566925049, 1.7933748960494995, 1.8614411354064941, 1.9295072555541992, 1.9975734949111938, 2.0656397342681885, 2.1337058544158936]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 7.0, 4.0, 11.0, 2.0, 9.0, 9.0, 11.0, 15.0, 19.0, 11.0, 25.0, 30.0, 27.0, 27.0, 46.0, 29.0, 46.0, 38.0, 45.0, 50.0, 47.0, 56.0, 42.0, 50.0, 43.0, 46.0, 34.0, 27.0, 33.0, 33.0, 25.0, 17.0, 21.0, 20.0, 9.0, 13.0, 9.0, 5.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4896220266819, -0.4749629497528076, -0.4603038430213928, -0.4456447660923004, -0.4309856593608856, -0.4163265824317932, -0.4016674757003784, -0.387008398771286, -0.3723493218421936, -0.3576902449131012, -0.3430311381816864, -0.328372061252594, -0.3137129545211792, -0.2990538775920868, -0.2843948006629944, -0.2697356939315796, -0.2550765872001648, -0.2404174953699112, -0.2257584035396576, -0.21109932661056519, -0.1964402198791504, -0.18178114295005798, -0.16712205111980438, -0.15246295928955078, -0.13780386745929718, -0.12314477562904358, -0.10848568379878998, -0.09382659941911697, -0.07916750758886337, -0.06450841575860977, -0.04984933137893677, -0.035190239548683167, -0.020531147718429565, -0.005872057750821114, 0.008787032216787338, 0.02344612032175064, 0.03810521215200424, 0.05276430398225784, 0.06742338836193085, 0.08208248019218445, 0.09674157202243805, 0.11140066385269165, 0.12605975568294525, 0.14071884751319885, 0.15537792444229126, 0.17003703117370605, 0.18469610810279846, 0.19935519993305206, 0.21401429176330566, 0.22867338359355927, 0.24333247542381287, 0.2579915523529053, 0.27265065908432007, 0.2873097360134125, 0.3019688129425049, 0.3166279196739197, 0.3312870264053345, 0.3459461033344269, 0.3606052100658417, 0.3752642869949341, 0.3899233937263489, 0.4045824706554413, 0.4192415475845337, 0.4339006543159485, 0.4485597312450409]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 7.0, 2.0, 5.0, 10.0, 9.0, 27.0, 27.0, 42.0, 49.0, 103.0, 173.0, 308.0, 576.0, 1164.0, 3289.0, 11950.0, 75419.0, 816417.0, 116187.0, 15775.0, 4093.0, 1427.0, 633.0, 343.0, 201.0, 114.0, 76.0, 41.0, 23.0, 12.0, 15.0, 9.0, 9.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2447509765625, -0.23767471313476562, -0.23059844970703125, -0.22352218627929688, -0.2164459228515625, -0.20936965942382812, -0.20229339599609375, -0.19521713256835938, -0.188140869140625, -0.18106460571289062, -0.17398834228515625, -0.16691207885742188, -0.1598358154296875, -0.15275955200195312, -0.14568328857421875, -0.13860702514648438, -0.13153076171875, -0.12445449829101562, -0.11737823486328125, -0.11030197143554688, -0.1032257080078125, -0.09614944458007812, -0.08907318115234375, -0.08199691772460938, -0.074920654296875, -0.06784439086914062, -0.06076812744140625, -0.053691864013671875, -0.0466156005859375, -0.039539337158203125, -0.03246307373046875, -0.025386810302734375, -0.018310546875, -0.011234283447265625, -0.00415802001953125, 0.002918243408203125, 0.0099945068359375, 0.017070770263671875, 0.02414703369140625, 0.031223297119140625, 0.038299560546875, 0.045375823974609375, 0.05245208740234375, 0.059528350830078125, 0.0666046142578125, 0.07368087768554688, 0.08075714111328125, 0.08783340454101562, 0.09490966796875, 0.10198593139648438, 0.10906219482421875, 0.11613845825195312, 0.1232147216796875, 0.13029098510742188, 0.13736724853515625, 0.14444351196289062, 0.151519775390625, 0.15859603881835938, 0.16567230224609375, 0.17274856567382812, 0.1798248291015625, 0.18690109252929688, 0.19397735595703125, 0.20105361938476562, 0.2081298828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 8.0, 7.0, 10.0, 11.0, 15.0, 25.0, 32.0, 40.0, 81.0, 66.0, 82.0, 112.0, 102.0, 95.0, 69.0, 64.0, 46.0, 47.0, 28.0, 15.0, 11.0, 14.0, 6.0, 5.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6597213745117188, -0.6402435302734375, -0.6207656860351562, -0.601287841796875, -0.5818099975585938, -0.5623321533203125, -0.5428543090820312, -0.52337646484375, -0.5038986206054688, -0.4844207763671875, -0.46494293212890625, -0.445465087890625, -0.42598724365234375, -0.4065093994140625, -0.38703155517578125, -0.3675537109375, -0.34807586669921875, -0.3285980224609375, -0.30912017822265625, -0.289642333984375, -0.27016448974609375, -0.2506866455078125, -0.23120880126953125, -0.21173095703125, -0.19225311279296875, -0.1727752685546875, -0.15329742431640625, -0.133819580078125, -0.11434173583984375, -0.0948638916015625, -0.07538604736328125, -0.055908203125, -0.03643035888671875, -0.0169525146484375, 0.00252532958984375, 0.022003173828125, 0.04148101806640625, 0.0609588623046875, 0.08043670654296875, 0.09991455078125, 0.11939239501953125, 0.1388702392578125, 0.15834808349609375, 0.177825927734375, 0.19730377197265625, 0.2167816162109375, 0.23625946044921875, 0.2557373046875, 0.27521514892578125, 0.2946929931640625, 0.31417083740234375, 0.333648681640625, 0.35312652587890625, 0.3726043701171875, 0.39208221435546875, 0.41156005859375, 0.43103790283203125, 0.4505157470703125, 0.46999359130859375, 0.489471435546875, 0.5089492797851562, 0.5284271240234375, 0.5479049682617188, 0.5673828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 15.0, 16.0, 22.0, 34.0, 36.0, 47.0, 52.0, 71.0, 85.0, 100.0, 140.0, 209.0, 442.0, 1292.0, 4995.0, 30104.0, 655255.0, 327229.0, 21928.0, 4117.0, 1083.0, 391.0, 197.0, 135.0, 116.0, 73.0, 75.0, 62.0, 51.0, 38.0, 21.0, 35.0, 16.0, 10.0, 9.0, 7.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.03788137435913086, -0.03673076629638672, -0.03558015823364258, -0.03442955017089844, -0.0332789421081543, -0.032128334045410156, -0.030977725982666016, -0.029827117919921875, -0.028676509857177734, -0.027525901794433594, -0.026375293731689453, -0.025224685668945312, -0.024074077606201172, -0.02292346954345703, -0.02177286148071289, -0.02062225341796875, -0.01947164535522461, -0.01832103729248047, -0.017170429229736328, -0.016019821166992188, -0.014869213104248047, -0.013718605041503906, -0.012567996978759766, -0.011417388916015625, -0.010266780853271484, -0.009116172790527344, -0.007965564727783203, -0.0068149566650390625, -0.005664348602294922, -0.004513740539550781, -0.0033631324768066406, -0.0022125244140625, -0.0010619163513183594, 8.869171142578125e-05, 0.0012392997741699219, 0.0023899078369140625, 0.003540515899658203, 0.004691123962402344, 0.005841732025146484, 0.006992340087890625, 0.008142948150634766, 0.009293556213378906, 0.010444164276123047, 0.011594772338867188, 0.012745380401611328, 0.013895988464355469, 0.01504659652709961, 0.01619720458984375, 0.01734781265258789, 0.01849842071533203, 0.019649028778076172, 0.020799636840820312, 0.021950244903564453, 0.023100852966308594, 0.024251461029052734, 0.025402069091796875, 0.026552677154541016, 0.027703285217285156, 0.028853893280029297, 0.030004501342773438, 0.031155109405517578, 0.03230571746826172, 0.03345632553100586, 0.03460693359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 7.0, 9.0, 10.0, 13.0, 20.0, 15.0, 21.0, 21.0, 23.0, 25.0, 30.0, 32.0, 34.0, 40.0, 41.0, 44.0, 46.0, 45.0, 47.0, 38.0, 39.0, 41.0, 35.0, 36.0, 35.0, 36.0, 26.0, 26.0, 26.0, 25.0, 16.0, 11.0, 21.0, 12.0, 12.0, 7.0, 7.0, 6.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9962081909179688, -0.9660491943359375, -0.9358901977539062, -0.905731201171875, -0.8755722045898438, -0.8454132080078125, -0.8152542114257812, -0.78509521484375, -0.7549362182617188, -0.7247772216796875, -0.6946182250976562, -0.664459228515625, -0.6343002319335938, -0.6041412353515625, -0.5739822387695312, -0.5438232421875, -0.5136642456054688, -0.4835052490234375, -0.45334625244140625, -0.423187255859375, -0.39302825927734375, -0.3628692626953125, -0.33271026611328125, -0.30255126953125, -0.27239227294921875, -0.2422332763671875, -0.21207427978515625, -0.181915283203125, -0.15175628662109375, -0.1215972900390625, -0.09143829345703125, -0.061279296875, -0.03112030029296875, -0.0009613037109375, 0.02919769287109375, 0.059356689453125, 0.08951568603515625, 0.1196746826171875, 0.14983367919921875, 0.17999267578125, 0.21015167236328125, 0.2403106689453125, 0.27046966552734375, 0.300628662109375, 0.33078765869140625, 0.3609466552734375, 0.39110565185546875, 0.4212646484375, 0.45142364501953125, 0.4815826416015625, 0.5117416381835938, 0.541900634765625, 0.5720596313476562, 0.6022186279296875, 0.6323776245117188, 0.66253662109375, 0.6926956176757812, 0.7228546142578125, 0.7530136108398438, 0.783172607421875, 0.8133316040039062, 0.8434906005859375, 0.8736495971679688, 0.90380859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 18.0, 19.0, 28.0, 40.0, 29.0, 76.0, 111.0, 164.0, 254.0, 391.0, 582.0, 985.0, 1525.0, 2574.0, 4457.0, 8591.0, 18664.0, 50872.0, 261823.0, 582027.0, 68497.0, 23596.0, 10189.0, 5383.0, 2884.0, 1760.0, 1068.0, 670.0, 443.0, 283.0, 164.0, 117.0, 88.0, 51.0, 45.0, 20.0, 13.0, 17.0, 10.0, 9.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00031685829162597656, -0.0003069937229156494, -0.00029712915420532227, -0.0002872645854949951, -0.00027740001678466797, -0.0002675354480743408, -0.00025767087936401367, -0.0002478063106536865, -0.00023794174194335938, -0.00022807717323303223, -0.00021821260452270508, -0.00020834803581237793, -0.00019848346710205078, -0.00018861889839172363, -0.00017875432968139648, -0.00016888976097106934, -0.0001590251922607422, -0.00014916062355041504, -0.0001392960548400879, -0.00012943148612976074, -0.0001195669174194336, -0.00010970234870910645, -9.98377799987793e-05, -8.997321128845215e-05, -8.0108642578125e-05, -7.024407386779785e-05, -6.03795051574707e-05, -5.0514936447143555e-05, -4.0650367736816406e-05, -3.078579902648926e-05, -2.092123031616211e-05, -1.1056661605834961e-05, -1.1920928955078125e-06, 8.672475814819336e-06, 1.8537044525146484e-05, 2.8401613235473633e-05, 3.826618194580078e-05, 4.813075065612793e-05, 5.799531936645508e-05, 6.785988807678223e-05, 7.772445678710938e-05, 8.758902549743652e-05, 9.745359420776367e-05, 0.00010731816291809082, 0.00011718273162841797, 0.00012704730033874512, 0.00013691186904907227, 0.00014677643775939941, 0.00015664100646972656, 0.0001665055751800537, 0.00017637014389038086, 0.000186234712600708, 0.00019609928131103516, 0.0002059638500213623, 0.00021582841873168945, 0.0002256929874420166, 0.00023555755615234375, 0.0002454221248626709, 0.00025528669357299805, 0.0002651512622833252, 0.00027501583099365234, 0.0002848803997039795, 0.00029474496841430664, 0.0003046095371246338, 0.00031447410583496094]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 14.0, 15.0, 17.0, 31.0, 37.0, 44.0, 69.0, 134.0, 232.0, 126.0, 55.0, 48.0, 35.0, 23.0, 19.0, 17.0, 8.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.343292236328125e-05, -7.093697786331177e-05, -6.844103336334229e-05, -6.59450888633728e-05, -6.344914436340332e-05, -6.095319986343384e-05, -5.8457255363464355e-05, -5.596131086349487e-05, -5.346536636352539e-05, -5.096942186355591e-05, -4.8473477363586426e-05, -4.597753286361694e-05, -4.348158836364746e-05, -4.098564386367798e-05, -3.8489699363708496e-05, -3.5993754863739014e-05, -3.349781036376953e-05, -3.100186586380005e-05, -2.8505921363830566e-05, -2.6009976863861084e-05, -2.35140323638916e-05, -2.101808786392212e-05, -1.8522143363952637e-05, -1.6026198863983154e-05, -1.3530254364013672e-05, -1.103430986404419e-05, -8.538365364074707e-06, -6.042420864105225e-06, -3.546476364135742e-06, -1.0505318641662598e-06, 1.4454126358032227e-06, 3.941357135772705e-06, 6.4373016357421875e-06, 8.93324613571167e-06, 1.1429190635681152e-05, 1.3925135135650635e-05, 1.6421079635620117e-05, 1.89170241355896e-05, 2.1412968635559082e-05, 2.3908913135528564e-05, 2.6404857635498047e-05, 2.890080213546753e-05, 3.139674663543701e-05, 3.3892691135406494e-05, 3.6388635635375977e-05, 3.888458013534546e-05, 4.138052463531494e-05, 4.3876469135284424e-05, 4.6372413635253906e-05, 4.886835813522339e-05, 5.136430263519287e-05, 5.3860247135162354e-05, 5.6356191635131836e-05, 5.885213613510132e-05, 6.13480806350708e-05, 6.384402513504028e-05, 6.633996963500977e-05, 6.883591413497925e-05, 7.133185863494873e-05, 7.382780313491821e-05, 7.63237476348877e-05, 7.881969213485718e-05, 8.131563663482666e-05, 8.381158113479614e-05, 8.630752563476562e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 8.0, 13.0, 19.0, 15.0, 29.0, 23.0, 34.0, 53.0, 86.0, 111.0, 152.0, 200.0, 279.0, 385.0, 548.0, 884.0, 1305.0, 2157.0, 3641.0, 6765.0, 13920.0, 34915.0, 154434.0, 710744.0, 71514.0, 22668.0, 10106.0, 5164.0, 3009.0, 1804.0, 1063.0, 733.0, 540.0, 342.0, 256.0, 160.0, 110.0, 104.0, 64.0, 48.0, 44.0, 30.0, 19.0, 14.0, 12.0, 9.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.00022304058074951172, -0.0002161320298910141, -0.00020922347903251648, -0.00020231492817401886, -0.00019540637731552124, -0.00018849782645702362, -0.000181589275598526, -0.00017468072474002838, -0.00016777217388153076, -0.00016086362302303314, -0.00015395507216453552, -0.0001470465213060379, -0.00014013797044754028, -0.00013322941958904266, -0.00012632086873054504, -0.00011941231787204742, -0.0001125037670135498, -0.00010559521615505219, -9.868666529655457e-05, -9.177811443805695e-05, -8.486956357955933e-05, -7.79610127210617e-05, -7.105246186256409e-05, -6.414391100406647e-05, -5.723536014556885e-05, -5.032680928707123e-05, -4.341825842857361e-05, -3.650970757007599e-05, -2.960115671157837e-05, -2.269260585308075e-05, -1.578405499458313e-05, -8.87550413608551e-06, -1.9669532775878906e-06, 4.941597580909729e-06, 1.1850148439407349e-05, 1.8758699297904968e-05, 2.5667250156402588e-05, 3.257580101490021e-05, 3.948435187339783e-05, 4.639290273189545e-05, 5.3301453590393066e-05, 6.0210004448890686e-05, 6.71185553073883e-05, 7.402710616588593e-05, 8.093565702438354e-05, 8.784420788288116e-05, 9.475275874137878e-05, 0.0001016613095998764, 0.00010856986045837402, 0.00011547841131687164, 0.00012238696217536926, 0.00012929551303386688, 0.0001362040638923645, 0.00014311261475086212, 0.00015002116560935974, 0.00015692971646785736, 0.00016383826732635498, 0.0001707468181848526, 0.00017765536904335022, 0.00018456391990184784, 0.00019147247076034546, 0.00019838102161884308, 0.0002052895724773407, 0.00021219812333583832, 0.00021910667419433594]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 16.0, 11.0, 18.0, 39.0, 47.0, 102.0, 187.0, 215.0, 113.0, 66.0, 48.0, 20.0, 18.0, 15.0, 13.0, 11.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.9767626225948334e-05, -5.748681724071503e-05, -5.520600825548172e-05, -5.292519927024841e-05, -5.0644390285015106e-05, -4.83635812997818e-05, -4.608277231454849e-05, -4.3801963329315186e-05, -4.152115434408188e-05, -3.924034535884857e-05, -3.6959536373615265e-05, -3.467872738838196e-05, -3.239791840314865e-05, -3.0117109417915344e-05, -2.7836300432682037e-05, -2.555549144744873e-05, -2.3274682462215424e-05, -2.0993873476982117e-05, -1.871306449174881e-05, -1.6432255506515503e-05, -1.4151446521282196e-05, -1.187063753604889e-05, -9.589828550815582e-06, -7.309019565582275e-06, -5.0282105803489685e-06, -2.7474015951156616e-06, -4.6659260988235474e-07, 1.8142163753509521e-06, 4.095025360584259e-06, 6.375834345817566e-06, 8.656643331050873e-06, 1.093745231628418e-05, 1.3218261301517487e-05, 1.5499070286750793e-05, 1.77798792719841e-05, 2.0060688257217407e-05, 2.2341497242450714e-05, 2.462230622768402e-05, 2.6903115212917328e-05, 2.9183924198150635e-05, 3.146473318338394e-05, 3.374554216861725e-05, 3.6026351153850555e-05, 3.830716013908386e-05, 4.058796912431717e-05, 4.2868778109550476e-05, 4.514958709478378e-05, 4.743039608001709e-05, 4.97112050652504e-05, 5.1992014050483704e-05, 5.427282303571701e-05, 5.655363202095032e-05, 5.8834441006183624e-05, 6.111524999141693e-05, 6.339605897665024e-05, 6.567686796188354e-05, 6.795767694711685e-05, 7.023848593235016e-05, 7.251929491758347e-05, 7.480010390281677e-05, 7.708091288805008e-05, 7.936172187328339e-05, 8.164253085851669e-05, 8.392333984375e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 13.0, 12.0, 27.0, 37.0, 112.0, 187.0, 319.0, 142.0, 61.0, 32.0, 13.0, 13.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3092880249023438, -1.2689340114593506, -1.2285799980163574, -1.1882259845733643, -1.147871971130371, -1.1075178384780884, -1.0671638250350952, -1.026809811592102, -0.9864557981491089, -0.9461017847061157, -0.9057477712631226, -0.8653936982154846, -0.8250396847724915, -0.7846856713294983, -0.7443315982818604, -0.7039775848388672, -0.663623571395874, -0.6232695579528809, -0.5829155445098877, -0.5425614714622498, -0.5022074580192566, -0.4618534445762634, -0.4214994013309479, -0.3811453580856323, -0.34079134464263916, -0.300437331199646, -0.26008328795433044, -0.2197292596101761, -0.17937523126602173, -0.13902120292186737, -0.09866717457771301, -0.05831313133239746, -0.017958998680114746, 0.022395029664039612, 0.06274905800819397, 0.10310308635234833, 0.14345711469650269, 0.18381114304065704, 0.2241651713848114, 0.26451921463012695, 0.3048732280731201, 0.3452272415161133, 0.38558128476142883, 0.4259353280067444, 0.46628934144973755, 0.5066433548927307, 0.5469974279403687, 0.5873514413833618, 0.627705454826355, 0.6680594682693481, 0.7084134817123413, 0.7487675547599792, 0.7891215682029724, 0.8294755816459656, 0.8698296546936035, 0.9101836681365967, 0.9505376815795898, 0.990891695022583, 1.0312457084655762, 1.0715997219085693, 1.1119537353515625, 1.1523078680038452, 1.1926618814468384, 1.2330158948898315, 1.2733699083328247]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 14.0, 14.0, 17.0, 22.0, 21.0, 29.0, 42.0, 41.0, 45.0, 59.0, 43.0, 58.0, 68.0, 59.0, 68.0, 52.0, 62.0, 45.0, 50.0, 34.0, 29.0, 25.0, 22.0, 22.0, 9.0, 15.0, 10.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18351320922374725, -0.17560678720474243, -0.1677003800868988, -0.15979395806789398, -0.15188753604888916, -0.14398112893104553, -0.1360747069120407, -0.1281682848930359, -0.12026187032461166, -0.11235545575618744, -0.10444903373718262, -0.09654261916875839, -0.08863620460033417, -0.08072978258132935, -0.07282336801290512, -0.0649169534444809, -0.057010531425476074, -0.04910411313176155, -0.04119769483804703, -0.0332912802696228, -0.02538486197590828, -0.017478443682193756, -0.009572029113769531, -0.001665610820055008, 0.006240807473659515, 0.014147224836051464, 0.022053642198443413, 0.029960058629512787, 0.03786647692322731, 0.045772895216941833, 0.05367930978536606, 0.06158572807908058, 0.0694921612739563, 0.07739857584238052, 0.08530499786138535, 0.09321141242980957, 0.10111783444881439, 0.10902424901723862, 0.11693066358566284, 0.12483708560466766, 0.13274350762367249, 0.1406499296426773, 0.14855633676052094, 0.15646275877952576, 0.16436918079853058, 0.1722756028175354, 0.18018200993537903, 0.18808843195438385, 0.19599483907222748, 0.2039012610912323, 0.21180766820907593, 0.21971409022808075, 0.22762051224708557, 0.2355269193649292, 0.24343334138393402, 0.25133976340293884, 0.25924617052078247, 0.2671525776386261, 0.2750590145587921, 0.28296542167663574, 0.29087182879447937, 0.2987782657146454, 0.306684672832489, 0.31459107995033264, 0.32249751687049866]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 8.0, 15.0, 24.0, 33.0, 27.0, 57.0, 70.0, 99.0, 151.0, 195.0, 290.0, 391.0, 517.0, 737.0, 1127.0, 1698.0, 2573.0, 4020.0, 6323.0, 10543.0, 18153.0, 33346.0, 69105.0, 190380.0, 462406.0, 126500.0, 53098.0, 26938.0, 15238.0, 8699.0, 5424.0, 3366.0, 2131.0, 1410.0, 1018.0, 726.0, 453.0, 329.0, 256.0, 167.0, 148.0, 92.0, 60.0, 50.0, 38.0, 23.0, 30.0, 17.0, 15.0, 13.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.2266845703125, -0.21967315673828125, -0.2126617431640625, -0.20565032958984375, -0.198638916015625, -0.19162750244140625, -0.1846160888671875, -0.17760467529296875, -0.17059326171875, -0.16358184814453125, -0.1565704345703125, -0.14955902099609375, -0.142547607421875, -0.13553619384765625, -0.1285247802734375, -0.12151336669921875, -0.114501953125, -0.10749053955078125, -0.1004791259765625, -0.09346771240234375, -0.086456298828125, -0.07944488525390625, -0.0724334716796875, -0.06542205810546875, -0.05841064453125, -0.05139923095703125, -0.0443878173828125, -0.03737640380859375, -0.030364990234375, -0.02335357666015625, -0.0163421630859375, -0.00933074951171875, -0.0023193359375, 0.00469207763671875, 0.0117034912109375, 0.01871490478515625, 0.025726318359375, 0.03273773193359375, 0.0397491455078125, 0.04676055908203125, 0.05377197265625, 0.06078338623046875, 0.0677947998046875, 0.07480621337890625, 0.081817626953125, 0.08882904052734375, 0.0958404541015625, 0.10285186767578125, 0.10986328125, 0.11687469482421875, 0.1238861083984375, 0.13089752197265625, 0.137908935546875, 0.14492034912109375, 0.1519317626953125, 0.15894317626953125, 0.16595458984375, 0.17296600341796875, 0.1799774169921875, 0.18698883056640625, 0.194000244140625, 0.20101165771484375, 0.2080230712890625, 0.21503448486328125, 0.2220458984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 9.0, 7.0, 24.0, 18.0, 38.0, 46.0, 60.0, 80.0, 99.0, 88.0, 105.0, 82.0, 74.0, 65.0, 48.0, 29.0, 28.0, 21.0, 18.0, 14.0, 6.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0341796875, -0.03323698043823242, -0.032294273376464844, -0.031351566314697266, -0.030408859252929688, -0.02946615219116211, -0.02852344512939453, -0.027580738067626953, -0.026638031005859375, -0.025695323944091797, -0.02475261688232422, -0.02380990982055664, -0.022867202758789062, -0.021924495697021484, -0.020981788635253906, -0.020039081573486328, -0.01909637451171875, -0.018153667449951172, -0.017210960388183594, -0.016268253326416016, -0.015325546264648438, -0.01438283920288086, -0.013440132141113281, -0.012497425079345703, -0.011554718017578125, -0.010612010955810547, -0.009669303894042969, -0.00872659683227539, -0.0077838897705078125, -0.006841182708740234, -0.005898475646972656, -0.004955768585205078, -0.0040130615234375, -0.003070354461669922, -0.0021276473999023438, -0.0011849403381347656, -0.0002422332763671875, 0.0007004737854003906, 0.0016431808471679688, 0.002585887908935547, 0.003528594970703125, 0.004471302032470703, 0.005414009094238281, 0.006356716156005859, 0.0072994232177734375, 0.008242130279541016, 0.009184837341308594, 0.010127544403076172, 0.01107025146484375, 0.012012958526611328, 0.012955665588378906, 0.013898372650146484, 0.014841079711914062, 0.01578378677368164, 0.01672649383544922, 0.017669200897216797, 0.018611907958984375, 0.019554615020751953, 0.02049732208251953, 0.02144002914428711, 0.022382736206054688, 0.023325443267822266, 0.024268150329589844, 0.025210857391357422, 0.026153564453125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 4.0, 10.0, 18.0, 21.0, 27.0, 26.0, 46.0, 78.0, 111.0, 121.0, 188.0, 257.0, 318.0, 540.0, 763.0, 1055.0, 1567.0, 2416.0, 3985.0, 6180.0, 10544.0, 18775.0, 36927.0, 83566.0, 276900.0, 395443.0, 109208.0, 44898.0, 22377.0, 12217.0, 7170.0, 4313.0, 2694.0, 1827.0, 1218.0, 823.0, 565.0, 406.0, 264.0, 196.0, 138.0, 99.0, 74.0, 46.0, 43.0, 28.0, 20.0, 16.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.096435546875, -0.09343433380126953, -0.09043312072753906, -0.0874319076538086, -0.08443069458007812, -0.08142948150634766, -0.07842826843261719, -0.07542705535888672, -0.07242584228515625, -0.06942462921142578, -0.06642341613769531, -0.06342220306396484, -0.060420989990234375, -0.057419776916503906, -0.05441856384277344, -0.05141735076904297, -0.0484161376953125, -0.04541492462158203, -0.04241371154785156, -0.039412498474121094, -0.036411285400390625, -0.033410072326660156, -0.030408859252929688, -0.02740764617919922, -0.02440643310546875, -0.02140522003173828, -0.018404006958007812, -0.015402793884277344, -0.012401580810546875, -0.009400367736816406, -0.0063991546630859375, -0.0033979415893554688, -0.000396728515625, 0.0026044845581054688, 0.0056056976318359375, 0.008606910705566406, 0.011608123779296875, 0.014609336853027344, 0.017610549926757812, 0.02061176300048828, 0.02361297607421875, 0.02661418914794922, 0.029615402221679688, 0.032616615295410156, 0.035617828369140625, 0.038619041442871094, 0.04162025451660156, 0.04462146759033203, 0.0476226806640625, 0.05062389373779297, 0.05362510681152344, 0.056626319885253906, 0.059627532958984375, 0.06262874603271484, 0.06562995910644531, 0.06863117218017578, 0.07163238525390625, 0.07463359832763672, 0.07763481140136719, 0.08063602447509766, 0.08363723754882812, 0.0866384506225586, 0.08963966369628906, 0.09264087677001953, 0.09564208984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 11.0, 14.0, 13.0, 15.0, 6.0, 17.0, 19.0, 21.0, 29.0, 32.0, 36.0, 48.0, 55.0, 63.0, 58.0, 54.0, 54.0, 64.0, 54.0, 52.0, 50.0, 36.0, 32.0, 20.0, 22.0, 20.0, 13.0, 12.0, 9.0, 7.0, 8.0, 7.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.056365966796875, -0.05472755432128906, -0.053089141845703125, -0.05145072937011719, -0.04981231689453125, -0.04817390441894531, -0.046535491943359375, -0.04489707946777344, -0.0432586669921875, -0.04162025451660156, -0.039981842041015625, -0.03834342956542969, -0.03670501708984375, -0.03506660461425781, -0.033428192138671875, -0.03178977966308594, -0.0301513671875, -0.028512954711914062, -0.026874542236328125, -0.025236129760742188, -0.02359771728515625, -0.021959304809570312, -0.020320892333984375, -0.018682479858398438, -0.0170440673828125, -0.015405654907226562, -0.013767242431640625, -0.012128829956054688, -0.01049041748046875, -0.008852005004882812, -0.007213592529296875, -0.0055751800537109375, -0.003936767578125, -0.0022983551025390625, -0.000659942626953125, 0.0009784698486328125, 0.00261688232421875, 0.0042552947998046875, 0.005893707275390625, 0.0075321197509765625, 0.0091705322265625, 0.010808944702148438, 0.012447357177734375, 0.014085769653320312, 0.01572418212890625, 0.017362594604492188, 0.019001007080078125, 0.020639419555664062, 0.02227783203125, 0.023916244506835938, 0.025554656982421875, 0.027193069458007812, 0.02883148193359375, 0.030469894409179688, 0.032108306884765625, 0.03374671936035156, 0.0353851318359375, 0.03702354431152344, 0.038661956787109375, 0.04030036926269531, 0.04193878173828125, 0.04357719421386719, 0.045215606689453125, 0.04685401916503906, 0.048492431640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 5.0, 11.0, 6.0, 10.0, 16.0, 19.0, 26.0, 46.0, 57.0, 77.0, 111.0, 210.0, 309.0, 573.0, 1093.0, 2460.0, 9591.0, 1012422.0, 15466.0, 3136.0, 1174.0, 669.0, 398.0, 212.0, 132.0, 91.0, 53.0, 48.0, 34.0, 34.0, 12.0, 15.0, 9.0, 7.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.7459716796875, -4.585693359375, -4.4254150390625, -4.26513671875, -4.1048583984375, -3.944580078125, -3.7843017578125, -3.6240234375, -3.4637451171875, -3.303466796875, -3.1431884765625, -2.98291015625, -2.8226318359375, -2.662353515625, -2.5020751953125, -2.341796875, -2.1815185546875, -2.021240234375, -1.8609619140625, -1.70068359375, -1.5404052734375, -1.380126953125, -1.2198486328125, -1.0595703125, -0.8992919921875, -0.739013671875, -0.5787353515625, -0.41845703125, -0.2581787109375, -0.097900390625, 0.0623779296875, 0.22265625, 0.3829345703125, 0.543212890625, 0.7034912109375, 0.86376953125, 1.0240478515625, 1.184326171875, 1.3446044921875, 1.5048828125, 1.6651611328125, 1.825439453125, 1.9857177734375, 2.14599609375, 2.3062744140625, 2.466552734375, 2.6268310546875, 2.787109375, 2.9473876953125, 3.107666015625, 3.2679443359375, 3.42822265625, 3.5885009765625, 3.748779296875, 3.9090576171875, 4.0693359375, 4.2296142578125, 4.389892578125, 4.5501708984375, 4.71044921875, 4.8707275390625, 5.031005859375, 5.1912841796875, 5.3515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 8.0, 13.0, 56.0, 834.0, 39.0, 13.0, 5.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013418197631835938, -0.0013050884008407593, -0.0012683570384979248, -0.0012316256761550903, -0.0011948943138122559, -0.0011581629514694214, -0.001121431589126587, -0.0010847002267837524, -0.001047968864440918, -0.0010112375020980835, -0.000974506139755249, -0.0009377747774124146, -0.0009010434150695801, -0.0008643120527267456, -0.0008275806903839111, -0.0007908493280410767, -0.0007541179656982422, -0.0007173866033554077, -0.0006806552410125732, -0.0006439238786697388, -0.0006071925163269043, -0.0005704611539840698, -0.0005337297916412354, -0.0004969984292984009, -0.0004602670669555664, -0.00042353570461273193, -0.00038680434226989746, -0.000350072979927063, -0.0003133416175842285, -0.00027661025524139404, -0.00023987889289855957, -0.0002031475305557251, -0.00016641616821289062, -0.00012968480587005615, -9.295344352722168e-05, -5.622208118438721e-05, -1.9490718841552734e-05, 1.7240643501281738e-05, 5.397200584411621e-05, 9.070336818695068e-05, 0.00012743473052978516, 0.00016416609287261963, 0.0002008974552154541, 0.00023762881755828857, 0.00027436017990112305, 0.0003110915422439575, 0.000347822904586792, 0.00038455426692962646, 0.00042128562927246094, 0.0004580169916152954, 0.0004947483539581299, 0.0005314797163009644, 0.0005682110786437988, 0.0006049424409866333, 0.0006416738033294678, 0.0006784051656723022, 0.0007151365280151367, 0.0007518678903579712, 0.0007885992527008057, 0.0008253306150436401, 0.0008620619773864746, 0.0008987933397293091, 0.0009355247020721436, 0.000972256064414978, 0.0010089874267578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 7.0, 10.0, 18.0, 22.0, 24.0, 35.0, 46.0, 65.0, 77.0, 91.0, 135.0, 162.0, 256.0, 323.0, 481.0, 729.0, 987.0, 1534.0, 2250.0, 3592.0, 5991.0, 13290.0, 588805.0, 399843.0, 12844.0, 6129.0, 3735.0, 2172.0, 1449.0, 951.0, 659.0, 495.0, 393.0, 270.0, 176.0, 141.0, 100.0, 87.0, 43.0, 35.0, 28.0, 18.0, 9.0, 12.0, 9.0, 10.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5750656127929688, -0.5558929443359375, -0.5367202758789062, -0.517547607421875, -0.49837493896484375, -0.4792022705078125, -0.46002960205078125, -0.44085693359375, -0.42168426513671875, -0.4025115966796875, -0.38333892822265625, -0.364166259765625, -0.34499359130859375, -0.3258209228515625, -0.30664825439453125, -0.2874755859375, -0.26830291748046875, -0.2491302490234375, -0.22995758056640625, -0.210784912109375, -0.19161224365234375, -0.1724395751953125, -0.15326690673828125, -0.13409423828125, -0.11492156982421875, -0.0957489013671875, -0.07657623291015625, -0.057403564453125, -0.03823089599609375, -0.0190582275390625, 0.00011444091796875, 0.019287109375, 0.03845977783203125, 0.0576324462890625, 0.07680511474609375, 0.095977783203125, 0.11515045166015625, 0.1343231201171875, 0.15349578857421875, 0.17266845703125, 0.19184112548828125, 0.2110137939453125, 0.23018646240234375, 0.249359130859375, 0.26853179931640625, 0.2877044677734375, 0.30687713623046875, 0.3260498046875, 0.34522247314453125, 0.3643951416015625, 0.38356781005859375, 0.402740478515625, 0.42191314697265625, 0.4410858154296875, 0.46025848388671875, 0.47943115234375, 0.49860382080078125, 0.5177764892578125, 0.5369491577148438, 0.556121826171875, 0.5752944946289062, 0.5944671630859375, 0.6136398315429688, 0.6328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 11.0, 47.0, 433.0, 382.0, 40.0, 12.0, 7.0, 4.0, 2.0, 4.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3746299743652344, -0.36327362060546875, -0.3519172668457031, -0.3405609130859375, -0.3292045593261719, -0.31784820556640625, -0.3064918518066406, -0.295135498046875, -0.2837791442871094, -0.27242279052734375, -0.2610664367675781, -0.2497100830078125, -0.23835372924804688, -0.22699737548828125, -0.21564102172851562, -0.20428466796875, -0.19292831420898438, -0.18157196044921875, -0.17021560668945312, -0.1588592529296875, -0.14750289916992188, -0.13614654541015625, -0.12479019165039062, -0.113433837890625, -0.10207748413085938, -0.09072113037109375, -0.07936477661132812, -0.0680084228515625, -0.056652069091796875, -0.04529571533203125, -0.033939361572265625, -0.0225830078125, -0.011226654052734375, 0.00012969970703125, 0.011486053466796875, 0.0228424072265625, 0.034198760986328125, 0.04555511474609375, 0.056911468505859375, 0.068267822265625, 0.07962417602539062, 0.09098052978515625, 0.10233688354492188, 0.1136932373046875, 0.12504959106445312, 0.13640594482421875, 0.14776229858398438, 0.15911865234375, 0.17047500610351562, 0.18183135986328125, 0.19318771362304688, 0.2045440673828125, 0.21590042114257812, 0.22725677490234375, 0.23861312866210938, 0.249969482421875, 0.2613258361816406, 0.27268218994140625, 0.2840385437011719, 0.2953948974609375, 0.3067512512207031, 0.31810760498046875, 0.3294639587402344, 0.3408203125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 8.0, 15.0, 13.0, 38.0, 65.0, 267.0, 395.0, 96.0, 38.0, 22.0, 14.0, 8.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.361732482910156, -6.07496976852417, -5.788207530975342, -5.5014448165893555, -5.214682579040527, -4.927919864654541, -4.641157150268555, -4.354394912719727, -4.06763219833374, -3.780869722366333, -3.494107246398926, -3.2073445320129395, -2.9205820560455322, -2.633819580078125, -2.3470568656921387, -2.0602943897247314, -1.7735319137573242, -1.486769437789917, -1.2000068426132202, -0.9132443070411682, -0.6264817714691162, -0.339719295501709, -0.05295670032501221, 0.23380589485168457, 0.5205683708190918, 0.8073309063911438, 1.0940934419631958, 1.3808560371398926, 1.6676185131072998, 1.954380989074707, 2.2411437034606934, 2.5279061794281006, 2.8146677017211914, 3.1014301776885986, 3.388192653656006, 3.674955368041992, 3.9617178440093994, 4.248480319976807, 4.535243034362793, 4.822005271911621, 5.108767986297607, 5.395530700683594, 5.682292938232422, 5.969055652618408, 6.2558183670043945, 6.542580604553223, 6.829343318939209, 7.116106033325195, 7.402868270874023, 7.68963098526001, 7.976393222808838, 8.263155937194824, 8.549918174743652, 8.836681365966797, 9.123443603515625, 9.410205841064453, 9.696968078613281, 9.98373031616211, 10.270493507385254, 10.557255744934082, 10.84401798248291, 11.130781173706055, 11.417543411254883, 11.704305648803711, 11.991068840026855]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 5.0, 8.0, 8.0, 17.0, 8.0, 10.0, 20.0, 16.0, 19.0, 19.0, 28.0, 21.0, 28.0, 27.0, 26.0, 39.0, 33.0, 39.0, 39.0, 43.0, 44.0, 30.0, 44.0, 29.0, 37.0, 47.0, 27.0, 31.0, 39.0, 37.0, 23.0, 20.0, 15.0, 20.0, 22.0, 8.0, 14.0, 9.0, 11.0, 9.0, 4.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3854639530181885, -0.37170493602752686, -0.35794588923454285, -0.3441868722438812, -0.3304278254508972, -0.3166688084602356, -0.302909791469574, -0.28915074467658997, -0.27539169788360596, -0.26163268089294434, -0.24787363409996033, -0.2341146171092987, -0.2203555703163147, -0.20659655332565308, -0.19283752143383026, -0.17907848954200745, -0.16531947255134583, -0.151560440659523, -0.1378014087677002, -0.12404238432645798, -0.11028335243463516, -0.09652432054281235, -0.08276529610157013, -0.06900626420974731, -0.0552472323179245, -0.041488200426101685, -0.027729172259569168, -0.013970144093036652, -0.00021111220121383667, 0.013547919690608978, 0.027306944131851196, 0.04106597602367401, 0.05482497811317444, 0.06858401000499725, 0.08234304189682007, 0.09610206633806229, 0.1098610982298851, 0.12362013012170792, 0.13737915456295013, 0.15113818645477295, 0.16489721834659576, 0.17865625023841858, 0.1924152821302414, 0.2061743140220642, 0.21993333101272583, 0.23369237780570984, 0.24745139479637146, 0.26121044158935547, 0.2749694585800171, 0.2887284755706787, 0.3024875223636627, 0.31624653935432434, 0.33000558614730835, 0.34376460313796997, 0.3575236201286316, 0.3712826669216156, 0.3850417137145996, 0.39880073070526123, 0.41255977749824524, 0.42631879448890686, 0.44007784128189087, 0.4538368582725525, 0.4675958752632141, 0.4813549220561981, 0.49511393904685974]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 10.0, 17.0, 22.0, 24.0, 43.0, 46.0, 88.0, 101.0, 165.0, 248.0, 378.0, 549.0, 839.0, 1382.0, 2407.0, 4693.0, 10575.0, 35798.0, 4094889.0, 24603.0, 8323.0, 3811.0, 1989.0, 1154.0, 749.0, 447.0, 289.0, 202.0, 143.0, 88.0, 68.0, 41.0, 34.0, 24.0, 15.0, 16.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.824249267578125, -3.68951416015625, -3.554779052734375, -3.4200439453125, -3.285308837890625, -3.15057373046875, -3.015838623046875, -2.881103515625, -2.746368408203125, -2.61163330078125, -2.476898193359375, -2.3421630859375, -2.207427978515625, -2.07269287109375, -1.937957763671875, -1.80322265625, -1.668487548828125, -1.53375244140625, -1.399017333984375, -1.2642822265625, -1.129547119140625, -0.99481201171875, -0.860076904296875, -0.725341796875, -0.590606689453125, -0.45587158203125, -0.321136474609375, -0.1864013671875, -0.051666259765625, 0.08306884765625, 0.217803955078125, 0.3525390625, 0.487274169921875, 0.62200927734375, 0.756744384765625, 0.8914794921875, 1.026214599609375, 1.16094970703125, 1.295684814453125, 1.430419921875, 1.565155029296875, 1.69989013671875, 1.834625244140625, 1.9693603515625, 2.104095458984375, 2.23883056640625, 2.373565673828125, 2.50830078125, 2.643035888671875, 2.77777099609375, 2.912506103515625, 3.0472412109375, 3.181976318359375, 3.31671142578125, 3.451446533203125, 3.586181640625, 3.720916748046875, 3.85565185546875, 3.990386962890625, 4.1251220703125, 4.259857177734375, 4.39459228515625, 4.529327392578125, 4.6640625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 11.0, 13.0, 14.0, 24.0, 27.0, 24.0, 46.0, 98.0, 134.0, 196.0, 134.0, 85.0, 53.0, 30.0, 15.0, 27.0, 11.0, 5.0, 3.0, 9.0, 4.0, 1.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1685791015625, -0.16304588317871094, -0.15751266479492188, -0.1519794464111328, -0.14644622802734375, -0.1409130096435547, -0.13537979125976562, -0.12984657287597656, -0.1243133544921875, -0.11878013610839844, -0.11324691772460938, -0.10771369934082031, -0.10218048095703125, -0.09664726257324219, -0.09111404418945312, -0.08558082580566406, -0.080047607421875, -0.07451438903808594, -0.06898117065429688, -0.06344795227050781, -0.05791473388671875, -0.05238151550292969, -0.046848297119140625, -0.04131507873535156, -0.0357818603515625, -0.030248641967773438, -0.024715423583984375, -0.019182205200195312, -0.01364898681640625, -0.008115768432617188, -0.002582550048828125, 0.0029506683349609375, 0.00848388671875, 0.014017105102539062, 0.019550323486328125, 0.025083541870117188, 0.03061676025390625, 0.03614997863769531, 0.041683197021484375, 0.04721641540527344, 0.0527496337890625, 0.05828285217285156, 0.06381607055664062, 0.06934928894042969, 0.07488250732421875, 0.08041572570800781, 0.08594894409179688, 0.09148216247558594, 0.097015380859375, 0.10254859924316406, 0.10808181762695312, 0.11361503601074219, 0.11914825439453125, 0.12468147277832031, 0.13021469116210938, 0.13574790954589844, 0.1412811279296875, 0.14681434631347656, 0.15234756469726562, 0.1578807830810547, 0.16341400146484375, 0.1689472198486328, 0.17448043823242188, 0.18001365661621094, 0.185546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 6.0, 15.0, 69.0, 406.0, 5185.0, 4175492.0, 12334.0, 618.0, 98.0, 20.0, 12.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.60357666015625, -7.3282470703125, -7.05291748046875, -6.777587890625, -6.50225830078125, -6.2269287109375, -5.95159912109375, -5.67626953125, -5.40093994140625, -5.1256103515625, -4.85028076171875, -4.574951171875, -4.29962158203125, -4.0242919921875, -3.74896240234375, -3.4736328125, -3.19830322265625, -2.9229736328125, -2.64764404296875, -2.372314453125, -2.09698486328125, -1.8216552734375, -1.54632568359375, -1.27099609375, -0.99566650390625, -0.7203369140625, -0.44500732421875, -0.169677734375, 0.10565185546875, 0.3809814453125, 0.65631103515625, 0.931640625, 1.20697021484375, 1.4822998046875, 1.75762939453125, 2.032958984375, 2.30828857421875, 2.5836181640625, 2.85894775390625, 3.13427734375, 3.40960693359375, 3.6849365234375, 3.96026611328125, 4.235595703125, 4.51092529296875, 4.7862548828125, 5.06158447265625, 5.3369140625, 5.61224365234375, 5.8875732421875, 6.16290283203125, 6.438232421875, 6.71356201171875, 6.9888916015625, 7.26422119140625, 7.53955078125, 7.81488037109375, 8.0902099609375, 8.36553955078125, 8.640869140625, 8.91619873046875, 9.1915283203125, 9.46685791015625, 9.7421875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 10.0, 30.0, 104.0, 3747.0, 86.0, 33.0, 12.0, 10.0, 9.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5620651245117188, -0.5416107177734375, -0.5211563110351562, -0.500701904296875, -0.48024749755859375, -0.4597930908203125, -0.43933868408203125, -0.41888427734375, -0.39842987060546875, -0.3779754638671875, -0.35752105712890625, -0.337066650390625, -0.31661224365234375, -0.2961578369140625, -0.27570343017578125, -0.2552490234375, -0.23479461669921875, -0.2143402099609375, -0.19388580322265625, -0.173431396484375, -0.15297698974609375, -0.1325225830078125, -0.11206817626953125, -0.09161376953125, -0.07115936279296875, -0.0507049560546875, -0.03025054931640625, -0.009796142578125, 0.01065826416015625, 0.0311126708984375, 0.05156707763671875, 0.072021484375, 0.09247589111328125, 0.1129302978515625, 0.13338470458984375, 0.153839111328125, 0.17429351806640625, 0.1947479248046875, 0.21520233154296875, 0.23565673828125, 0.25611114501953125, 0.2765655517578125, 0.29701995849609375, 0.317474365234375, 0.33792877197265625, 0.3583831787109375, 0.37883758544921875, 0.3992919921875, 0.41974639892578125, 0.4402008056640625, 0.46065521240234375, 0.481109619140625, 0.5015640258789062, 0.5220184326171875, 0.5424728393554688, 0.56292724609375, 0.5833816528320312, 0.6038360595703125, 0.6242904663085938, 0.644744873046875, 0.6651992797851562, 0.6856536865234375, 0.7061080932617188, 0.7265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 7.0, 13.0, 14.0, 20.0, 22.0, 43.0, 60.0, 75.0, 123.0, 174.0, 127.0, 86.0, 58.0, 50.0, 31.0, 24.0, 17.0, 12.0, 6.0, 11.0, 2.0, 4.0, 6.0, 0.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0336763858795166, -1.0061780214309692, -0.9786795973777771, -0.951181173324585, -0.9236828088760376, -0.8961843848228455, -0.8686859607696533, -0.841187596321106, -0.8136892318725586, -0.7861908078193665, -0.7586924433708191, -0.731194019317627, -0.7036956548690796, -0.6761972308158875, -0.6486988067626953, -0.621200442314148, -0.5937020182609558, -0.5662035942077637, -0.5387052297592163, -0.5112068057060242, -0.4837084412574768, -0.45621001720428467, -0.4287116229534149, -0.40121322870254517, -0.3737148344516754, -0.34621644020080566, -0.3187180459499359, -0.29121965169906616, -0.263721227645874, -0.23622284829616547, -0.20872443914413452, -0.18122604489326477, -0.1537277102470398, -0.12622931599617004, -0.0987309142947197, -0.07123251259326935, -0.0437341183423996, -0.016235724091529846, 0.011262685060501099, 0.03876107931137085, 0.0662594735622406, 0.09375786781311035, 0.1212562695145607, 0.14875467121601105, 0.1762530654668808, 0.20375145971775055, 0.2312498688697815, 0.25874826312065125, 0.286246657371521, 0.31374505162239075, 0.3412434458732605, 0.36874186992645264, 0.396240234375, 0.42373865842819214, 0.4512370526790619, 0.47873544692993164, 0.506233811378479, 0.5337322354316711, 0.5612305998802185, 0.5887290239334106, 0.616227388381958, 0.6437258124351501, 0.6712242364883423, 0.6987226009368896, 0.7262210249900818]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 8.0, 7.0, 5.0, 9.0, 12.0, 9.0, 17.0, 17.0, 26.0, 16.0, 26.0, 31.0, 23.0, 30.0, 33.0, 31.0, 33.0, 38.0, 29.0, 42.0, 32.0, 34.0, 43.0, 27.0, 33.0, 35.0, 27.0, 23.0, 35.0, 31.0, 20.0, 22.0, 22.0, 24.0, 20.0, 14.0, 24.0, 14.0, 11.0, 11.0, 13.0, 9.0, 3.0, 8.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.24702009558677673, -0.2396390736103058, -0.23225806653499603, -0.22487705945968628, -0.21749603748321533, -0.21011501550674438, -0.20273400843143463, -0.19535300135612488, -0.18797197937965393, -0.18059095740318298, -0.17320995032787323, -0.16582894325256348, -0.15844792127609253, -0.15106689929962158, -0.14368589222431183, -0.13630488514900208, -0.12892386317253113, -0.12154284864664078, -0.11416183412075043, -0.10678081959486008, -0.09939980506896973, -0.09201879054307938, -0.08463777601718903, -0.07725676149129868, -0.06987574696540833, -0.062494732439517975, -0.055113717913627625, -0.047732703387737274, -0.040351688861846924, -0.032970674335956573, -0.025589659810066223, -0.018208645284175873, -0.010827615857124329, -0.0034466013312339783, 0.003934413194656372, 0.011315427720546722, 0.018696442246437073, 0.026077456772327423, 0.03345847129821777, 0.040839485824108124, 0.048220500349998474, 0.055601514875888824, 0.06298252940177917, 0.07036354392766953, 0.07774455845355988, 0.08512557297945023, 0.09250658750534058, 0.09988760203123093, 0.10726861655712128, 0.11464963108301163, 0.12203064560890198, 0.12941166758537292, 0.13679267466068268, 0.14417368173599243, 0.15155470371246338, 0.15893572568893433, 0.16631673276424408, 0.17369773983955383, 0.18107876181602478, 0.18845978379249573, 0.19584079086780548, 0.20322179794311523, 0.21060281991958618, 0.21798384189605713, 0.22536484897136688]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 4.0, 16.0, 18.0, 35.0, 56.0, 128.0, 347.0, 1049.0, 6230.0, 238307.0, 790125.0, 10133.0, 1385.0, 371.0, 143.0, 71.0, 40.0, 24.0, 15.0, 13.0, 10.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18247032165527344, -0.17597579956054688, -0.1694812774658203, -0.16298675537109375, -0.1564922332763672, -0.14999771118164062, -0.14350318908691406, -0.1370086669921875, -0.13051414489746094, -0.12401962280273438, -0.11752510070800781, -0.11103057861328125, -0.10453605651855469, -0.09804153442382812, -0.09154701232910156, -0.085052490234375, -0.07855796813964844, -0.07206344604492188, -0.06556892395019531, -0.05907440185546875, -0.05257987976074219, -0.046085357666015625, -0.03959083557128906, -0.0330963134765625, -0.026601791381835938, -0.020107269287109375, -0.013612747192382812, -0.00711822509765625, -0.0006237030029296875, 0.005870819091796875, 0.012365341186523438, 0.01885986328125, 0.025354385375976562, 0.031848907470703125, 0.03834342956542969, 0.04483795166015625, 0.05133247375488281, 0.057826995849609375, 0.06432151794433594, 0.0708160400390625, 0.07731056213378906, 0.08380508422851562, 0.09029960632324219, 0.09679412841796875, 0.10328865051269531, 0.10978317260742188, 0.11627769470214844, 0.122772216796875, 0.12926673889160156, 0.13576126098632812, 0.1422557830810547, 0.14875030517578125, 0.1552448272705078, 0.16173934936523438, 0.16823387145996094, 0.1747283935546875, 0.18122291564941406, 0.18771743774414062, 0.1942119598388672, 0.20070648193359375, 0.2072010040283203, 0.21369552612304688, 0.22019004821777344, 0.2266845703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 13.0, 14.0, 17.0, 24.0, 51.0, 87.0, 131.0, 146.0, 150.0, 112.0, 101.0, 69.0, 46.0, 19.0, 12.0, 5.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.0380859375, -1.0165138244628906, -0.9949417114257812, -0.9733695983886719, -0.9517974853515625, -0.9302253723144531, -0.9086532592773438, -0.8870811462402344, -0.865509033203125, -0.8439369201660156, -0.8223648071289062, -0.8007926940917969, -0.7792205810546875, -0.7576484680175781, -0.7360763549804688, -0.7145042419433594, -0.69293212890625, -0.6713600158691406, -0.6497879028320312, -0.6282157897949219, -0.6066436767578125, -0.5850715637207031, -0.5634994506835938, -0.5419273376464844, -0.520355224609375, -0.4987831115722656, -0.47721099853515625, -0.4556388854980469, -0.4340667724609375, -0.4124946594238281, -0.39092254638671875, -0.3693504333496094, -0.3477783203125, -0.3262062072753906, -0.30463409423828125, -0.2830619812011719, -0.2614898681640625, -0.23991775512695312, -0.21834564208984375, -0.19677352905273438, -0.175201416015625, -0.15362930297851562, -0.13205718994140625, -0.11048507690429688, -0.0889129638671875, -0.06734085083007812, -0.04576873779296875, -0.024196624755859375, -0.00262451171875, 0.018947601318359375, 0.04051971435546875, 0.062091827392578125, 0.0836639404296875, 0.10523605346679688, 0.12680816650390625, 0.14838027954101562, 0.169952392578125, 0.19152450561523438, 0.21309661865234375, 0.23466873168945312, 0.2562408447265625, 0.2778129577636719, 0.29938507080078125, 0.3209571838378906, 0.342529296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 15.0, 45.0, 97.0, 199.0, 388.0, 1220.0, 57650.0, 983203.0, 4693.0, 554.0, 241.0, 123.0, 69.0, 30.0, 17.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05426025390625, -0.05246591567993164, -0.05067157745361328, -0.04887723922729492, -0.04708290100097656, -0.0452885627746582, -0.043494224548339844, -0.041699886322021484, -0.039905548095703125, -0.038111209869384766, -0.036316871643066406, -0.03452253341674805, -0.03272819519042969, -0.030933856964111328, -0.02913951873779297, -0.02734518051147461, -0.02555084228515625, -0.02375650405883789, -0.02196216583251953, -0.020167827606201172, -0.018373489379882812, -0.016579151153564453, -0.014784812927246094, -0.012990474700927734, -0.011196136474609375, -0.009401798248291016, -0.007607460021972656, -0.005813121795654297, -0.0040187835693359375, -0.002224445343017578, -0.00043010711669921875, 0.0013642311096191406, 0.0031585693359375, 0.004952907562255859, 0.006747245788574219, 0.008541584014892578, 0.010335922241210938, 0.012130260467529297, 0.013924598693847656, 0.015718936920166016, 0.017513275146484375, 0.019307613372802734, 0.021101951599121094, 0.022896289825439453, 0.024690628051757812, 0.026484966278076172, 0.02827930450439453, 0.03007364273071289, 0.03186798095703125, 0.03366231918334961, 0.03545665740966797, 0.03725099563598633, 0.03904533386230469, 0.04083967208862305, 0.042634010314941406, 0.044428348541259766, 0.046222686767578125, 0.048017024993896484, 0.049811363220214844, 0.0516057014465332, 0.05340003967285156, 0.05519437789916992, 0.05698871612548828, 0.05878305435180664, 0.060577392578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 9.0, 25.0, 50.0, 60.0, 100.0, 111.0, 119.0, 154.0, 113.0, 92.0, 64.0, 55.0, 28.0, 12.0, 12.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4012908935546875, -1.353363037109375, -1.3054351806640625, -1.25750732421875, -1.2095794677734375, -1.161651611328125, -1.1137237548828125, -1.0657958984375, -1.0178680419921875, -0.969940185546875, -0.9220123291015625, -0.87408447265625, -0.8261566162109375, -0.778228759765625, -0.7303009033203125, -0.682373046875, -0.6344451904296875, -0.586517333984375, -0.5385894775390625, -0.49066162109375, -0.4427337646484375, -0.394805908203125, -0.3468780517578125, -0.2989501953125, -0.2510223388671875, -0.203094482421875, -0.1551666259765625, -0.10723876953125, -0.0593109130859375, -0.011383056640625, 0.0365447998046875, 0.08447265625, 0.1324005126953125, 0.180328369140625, 0.2282562255859375, 0.27618408203125, 0.3241119384765625, 0.372039794921875, 0.4199676513671875, 0.4678955078125, 0.5158233642578125, 0.563751220703125, 0.6116790771484375, 0.65960693359375, 0.7075347900390625, 0.755462646484375, 0.8033905029296875, 0.851318359375, 0.8992462158203125, 0.947174072265625, 0.9951019287109375, 1.04302978515625, 1.0909576416015625, 1.138885498046875, 1.1868133544921875, 1.2347412109375, 1.2826690673828125, 1.330596923828125, 1.3785247802734375, 1.42645263671875, 1.4743804931640625, 1.522308349609375, 1.5702362060546875, 1.6181640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 6.0, 7.0, 14.0, 14.0, 19.0, 32.0, 44.0, 56.0, 98.0, 146.0, 211.0, 393.0, 646.0, 1231.0, 2587.0, 6252.0, 20637.0, 934960.0, 63583.0, 10011.0, 3753.0, 1658.0, 862.0, 478.0, 277.0, 181.0, 113.0, 76.0, 60.0, 38.0, 21.0, 17.0, 10.0, 15.0, 12.0, 8.0, 9.0, 3.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005269050598144531, -0.0005097538232803345, -0.0004926025867462158, -0.00047545135021209717, -0.0004583001136779785, -0.00044114887714385986, -0.0004239976406097412, -0.00040684640407562256, -0.0003896951675415039, -0.00037254393100738525, -0.0003553926944732666, -0.00033824145793914795, -0.0003210902214050293, -0.00030393898487091064, -0.000286787748336792, -0.00026963651180267334, -0.0002524852752685547, -0.00023533403873443604, -0.00021818280220031738, -0.00020103156566619873, -0.00018388032913208008, -0.00016672909259796143, -0.00014957785606384277, -0.00013242661952972412, -0.00011527538299560547, -9.812414646148682e-05, -8.097290992736816e-05, -6.382167339324951e-05, -4.667043685913086e-05, -2.9519200325012207e-05, -1.2367963790893555e-05, 4.783272743225098e-06, 2.193450927734375e-05, 3.90857458114624e-05, 5.6236982345581055e-05, 7.338821887969971e-05, 9.053945541381836e-05, 0.00010769069194793701, 0.00012484192848205566, 0.00014199316501617432, 0.00015914440155029297, 0.00017629563808441162, 0.00019344687461853027, 0.00021059811115264893, 0.00022774934768676758, 0.00024490058422088623, 0.0002620518207550049, 0.00027920305728912354, 0.0002963542938232422, 0.00031350553035736084, 0.0003306567668914795, 0.00034780800342559814, 0.0003649592399597168, 0.00038211047649383545, 0.0003992617130279541, 0.00041641294956207275, 0.0004335641860961914, 0.00045071542263031006, 0.0004678666591644287, 0.00048501789569854736, 0.000502169132232666, 0.0005193203687667847, 0.0005364716053009033, 0.000553622841835022, 0.0005707740783691406]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 3.0, 5.0, 8.0, 14.0, 29.0, 46.0, 95.0, 272.0, 297.0, 97.0, 43.0, 27.0, 9.0, 8.0, 12.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.319978713989258e-05, -3.2017938792705536e-05, -3.0836090445518494e-05, -2.965424209833145e-05, -2.847239375114441e-05, -2.7290545403957367e-05, -2.6108697056770325e-05, -2.4926848709583282e-05, -2.374500036239624e-05, -2.2563152015209198e-05, -2.1381303668022156e-05, -2.0199455320835114e-05, -1.901760697364807e-05, -1.783575862646103e-05, -1.6653910279273987e-05, -1.5472061932086945e-05, -1.4290213584899902e-05, -1.310836523771286e-05, -1.1926516890525818e-05, -1.0744668543338776e-05, -9.562820196151733e-06, -8.380971848964691e-06, -7.199123501777649e-06, -6.017275154590607e-06, -4.8354268074035645e-06, -3.6535784602165222e-06, -2.47173011302948e-06, -1.2898817658424377e-06, -1.0803341865539551e-07, 1.0738149285316467e-06, 2.255663275718689e-06, 3.437511622905731e-06, 4.6193599700927734e-06, 5.801208317279816e-06, 6.983056664466858e-06, 8.1649050116539e-06, 9.346753358840942e-06, 1.0528601706027985e-05, 1.1710450053215027e-05, 1.2892298400402069e-05, 1.4074146747589111e-05, 1.5255995094776154e-05, 1.6437843441963196e-05, 1.7619691789150238e-05, 1.880154013633728e-05, 1.9983388483524323e-05, 2.1165236830711365e-05, 2.2347085177898407e-05, 2.352893352508545e-05, 2.471078187227249e-05, 2.5892630219459534e-05, 2.7074478566646576e-05, 2.8256326913833618e-05, 2.943817526102066e-05, 3.06200236082077e-05, 3.1801871955394745e-05, 3.298372030258179e-05, 3.416556864976883e-05, 3.534741699695587e-05, 3.6529265344142914e-05, 3.7711113691329956e-05, 3.8892962038517e-05, 4.007481038570404e-05, 4.125665873289108e-05, 4.2438507080078125e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 11.0, 10.0, 15.0, 25.0, 33.0, 38.0, 56.0, 79.0, 83.0, 139.0, 187.0, 240.0, 337.0, 481.0, 664.0, 930.0, 1310.0, 1793.0, 2514.0, 3980.0, 8193.0, 31135.0, 723670.0, 232105.0, 22155.0, 6624.0, 3493.0, 2327.0, 1601.0, 1189.0, 839.0, 632.0, 428.0, 334.0, 227.0, 165.0, 135.0, 97.0, 67.0, 66.0, 41.0, 24.0, 15.0, 18.0, 10.0, 11.0, 6.0, 1.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.000164031982421875, -0.00015872158110141754, -0.00015341117978096008, -0.00014810077846050262, -0.00014279037714004517, -0.0001374799758195877, -0.00013216957449913025, -0.0001268591731786728, -0.00012154877185821533, -0.00011623837053775787, -0.00011092796921730042, -0.00010561756789684296, -0.0001003071665763855, -9.499676525592804e-05, -8.968636393547058e-05, -8.437596261501312e-05, -7.906556129455566e-05, -7.37551599740982e-05, -6.844475865364075e-05, -6.313435733318329e-05, -5.782395601272583e-05, -5.251355469226837e-05, -4.720315337181091e-05, -4.1892752051353455e-05, -3.6582350730895996e-05, -3.127194941043854e-05, -2.596154808998108e-05, -2.065114676952362e-05, -1.5340745449066162e-05, -1.0030344128608704e-05, -4.719942808151245e-06, 5.904585123062134e-07, 5.900859832763672e-06, 1.121126115322113e-05, 1.652166247367859e-05, 2.1832063794136047e-05, 2.7142465114593506e-05, 3.2452866435050964e-05, 3.776326775550842e-05, 4.307366907596588e-05, 4.838407039642334e-05, 5.36944717168808e-05, 5.900487303733826e-05, 6.431527435779572e-05, 6.962567567825317e-05, 7.493607699871063e-05, 8.024647831916809e-05, 8.555687963962555e-05, 9.086728096008301e-05, 9.617768228054047e-05, 0.00010148808360099792, 0.00010679848492145538, 0.00011210888624191284, 0.0001174192875623703, 0.00012272968888282776, 0.00012804009020328522, 0.00013335049152374268, 0.00013866089284420013, 0.0001439712941646576, 0.00014928169548511505, 0.0001545920968055725, 0.00015990249812602997, 0.00016521289944648743, 0.00017052330076694489, 0.00017583370208740234]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 4.0, 6.0, 5.0, 13.0, 34.0, 67.0, 137.0, 412.0, 176.0, 62.0, 28.0, 20.0, 6.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.882978439331055e-05, -5.690380930900574e-05, -5.497783422470093e-05, -5.305185914039612e-05, -5.112588405609131e-05, -4.91999089717865e-05, -4.727393388748169e-05, -4.534795880317688e-05, -4.342198371887207e-05, -4.149600863456726e-05, -3.957003355026245e-05, -3.764405846595764e-05, -3.571808338165283e-05, -3.379210829734802e-05, -3.186613321304321e-05, -2.9940158128738403e-05, -2.8014183044433594e-05, -2.6088207960128784e-05, -2.4162232875823975e-05, -2.2236257791519165e-05, -2.0310282707214355e-05, -1.8384307622909546e-05, -1.6458332538604736e-05, -1.4532357454299927e-05, -1.2606382369995117e-05, -1.0680407285690308e-05, -8.754432201385498e-06, -6.8284571170806885e-06, -4.902482032775879e-06, -2.9765069484710693e-06, -1.0505318641662598e-06, 8.754432201385498e-07, 2.8014183044433594e-06, 4.727393388748169e-06, 6.6533684730529785e-06, 8.579343557357788e-06, 1.0505318641662598e-05, 1.2431293725967407e-05, 1.4357268810272217e-05, 1.6283243894577026e-05, 1.8209218978881836e-05, 2.0135194063186646e-05, 2.2061169147491455e-05, 2.3987144231796265e-05, 2.5913119316101074e-05, 2.7839094400405884e-05, 2.9765069484710693e-05, 3.16910445690155e-05, 3.361701965332031e-05, 3.554299473762512e-05, 3.746896982192993e-05, 3.939494490623474e-05, 4.132091999053955e-05, 4.324689507484436e-05, 4.517287015914917e-05, 4.709884524345398e-05, 4.902482032775879e-05, 5.09507954120636e-05, 5.287677049636841e-05, 5.480274558067322e-05, 5.672872066497803e-05, 5.865469574928284e-05, 6.0580670833587646e-05, 6.250664591789246e-05, 6.443262100219727e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 7.0, 12.0, 17.0, 24.0, 26.0, 38.0, 70.0, 89.0, 151.0, 183.0, 104.0, 87.0, 56.0, 34.0, 31.0, 18.0, 8.0, 3.0, 9.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6227833032608032, -0.6060669422149658, -0.5893505811691284, -0.5726341605186462, -0.5559177994728088, -0.5392014384269714, -0.5224850177764893, -0.5057686567306519, -0.48905229568481445, -0.47233593463897705, -0.45561954379081726, -0.43890315294265747, -0.42218679189682007, -0.40547043085098267, -0.3887540400028229, -0.3720376491546631, -0.3553212881088257, -0.3386049270629883, -0.3218885362148285, -0.3051721453666687, -0.2884557843208313, -0.2717394232749939, -0.2550230324268341, -0.2383066564798355, -0.22159028053283691, -0.20487390458583832, -0.18815752863883972, -0.17144115269184113, -0.15472477674484253, -0.13800840079784393, -0.12129202485084534, -0.10457564890384674, -0.08785927295684814, -0.07114289700984955, -0.05442652106285095, -0.037710145115852356, -0.02099376916885376, -0.004277393221855164, 0.012438982725143433, 0.02915535867214203, 0.045871734619140625, 0.06258811056613922, 0.07930448651313782, 0.09602086246013641, 0.11273723840713501, 0.1294536143541336, 0.1461699903011322, 0.1628863662481308, 0.1796027421951294, 0.196319118142128, 0.2130354940891266, 0.22975187003612518, 0.24646824598312378, 0.2631846070289612, 0.27990099787712097, 0.29661738872528076, 0.31333374977111816, 0.33005011081695557, 0.34676650166511536, 0.36348289251327515, 0.38019925355911255, 0.39691561460494995, 0.41363200545310974, 0.43034839630126953, 0.44706475734710693]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 9.0, 8.0, 7.0, 7.0, 11.0, 13.0, 16.0, 14.0, 21.0, 19.0, 27.0, 35.0, 26.0, 30.0, 26.0, 35.0, 43.0, 43.0, 34.0, 39.0, 39.0, 32.0, 42.0, 33.0, 39.0, 34.0, 24.0, 29.0, 36.0, 24.0, 28.0, 20.0, 20.0, 25.0, 19.0, 13.0, 16.0, 11.0, 14.0, 9.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.14444056153297424, -0.14018818736076355, -0.13593582808971405, -0.13168345391750336, -0.12743109464645386, -0.12317872047424316, -0.11892635375261307, -0.11467398703098297, -0.11042161285877228, -0.10616924613714218, -0.10191687941551208, -0.09766450524330139, -0.0934121385216713, -0.0891597718000412, -0.0849074050784111, -0.080655038356781, -0.07640267163515091, -0.07215030491352081, -0.06789793819189072, -0.06364557147026062, -0.05939319729804993, -0.05514083057641983, -0.050888463854789734, -0.04663609713315964, -0.04238372668623924, -0.038131359964609146, -0.03387898951768875, -0.029626622796058655, -0.02537425421178341, -0.021121885627508163, -0.016869518905878067, -0.012617150321602821, -0.008364781737327576, -0.004112413618713617, 0.00013995449990034103, 0.004392322152853012, 0.008644690737128258, 0.012897059321403503, 0.0171494260430336, 0.021401794627308846, 0.02565416321158409, 0.029906531795859337, 0.03415890038013458, 0.03841126710176468, 0.042663633823394775, 0.04691600427031517, 0.05116837099194527, 0.05542074143886566, 0.05967310816049576, 0.06392547488212585, 0.06817784160375595, 0.07243020832538605, 0.07668258249759674, 0.08093494921922684, 0.08518731594085693, 0.08943968266248703, 0.09369204938411713, 0.09794441610574722, 0.10219678282737732, 0.10644915699958801, 0.11070152372121811, 0.1149538904428482, 0.1192062571644783, 0.1234586238861084, 0.1277109980583191]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 7.0, 8.0, 3.0, 5.0, 10.0, 11.0, 10.0, 25.0, 39.0, 47.0, 74.0, 992.0, 970161.0, 76642.0, 269.0, 75.0, 43.0, 36.0, 23.0, 9.0, 3.0, 8.0, 3.0, 6.0, 7.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.193359375, -3.099029541015625, -3.00469970703125, -2.910369873046875, -2.8160400390625, -2.721710205078125, -2.62738037109375, -2.533050537109375, -2.438720703125, -2.344390869140625, -2.25006103515625, -2.155731201171875, -2.0614013671875, -1.967071533203125, -1.87274169921875, -1.778411865234375, -1.68408203125, -1.589752197265625, -1.49542236328125, -1.401092529296875, -1.3067626953125, -1.212432861328125, -1.11810302734375, -1.023773193359375, -0.929443359375, -0.835113525390625, -0.74078369140625, -0.646453857421875, -0.5521240234375, -0.457794189453125, -0.36346435546875, -0.269134521484375, -0.1748046875, -0.080474853515625, 0.01385498046875, 0.108184814453125, 0.2025146484375, 0.296844482421875, 0.39117431640625, 0.485504150390625, 0.579833984375, 0.674163818359375, 0.76849365234375, 0.862823486328125, 0.9571533203125, 1.051483154296875, 1.14581298828125, 1.240142822265625, 1.33447265625, 1.428802490234375, 1.52313232421875, 1.617462158203125, 1.7117919921875, 1.806121826171875, 1.90045166015625, 1.994781494140625, 2.089111328125, 2.183441162109375, 2.27777099609375, 2.372100830078125, 2.4664306640625, 2.560760498046875, 2.65509033203125, 2.749420166015625, 2.84375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 13.0, 35.0, 68.0, 139.0, 167.0, 182.0, 159.0, 108.0, 68.0, 30.0, 13.0, 11.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.099853515625, -0.09791088104248047, -0.09596824645996094, -0.0940256118774414, -0.09208297729492188, -0.09014034271240234, -0.08819770812988281, -0.08625507354736328, -0.08431243896484375, -0.08236980438232422, -0.08042716979980469, -0.07848453521728516, -0.07654190063476562, -0.0745992660522461, -0.07265663146972656, -0.07071399688720703, -0.0687713623046875, -0.06682872772216797, -0.06488609313964844, -0.0629434585571289, -0.061000823974609375, -0.059058189392089844, -0.05711555480957031, -0.05517292022705078, -0.05323028564453125, -0.05128765106201172, -0.04934501647949219, -0.047402381896972656, -0.045459747314453125, -0.043517112731933594, -0.04157447814941406, -0.03963184356689453, -0.037689208984375, -0.03574657440185547, -0.03380393981933594, -0.031861305236816406, -0.029918670654296875, -0.027976036071777344, -0.026033401489257812, -0.02409076690673828, -0.02214813232421875, -0.02020549774169922, -0.018262863159179688, -0.016320228576660156, -0.014377593994140625, -0.012434959411621094, -0.010492324829101562, -0.008549690246582031, -0.0066070556640625, -0.004664421081542969, -0.0027217864990234375, -0.0007791519165039062, 0.001163482666015625, 0.0031061172485351562, 0.0050487518310546875, 0.006991386413574219, 0.00893402099609375, 0.010876655578613281, 0.012819290161132812, 0.014761924743652344, 0.016704559326171875, 0.018647193908691406, 0.020589828491210938, 0.02253246307373047, 0.02447509765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 5.0, 11.0, 11.0, 17.0, 23.0, 27.0, 59.0, 92.0, 157.0, 259.0, 400.0, 638.0, 1074.0, 1739.0, 3207.0, 6668.0, 15175.0, 42481.0, 172278.0, 630926.0, 116240.0, 32434.0, 12212.0, 5521.0, 2850.0, 1582.0, 911.0, 577.0, 348.0, 206.0, 135.0, 80.0, 62.0, 29.0, 27.0, 18.0, 16.0, 10.0, 8.0, 7.0, 8.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11981201171875, -0.11611175537109375, -0.1124114990234375, -0.10871124267578125, -0.105010986328125, -0.10131072998046875, -0.0976104736328125, -0.09391021728515625, -0.0902099609375, -0.08650970458984375, -0.0828094482421875, -0.07910919189453125, -0.075408935546875, -0.07170867919921875, -0.0680084228515625, -0.06430816650390625, -0.06060791015625, -0.05690765380859375, -0.0532073974609375, -0.04950714111328125, -0.045806884765625, -0.04210662841796875, -0.0384063720703125, -0.03470611572265625, -0.031005859375, -0.02730560302734375, -0.0236053466796875, -0.01990509033203125, -0.016204833984375, -0.01250457763671875, -0.0088043212890625, -0.00510406494140625, -0.00140380859375, 0.00229644775390625, 0.0059967041015625, 0.00969696044921875, 0.013397216796875, 0.01709747314453125, 0.0207977294921875, 0.02449798583984375, 0.0281982421875, 0.03189849853515625, 0.0355987548828125, 0.03929901123046875, 0.042999267578125, 0.04669952392578125, 0.0503997802734375, 0.05410003662109375, 0.05780029296875, 0.06150054931640625, 0.0652008056640625, 0.06890106201171875, 0.072601318359375, 0.07630157470703125, 0.0800018310546875, 0.08370208740234375, 0.08740234375, 0.09110260009765625, 0.0948028564453125, 0.09850311279296875, 0.102203369140625, 0.10590362548828125, 0.1096038818359375, 0.11330413818359375, 0.11700439453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 12.0, 17.0, 21.0, 25.0, 36.0, 40.0, 52.0, 64.0, 59.0, 60.0, 75.0, 82.0, 63.0, 63.0, 52.0, 49.0, 50.0, 30.0, 27.0, 26.0, 16.0, 10.0, 5.0, 8.0, 8.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.048858642578125, -0.0473475456237793, -0.045836448669433594, -0.04432535171508789, -0.04281425476074219, -0.041303157806396484, -0.03979206085205078, -0.03828096389770508, -0.036769866943359375, -0.03525876998901367, -0.03374767303466797, -0.032236576080322266, -0.030725479125976562, -0.02921438217163086, -0.027703285217285156, -0.026192188262939453, -0.02468109130859375, -0.023169994354248047, -0.021658897399902344, -0.02014780044555664, -0.018636703491210938, -0.017125606536865234, -0.015614509582519531, -0.014103412628173828, -0.012592315673828125, -0.011081218719482422, -0.009570121765136719, -0.008059024810791016, -0.0065479278564453125, -0.005036830902099609, -0.0035257339477539062, -0.002014636993408203, -0.0005035400390625, 0.0010075569152832031, 0.0025186538696289062, 0.004029750823974609, 0.0055408477783203125, 0.007051944732666016, 0.008563041687011719, 0.010074138641357422, 0.011585235595703125, 0.013096332550048828, 0.014607429504394531, 0.016118526458740234, 0.017629623413085938, 0.01914072036743164, 0.020651817321777344, 0.022162914276123047, 0.02367401123046875, 0.025185108184814453, 0.026696205139160156, 0.02820730209350586, 0.029718399047851562, 0.031229496002197266, 0.03274059295654297, 0.03425168991088867, 0.035762786865234375, 0.03727388381958008, 0.03878498077392578, 0.040296077728271484, 0.04180717468261719, 0.04331827163696289, 0.044829368591308594, 0.0463404655456543, 0.0478515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 8.0, 13.0, 11.0, 12.0, 18.0, 32.0, 34.0, 52.0, 79.0, 85.0, 156.0, 193.0, 321.0, 519.0, 1013.0, 2363.0, 7430.0, 908463.0, 117191.0, 6157.0, 2027.0, 885.0, 482.0, 310.0, 200.0, 133.0, 92.0, 59.0, 56.0, 27.0, 26.0, 18.0, 16.0, 10.0, 14.0, 8.0, 7.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.376708984375, -0.3652687072753906, -0.35382843017578125, -0.3423881530761719, -0.3309478759765625, -0.3195075988769531, -0.30806732177734375, -0.2966270446777344, -0.285186767578125, -0.2737464904785156, -0.26230621337890625, -0.2508659362792969, -0.2394256591796875, -0.22798538208007812, -0.21654510498046875, -0.20510482788085938, -0.19366455078125, -0.18222427368164062, -0.17078399658203125, -0.15934371948242188, -0.1479034423828125, -0.13646316528320312, -0.12502288818359375, -0.11358261108398438, -0.102142333984375, -0.09070205688476562, -0.07926177978515625, -0.06782150268554688, -0.0563812255859375, -0.044940948486328125, -0.03350067138671875, -0.022060394287109375, -0.0106201171875, 0.000820159912109375, 0.01226043701171875, 0.023700714111328125, 0.0351409912109375, 0.046581268310546875, 0.05802154541015625, 0.06946182250976562, 0.080902099609375, 0.09234237670898438, 0.10378265380859375, 0.11522293090820312, 0.1266632080078125, 0.13810348510742188, 0.14954376220703125, 0.16098403930664062, 0.17242431640625, 0.18386459350585938, 0.19530487060546875, 0.20674514770507812, 0.2181854248046875, 0.22962570190429688, 0.24106597900390625, 0.2525062561035156, 0.263946533203125, 0.2753868103027344, 0.28682708740234375, 0.2982673645019531, 0.3097076416015625, 0.3211479187011719, 0.33258819580078125, 0.3440284729003906, 0.35546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 16.0, 51.0, 378.0, 412.0, 44.0, 25.0, 16.0, 16.0, 10.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010573863983154297, -0.00010093115270137787, -9.612366557121277e-05, -9.131617844104767e-05, -8.650869131088257e-05, -8.170120418071747e-05, -7.689371705055237e-05, -7.208622992038727e-05, -6.727874279022217e-05, -6.247125566005707e-05, -5.766376852989197e-05, -5.285628139972687e-05, -4.804879426956177e-05, -4.324130713939667e-05, -3.843382000923157e-05, -3.362633287906647e-05, -2.8818845748901367e-05, -2.4011358618736267e-05, -1.9203871488571167e-05, -1.4396384358406067e-05, -9.588897228240967e-06, -4.781410098075867e-06, 2.60770320892334e-08, 4.8335641622543335e-06, 9.641051292419434e-06, 1.4448538422584534e-05, 1.9256025552749634e-05, 2.4063512682914734e-05, 2.8870999813079834e-05, 3.3678486943244934e-05, 3.8485974073410034e-05, 4.3293461203575134e-05, 4.8100948333740234e-05, 5.2908435463905334e-05, 5.7715922594070435e-05, 6.252340972423553e-05, 6.733089685440063e-05, 7.213838398456573e-05, 7.694587111473083e-05, 8.175335824489594e-05, 8.656084537506104e-05, 9.136833250522614e-05, 9.617581963539124e-05, 0.00010098330676555634, 0.00010579079389572144, 0.00011059828102588654, 0.00011540576815605164, 0.00012021325528621674, 0.00012502074241638184, 0.00012982822954654694, 0.00013463571667671204, 0.00013944320380687714, 0.00014425069093704224, 0.00014905817806720734, 0.00015386566519737244, 0.00015867315232753754, 0.00016348063945770264, 0.00016828812658786774, 0.00017309561371803284, 0.00017790310084819794, 0.00018271058797836304, 0.00018751807510852814, 0.00019232556223869324, 0.00019713304936885834, 0.00020194053649902344]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 12.0, 14.0, 16.0, 27.0, 43.0, 54.0, 94.0, 139.0, 222.0, 344.0, 598.0, 1033.0, 1912.0, 4147.0, 12651.0, 205747.0, 797063.0, 14947.0, 4627.0, 2090.0, 1126.0, 638.0, 369.0, 221.0, 130.0, 101.0, 59.0, 40.0, 28.0, 18.0, 13.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163330078125, -0.1588001251220703, -0.15427017211914062, -0.14974021911621094, -0.14521026611328125, -0.14068031311035156, -0.13615036010742188, -0.1316204071044922, -0.1270904541015625, -0.12256050109863281, -0.11803054809570312, -0.11350059509277344, -0.10897064208984375, -0.10444068908691406, -0.09991073608398438, -0.09538078308105469, -0.090850830078125, -0.08632087707519531, -0.08179092407226562, -0.07726097106933594, -0.07273101806640625, -0.06820106506347656, -0.06367111206054688, -0.05914115905761719, -0.0546112060546875, -0.05008125305175781, -0.045551300048828125, -0.04102134704589844, -0.03649139404296875, -0.03196144104003906, -0.027431488037109375, -0.022901535034179688, -0.01837158203125, -0.013841629028320312, -0.009311676025390625, -0.0047817230224609375, -0.00025177001953125, 0.0042781829833984375, 0.008808135986328125, 0.013338088989257812, 0.0178680419921875, 0.022397994995117188, 0.026927947998046875, 0.03145790100097656, 0.03598785400390625, 0.04051780700683594, 0.045047760009765625, 0.04957771301269531, 0.054107666015625, 0.05863761901855469, 0.06316757202148438, 0.06769752502441406, 0.07222747802734375, 0.07675743103027344, 0.08128738403320312, 0.08581733703613281, 0.0903472900390625, 0.09487724304199219, 0.09940719604492188, 0.10393714904785156, 0.10846710205078125, 0.11299705505371094, 0.11752700805664062, 0.12205696105957031, 0.1265869140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 12.0, 19.0, 29.0, 71.0, 291.0, 410.0, 64.0, 32.0, 21.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0703125, -0.06836271286010742, -0.06641292572021484, -0.06446313858032227, -0.06251335144042969, -0.06056356430053711, -0.05861377716064453, -0.05666399002075195, -0.054714202880859375, -0.0527644157409668, -0.05081462860107422, -0.04886484146118164, -0.04691505432128906, -0.044965267181396484, -0.043015480041503906, -0.04106569290161133, -0.03911590576171875, -0.03716611862182617, -0.035216331481933594, -0.033266544342041016, -0.03131675720214844, -0.02936697006225586, -0.02741718292236328, -0.025467395782470703, -0.023517608642578125, -0.021567821502685547, -0.01961803436279297, -0.01766824722290039, -0.015718460083007812, -0.013768672943115234, -0.011818885803222656, -0.009869098663330078, -0.0079193115234375, -0.005969524383544922, -0.004019737243652344, -0.0020699501037597656, -0.0001201629638671875, 0.0018296241760253906, 0.0037794113159179688, 0.005729198455810547, 0.007678985595703125, 0.009628772735595703, 0.011578559875488281, 0.01352834701538086, 0.015478134155273438, 0.017427921295166016, 0.019377708435058594, 0.021327495574951172, 0.02327728271484375, 0.025227069854736328, 0.027176856994628906, 0.029126644134521484, 0.031076431274414062, 0.03302621841430664, 0.03497600555419922, 0.0369257926940918, 0.038875579833984375, 0.04082536697387695, 0.04277515411376953, 0.04472494125366211, 0.04667472839355469, 0.048624515533447266, 0.050574302673339844, 0.05252408981323242, 0.054473876953125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 18.0, 16.0, 28.0, 48.0, 105.0, 225.0, 254.0, 130.0, 78.0, 31.0, 13.0, 7.0, 9.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5683838129043579, -0.5517370700836182, -0.5350902676582336, -0.5184435248374939, -0.5017967224121094, -0.48514997959136963, -0.4685032367706299, -0.45185646414756775, -0.4352096915245056, -0.4185629189014435, -0.40191614627838135, -0.3852694034576416, -0.36862263083457947, -0.35197585821151733, -0.3353291153907776, -0.31868234276771545, -0.3020355701446533, -0.2853887975215912, -0.26874202489852905, -0.2520952820777893, -0.23544850945472717, -0.21880173683166504, -0.2021549791097641, -0.18550822138786316, -0.16886144876480103, -0.1522146761417389, -0.13556791841983795, -0.11892115324735641, -0.10227438807487488, -0.08562762290239334, -0.0689808577299118, -0.05233409255743027, -0.03568735718727112, -0.01904059201478958, -0.0023938268423080444, 0.014252938330173492, 0.03089970350265503, 0.047546468675136566, 0.0641932338476181, 0.08083999902009964, 0.09748676419258118, 0.11413352936506271, 0.13078029453754425, 0.1474270522594452, 0.16407382488250732, 0.18072059750556946, 0.1973673552274704, 0.21401411294937134, 0.23066088557243347, 0.2473076581954956, 0.26395440101623535, 0.2806011736392975, 0.2972479462623596, 0.31389471888542175, 0.3305414915084839, 0.34718823432922363, 0.36383500695228577, 0.3804817795753479, 0.39712852239608765, 0.4137752950191498, 0.4304220676422119, 0.44706884026527405, 0.4637156128883362, 0.4803623557090759, 0.49700912833213806]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 6.0, 5.0, 10.0, 10.0, 9.0, 17.0, 18.0, 19.0, 28.0, 23.0, 34.0, 23.0, 37.0, 35.0, 39.0, 43.0, 44.0, 49.0, 56.0, 35.0, 49.0, 32.0, 36.0, 31.0, 25.0, 42.0, 28.0, 35.0, 28.0, 21.0, 18.0, 24.0, 16.0, 16.0, 9.0, 12.0, 8.0, 9.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.09166291356086731, -0.08886117488145828, -0.08605942875146866, -0.08325769007205963, -0.08045594394207001, -0.07765420526266098, -0.07485246658325195, -0.07205072045326233, -0.0692489743232727, -0.06644723564386368, -0.06364548951387405, -0.06084375083446503, -0.0580420047044754, -0.055240266025066376, -0.05243852362036705, -0.049636781215667725, -0.0468350425362587, -0.04403330013155937, -0.041231557726860046, -0.03842981904745102, -0.035628072917461395, -0.03282633423805237, -0.030024591833353043, -0.027222849428653717, -0.02442110702395439, -0.021619364619255066, -0.01881762221455574, -0.016015881672501564, -0.013214139267802238, -0.010412396863102913, -0.007610656321048737, -0.004808913916349411, -0.0020071640610694885, 0.0007945778779685497, 0.003596319817006588, 0.006398061290383339, 0.009199803695082664, 0.01200154609978199, 0.014803286641836166, 0.017605029046535492, 0.020406771451234818, 0.023208513855934143, 0.02601025626063347, 0.028811996802687645, 0.03161373734474182, 0.034415483474731445, 0.03721722215414047, 0.0400189645588398, 0.042820706963539124, 0.04562244936823845, 0.048424191772937775, 0.0512259304523468, 0.054027676582336426, 0.05682941526174545, 0.05963115766644478, 0.062432900071144104, 0.06523464620113373, 0.06803638488054276, 0.07083813101053238, 0.0736398696899414, 0.07644161581993103, 0.07924335449934006, 0.08204509317874908, 0.08484683930873871, 0.08764857798814774]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 9.0, 16.0, 11.0, 17.0, 14.0, 32.0, 45.0, 58.0, 82.0, 111.0, 175.0, 220.0, 338.0, 423.0, 613.0, 955.0, 1351.0, 1970.0, 3126.0, 5004.0, 8105.0, 14516.0, 28272.0, 68377.0, 3930556.0, 68706.0, 27561.0, 13627.0, 7464.0, 4379.0, 2684.0, 1752.0, 1119.0, 811.0, 524.0, 318.0, 257.0, 208.0, 118.0, 101.0, 60.0, 50.0, 44.0, 33.0, 13.0, 18.0, 12.0, 4.0, 7.0, 3.0, 0.0, 3.0], "bins": [-0.1553955078125, -0.15114116668701172, -0.14688682556152344, -0.14263248443603516, -0.13837814331054688, -0.1341238021850586, -0.1298694610595703, -0.12561511993408203, -0.12136077880859375, -0.11710643768310547, -0.11285209655761719, -0.1085977554321289, -0.10434341430664062, -0.10008907318115234, -0.09583473205566406, -0.09158039093017578, -0.0873260498046875, -0.08307170867919922, -0.07881736755371094, -0.07456302642822266, -0.07030868530273438, -0.0660543441772461, -0.06180000305175781, -0.05754566192626953, -0.05329132080078125, -0.04903697967529297, -0.04478263854980469, -0.040528297424316406, -0.036273956298828125, -0.032019615173339844, -0.027765274047851562, -0.02351093292236328, -0.019256591796875, -0.015002250671386719, -0.010747909545898438, -0.006493568420410156, -0.002239227294921875, 0.0020151138305664062, 0.0062694549560546875, 0.010523796081542969, 0.01477813720703125, 0.01903247833251953, 0.023286819458007812, 0.027541160583496094, 0.031795501708984375, 0.036049842834472656, 0.04030418395996094, 0.04455852508544922, 0.0488128662109375, 0.05306720733642578, 0.05732154846191406, 0.061575889587402344, 0.06583023071289062, 0.0700845718383789, 0.07433891296386719, 0.07859325408935547, 0.08284759521484375, 0.08710193634033203, 0.09135627746582031, 0.0956106185913086, 0.09986495971679688, 0.10411930084228516, 0.10837364196777344, 0.11262798309326172, 0.11688232421875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 6.0, 8.0, 9.0, 7.0, 13.0, 16.0, 25.0, 25.0, 41.0, 32.0, 54.0, 67.0, 80.0, 91.0, 106.0, 67.0, 58.0, 65.0, 49.0, 36.0, 29.0, 26.0, 20.0, 13.0, 13.0, 8.0, 8.0, 6.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.007656097412109375, -0.00743943452835083, -0.007222771644592285, -0.00700610876083374, -0.006789445877075195, -0.00657278299331665, -0.0063561201095581055, -0.0061394572257995605, -0.005922794342041016, -0.005706131458282471, -0.005489468574523926, -0.005272805690765381, -0.005056142807006836, -0.004839479923248291, -0.004622817039489746, -0.004406154155731201, -0.004189491271972656, -0.003972828388214111, -0.0037561655044555664, -0.0035395026206970215, -0.0033228397369384766, -0.0031061768531799316, -0.0028895139694213867, -0.002672851085662842, -0.002456188201904297, -0.002239525318145752, -0.002022862434387207, -0.0018061995506286621, -0.0015895366668701172, -0.0013728737831115723, -0.0011562108993530273, -0.0009395480155944824, -0.0007228851318359375, -0.0005062222480773926, -0.00028955936431884766, -7.289648056030273e-05, 0.0001437664031982422, 0.0003604292869567871, 0.000577092170715332, 0.000793755054473877, 0.0010104179382324219, 0.0012270808219909668, 0.0014437437057495117, 0.0016604065895080566, 0.0018770694732666016, 0.0020937323570251465, 0.0023103952407836914, 0.0025270581245422363, 0.0027437210083007812, 0.002960383892059326, 0.003177046775817871, 0.003393709659576416, 0.003610372543334961, 0.003827035427093506, 0.004043698310852051, 0.004260361194610596, 0.004477024078369141, 0.0046936869621276855, 0.0049103498458862305, 0.005127012729644775, 0.00534367561340332, 0.005560338497161865, 0.00577700138092041, 0.005993664264678955, 0.0062103271484375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 3.0, 5.0, 10.0, 7.0, 13.0, 7.0, 18.0, 31.0, 41.0, 204.0, 2112.0, 198414.0, 3990244.0, 2780.0, 238.0, 48.0, 25.0, 17.0, 18.0, 12.0, 12.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31201171875, -0.3025703430175781, -0.29312896728515625, -0.2836875915527344, -0.2742462158203125, -0.2648048400878906, -0.25536346435546875, -0.24592208862304688, -0.236480712890625, -0.22703933715820312, -0.21759796142578125, -0.20815658569335938, -0.1987152099609375, -0.18927383422851562, -0.17983245849609375, -0.17039108276367188, -0.16094970703125, -0.15150833129882812, -0.14206695556640625, -0.13262557983398438, -0.1231842041015625, -0.11374282836914062, -0.10430145263671875, -0.09486007690429688, -0.085418701171875, -0.07597732543945312, -0.06653594970703125, -0.057094573974609375, -0.0476531982421875, -0.038211822509765625, -0.02877044677734375, -0.019329071044921875, -0.0098876953125, -0.000446319580078125, 0.00899505615234375, 0.018436431884765625, 0.0278778076171875, 0.037319183349609375, 0.04676055908203125, 0.056201934814453125, 0.065643310546875, 0.07508468627929688, 0.08452606201171875, 0.09396743774414062, 0.1034088134765625, 0.11285018920898438, 0.12229156494140625, 0.13173294067382812, 0.14117431640625, 0.15061569213867188, 0.16005706787109375, 0.16949844360351562, 0.1789398193359375, 0.18838119506835938, 0.19782257080078125, 0.20726394653320312, 0.216705322265625, 0.22614669799804688, 0.23558807373046875, 0.24502944946289062, 0.2544708251953125, 0.2639122009277344, 0.27335357666015625, 0.2827949523925781, 0.292236328125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 6.0, 7.0, 7.0, 13.0, 19.0, 24.0, 35.0, 47.0, 93.0, 997.0, 2550.0, 98.0, 39.0, 21.0, 21.0, 18.0, 19.0, 10.0, 5.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01788330078125, -0.017307758331298828, -0.016732215881347656, -0.016156673431396484, -0.015581130981445312, -0.01500558853149414, -0.014430046081542969, -0.013854503631591797, -0.013278961181640625, -0.012703418731689453, -0.012127876281738281, -0.01155233383178711, -0.010976791381835938, -0.010401248931884766, -0.009825706481933594, -0.009250164031982422, -0.00867462158203125, -0.008099079132080078, -0.007523536682128906, -0.006947994232177734, -0.0063724517822265625, -0.005796909332275391, -0.005221366882324219, -0.004645824432373047, -0.004070281982421875, -0.003494739532470703, -0.0029191970825195312, -0.0023436546325683594, -0.0017681121826171875, -0.0011925697326660156, -0.0006170272827148438, -4.1484832763671875e-05, 0.0005340576171875, 0.0011096000671386719, 0.0016851425170898438, 0.0022606849670410156, 0.0028362274169921875, 0.0034117698669433594, 0.003987312316894531, 0.004562854766845703, 0.005138397216796875, 0.005713939666748047, 0.006289482116699219, 0.006865024566650391, 0.0074405670166015625, 0.008016109466552734, 0.008591651916503906, 0.009167194366455078, 0.00974273681640625, 0.010318279266357422, 0.010893821716308594, 0.011469364166259766, 0.012044906616210938, 0.01262044906616211, 0.013195991516113281, 0.013771533966064453, 0.014347076416015625, 0.014922618865966797, 0.015498161315917969, 0.01607370376586914, 0.016649246215820312, 0.017224788665771484, 0.017800331115722656, 0.018375873565673828, 0.018951416015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 9.0, 19.0, 20.0, 45.0, 74.0, 147.0, 286.0, 191.0, 90.0, 38.0, 21.0, 17.0, 18.0, 1.0, 2.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07760714739561081, -0.07515301555395126, -0.07269889116287231, -0.07024475932121277, -0.06779063493013382, -0.06533650308847427, -0.06288237869739532, -0.06042824685573578, -0.05797411873936653, -0.055519990622997284, -0.053065862506628036, -0.05061173439025879, -0.04815760254859924, -0.045703478157520294, -0.04324934631586075, -0.0407952181994915, -0.03834109008312225, -0.035886961966753006, -0.03343283385038376, -0.030978703871369362, -0.028524575755000114, -0.026070447638630867, -0.02361631765961647, -0.021162189543247223, -0.018708061426877975, -0.016253933310508728, -0.013799804262816906, -0.011345675215125084, -0.008891547098755836, -0.006437418982386589, -0.003983289934694767, -0.001529160887002945, 0.0009249597787857056, 0.0033790883608162403, 0.005833216942846775, 0.008287345990538597, 0.010741474106907845, 0.013195602223277092, 0.01564973220229149, 0.018103860318660736, 0.020557988435029984, 0.02301211655139923, 0.02546624466776848, 0.027920374646782875, 0.030374502763152122, 0.03282862901687622, 0.03528276085853577, 0.037736888974905014, 0.04019101709127426, 0.04264514520764351, 0.045099273324012756, 0.047553401440382004, 0.05000752955675125, 0.0524616613984108, 0.054915789514780045, 0.05736991763114929, 0.05982404574751854, 0.06227817386388779, 0.06473230570554733, 0.06718643009662628, 0.06964056193828583, 0.07209468632936478, 0.07454881817102432, 0.07700294256210327, 0.07945707440376282]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 10.0, 10.0, 23.0, 18.0, 17.0, 27.0, 28.0, 32.0, 32.0, 37.0, 29.0, 43.0, 53.0, 55.0, 53.0, 38.0, 41.0, 40.0, 31.0, 44.0, 42.0, 45.0, 26.0, 25.0, 30.0, 28.0, 21.0, 19.0, 17.0, 5.0, 8.0, 7.0, 12.0, 2.0, 6.0, 11.0, 5.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016146419569849968, -0.01561732031404972, -0.015088221058249474, -0.014559122733771801, -0.014030023477971554, -0.013500924222171307, -0.012971825897693634, -0.012442726641893387, -0.01191362738609314, -0.011384528130292892, -0.010855428874492645, -0.010326330550014973, -0.009797231294214725, -0.009268132038414478, -0.008739033713936806, -0.008209934458136559, -0.007680835202336311, -0.007151735946536064, -0.006622637156397104, -0.006093538366258144, -0.005564439110457897, -0.00503533985465765, -0.00450624106451869, -0.00397714227437973, -0.003448043018579483, -0.0029189439956098795, -0.002389844972640276, -0.0018607459496706724, -0.0013316469267010689, -0.0008025479037314653, -0.0002734488807618618, 0.00025565014220774174, 0.000784747302532196, 0.0013138463255017996, 0.0018429453484714031, 0.0023720443714410067, 0.00290114339441061, 0.0034302424173802137, 0.003959341440349817, 0.004488440230488777, 0.005017539486289024, 0.0055466387420892715, 0.006075737532228231, 0.006604836322367191, 0.0071339355781674385, 0.007663034833967686, 0.008192133158445358, 0.008721232414245605, 0.009250331670045853, 0.0097794309258461, 0.010308530181646347, 0.01083762850612402, 0.011366727761924267, 0.011895827017724514, 0.012424925342202187, 0.012954024598002434, 0.013483123853802681, 0.014012223109602928, 0.014541322365403175, 0.015070420689880848, 0.015599519945681095, 0.016128618270158768, 0.016657717525959015, 0.017186816781759262, 0.01771591603755951]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 4.0, 9.0, 7.0, 16.0, 17.0, 27.0, 32.0, 32.0, 65.0, 102.0, 321.0, 3393.0, 791600.0, 249871.0, 2394.0, 266.0, 105.0, 59.0, 33.0, 39.0, 30.0, 25.0, 21.0, 12.0, 4.0, 17.0, 10.0, 6.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0240325927734375, -0.02339911460876465, -0.022765636444091797, -0.022132158279418945, -0.021498680114746094, -0.020865201950073242, -0.02023172378540039, -0.01959824562072754, -0.018964767456054688, -0.018331289291381836, -0.017697811126708984, -0.017064332962036133, -0.01643085479736328, -0.01579737663269043, -0.015163898468017578, -0.014530420303344727, -0.013896942138671875, -0.013263463973999023, -0.012629985809326172, -0.01199650764465332, -0.011363029479980469, -0.010729551315307617, -0.010096073150634766, -0.009462594985961914, -0.008829116821289062, -0.008195638656616211, -0.007562160491943359, -0.006928682327270508, -0.006295204162597656, -0.005661725997924805, -0.005028247833251953, -0.0043947696685791016, -0.00376129150390625, -0.0031278133392333984, -0.002494335174560547, -0.0018608570098876953, -0.0012273788452148438, -0.0005939006805419922, 3.9577484130859375e-05, 0.0006730556488037109, 0.0013065338134765625, 0.001940011978149414, 0.0025734901428222656, 0.003206968307495117, 0.0038404464721679688, 0.00447392463684082, 0.005107402801513672, 0.0057408809661865234, 0.006374359130859375, 0.0070078372955322266, 0.007641315460205078, 0.00827479362487793, 0.008908271789550781, 0.009541749954223633, 0.010175228118896484, 0.010808706283569336, 0.011442184448242188, 0.012075662612915039, 0.01270914077758789, 0.013342618942260742, 0.013976097106933594, 0.014609575271606445, 0.015243053436279297, 0.01587653160095215, 0.016510009765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 6.0, 32.0, 91.0, 211.0, 295.0, 231.0, 99.0, 33.0, 4.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0237579345703125, -0.020979642868041992, -0.018201351165771484, -0.015423059463500977, -0.012644767761230469, -0.009866476058959961, -0.007088184356689453, -0.004309892654418945, -0.0015316009521484375, 0.0012466907501220703, 0.004024982452392578, 0.006803274154663086, 0.009581565856933594, 0.012359857559204102, 0.01513814926147461, 0.017916440963745117, 0.020694732666015625, 0.023473024368286133, 0.02625131607055664, 0.02902960777282715, 0.031807899475097656, 0.034586191177368164, 0.03736448287963867, 0.04014277458190918, 0.04292106628417969, 0.045699357986450195, 0.0484776496887207, 0.05125594139099121, 0.05403423309326172, 0.05681252479553223, 0.059590816497802734, 0.06236910820007324, 0.06514739990234375, 0.06792569160461426, 0.07070398330688477, 0.07348227500915527, 0.07626056671142578, 0.07903885841369629, 0.0818171501159668, 0.0845954418182373, 0.08737373352050781, 0.09015202522277832, 0.09293031692504883, 0.09570860862731934, 0.09848690032958984, 0.10126519203186035, 0.10404348373413086, 0.10682177543640137, 0.10960006713867188, 0.11237835884094238, 0.11515665054321289, 0.1179349422454834, 0.1207132339477539, 0.12349152565002441, 0.12626981735229492, 0.12904810905456543, 0.13182640075683594, 0.13460469245910645, 0.13738298416137695, 0.14016127586364746, 0.14293956756591797, 0.14571785926818848, 0.14849615097045898, 0.1512744426727295, 0.154052734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 25.0, 36.0, 86.0, 180.0, 336.0, 1122.0, 24491.0, 1012165.0, 8721.0, 789.0, 308.0, 142.0, 78.0, 32.0, 19.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004001617431640625, -0.0038654208183288574, -0.00372922420501709, -0.0035930275917053223, -0.0034568309783935547, -0.003320634365081787, -0.0031844377517700195, -0.003048241138458252, -0.0029120445251464844, -0.002775847911834717, -0.0026396512985229492, -0.0025034546852111816, -0.002367258071899414, -0.0022310614585876465, -0.002094864845275879, -0.0019586682319641113, -0.0018224716186523438, -0.0016862750053405762, -0.0015500783920288086, -0.001413881778717041, -0.0012776851654052734, -0.0011414885520935059, -0.0010052919387817383, -0.0008690953254699707, -0.0007328987121582031, -0.0005967020988464355, -0.00046050548553466797, -0.0003243088722229004, -0.0001881122589111328, -5.1915645599365234e-05, 8.428096771240234e-05, 0.00022047758102416992, 0.0003566741943359375, 0.0004928708076477051, 0.0006290674209594727, 0.0007652640342712402, 0.0009014606475830078, 0.0010376572608947754, 0.001173853874206543, 0.0013100504875183105, 0.0014462471008300781, 0.0015824437141418457, 0.0017186403274536133, 0.0018548369407653809, 0.0019910335540771484, 0.002127230167388916, 0.0022634267807006836, 0.002399623394012451, 0.0025358200073242188, 0.0026720166206359863, 0.002808213233947754, 0.0029444098472595215, 0.003080606460571289, 0.0032168030738830566, 0.0033529996871948242, 0.003489196300506592, 0.0036253929138183594, 0.003761589527130127, 0.0038977861404418945, 0.004033982753753662, 0.00417017936706543, 0.004306375980377197, 0.004442572593688965, 0.004578769207000732, 0.0047149658203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 15.0, 17.0, 36.0, 54.0, 65.0, 113.0, 136.0, 107.0, 149.0, 109.0, 79.0, 51.0, 34.0, 21.0, 11.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10443115234375, -0.10087966918945312, -0.09732818603515625, -0.09377670288085938, -0.0902252197265625, -0.08667373657226562, -0.08312225341796875, -0.07957077026367188, -0.076019287109375, -0.07246780395507812, -0.06891632080078125, -0.06536483764648438, -0.0618133544921875, -0.058261871337890625, -0.05471038818359375, -0.051158905029296875, -0.047607421875, -0.044055938720703125, -0.04050445556640625, -0.036952972412109375, -0.0334014892578125, -0.029850006103515625, -0.02629852294921875, -0.022747039794921875, -0.019195556640625, -0.015644073486328125, -0.01209259033203125, -0.008541107177734375, -0.0049896240234375, -0.001438140869140625, 0.00211334228515625, 0.005664825439453125, 0.00921630859375, 0.012767791748046875, 0.01631927490234375, 0.019870758056640625, 0.0234222412109375, 0.026973724365234375, 0.03052520751953125, 0.034076690673828125, 0.037628173828125, 0.041179656982421875, 0.04473114013671875, 0.048282623291015625, 0.0518341064453125, 0.055385589599609375, 0.05893707275390625, 0.062488555908203125, 0.0660400390625, 0.06959152221679688, 0.07314300537109375, 0.07669448852539062, 0.0802459716796875, 0.08379745483398438, 0.08734893798828125, 0.09090042114257812, 0.094451904296875, 0.09800338745117188, 0.10155487060546875, 0.10510635375976562, 0.1086578369140625, 0.11220932006835938, 0.11576080322265625, 0.11931228637695312, 0.12286376953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 13.0, 17.0, 19.0, 30.0, 53.0, 72.0, 92.0, 154.0, 258.0, 357.0, 538.0, 886.0, 1372.0, 2615.0, 3900.0, 6728.0, 12177.0, 23293.0, 51100.0, 187261.0, 611433.0, 77560.0, 31797.0, 15780.0, 8580.0, 4745.0, 3145.0, 1678.0, 1027.0, 640.0, 405.0, 270.0, 180.0, 133.0, 79.0, 50.0, 33.0, 27.0, 15.0, 7.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.316796988248825e-05, -1.2746080756187439e-05, -1.2324191629886627e-05, -1.1902302503585815e-05, -1.1480413377285004e-05, -1.1058524250984192e-05, -1.063663512468338e-05, -1.0214745998382568e-05, -9.792856872081757e-06, -9.370967745780945e-06, -8.949078619480133e-06, -8.527189493179321e-06, -8.10530036687851e-06, -7.683411240577698e-06, -7.261522114276886e-06, -6.839632987976074e-06, -6.4177438616752625e-06, -5.995854735374451e-06, -5.573965609073639e-06, -5.152076482772827e-06, -4.730187356472015e-06, -4.308298230171204e-06, -3.886409103870392e-06, -3.46451997756958e-06, -3.0426308512687683e-06, -2.6207417249679565e-06, -2.1988525986671448e-06, -1.776963472366333e-06, -1.3550743460655212e-06, -9.331852197647095e-07, -5.112960934638977e-07, -8.940696716308594e-08, 3.3248215913772583e-07, 7.543712854385376e-07, 1.1762604117393494e-06, 1.5981495380401611e-06, 2.020038664340973e-06, 2.4419277906417847e-06, 2.8638169169425964e-06, 3.285706043243408e-06, 3.70759516954422e-06, 4.129484295845032e-06, 4.5513734221458435e-06, 4.973262548446655e-06, 5.395151674747467e-06, 5.817040801048279e-06, 6.2389299273490906e-06, 6.660819053649902e-06, 7.082708179950714e-06, 7.504597306251526e-06, 7.926486432552338e-06, 8.34837555885315e-06, 8.770264685153961e-06, 9.192153811454773e-06, 9.614042937755585e-06, 1.0035932064056396e-05, 1.0457821190357208e-05, 1.087971031665802e-05, 1.1301599442958832e-05, 1.1723488569259644e-05, 1.2145377695560455e-05, 1.2567266821861267e-05, 1.2989155948162079e-05, 1.341104507446289e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 7.0, 12.0, 9.0, 13.0, 17.0, 20.0, 25.0, 30.0, 50.0, 67.0, 98.0, 96.0, 103.0, 111.0, 82.0, 59.0, 40.0, 26.0, 22.0, 24.0, 17.0, 9.0, 11.0, 5.0, 11.0, 3.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 6.0, 8.0, 5.0, 15.0, 25.0, 36.0, 71.0, 76.0, 149.0, 265.0, 403.0, 785.0, 1643.0, 3052.0, 7671.0, 21364.0, 73482.0, 810380.0, 93173.0, 20371.0, 8475.0, 3548.0, 1508.0, 906.0, 498.0, 255.0, 130.0, 99.0, 46.0, 39.0, 17.0, 13.0, 17.0, 10.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990795135498047e-05, -1.9331462681293488e-05, -1.8754974007606506e-05, -1.8178485333919525e-05, -1.7601996660232544e-05, -1.7025507986545563e-05, -1.644901931285858e-05, -1.58725306391716e-05, -1.529604196548462e-05, -1.4719553291797638e-05, -1.4143064618110657e-05, -1.3566575944423676e-05, -1.2990087270736694e-05, -1.2413598597049713e-05, -1.1837109923362732e-05, -1.126062124967575e-05, -1.068413257598877e-05, -1.0107643902301788e-05, -9.531155228614807e-06, -8.954666554927826e-06, -8.378177881240845e-06, -7.801689207553864e-06, -7.225200533866882e-06, -6.648711860179901e-06, -6.07222318649292e-06, -5.495734512805939e-06, -4.9192458391189575e-06, -4.342757165431976e-06, -3.766268491744995e-06, -3.189779818058014e-06, -2.6132911443710327e-06, -2.0368024706840515e-06, -1.4603137969970703e-06, -8.838251233100891e-07, -3.073364496231079e-07, 2.691522240638733e-07, 8.456408977508545e-07, 1.4221295714378357e-06, 1.998618245124817e-06, 2.575106918811798e-06, 3.1515955924987793e-06, 3.7280842661857605e-06, 4.304572939872742e-06, 4.881061613559723e-06, 5.457550287246704e-06, 6.034038960933685e-06, 6.6105276346206665e-06, 7.187016308307648e-06, 7.763504981994629e-06, 8.33999365568161e-06, 8.916482329368591e-06, 9.492971003055573e-06, 1.0069459676742554e-05, 1.0645948350429535e-05, 1.1222437024116516e-05, 1.1798925697803497e-05, 1.2375414371490479e-05, 1.295190304517746e-05, 1.3528391718864441e-05, 1.4104880392551422e-05, 1.4681369066238403e-05, 1.5257857739925385e-05, 1.5834346413612366e-05, 1.6410835087299347e-05, 1.6987323760986328e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 1.0, 8.0, 7.0, 9.0, 7.0, 18.0, 16.0, 26.0, 25.0, 34.0, 56.0, 75.0, 141.0, 232.0, 76.0, 33.0, 64.0, 31.0, 31.0, 15.0, 23.0, 8.0, 9.0, 11.0, 12.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4570693969726562e-06, -3.339722752571106e-06, -3.2223761081695557e-06, -3.1050294637680054e-06, -2.987682819366455e-06, -2.8703361749649048e-06, -2.7529895305633545e-06, -2.635642886161804e-06, -2.518296241760254e-06, -2.4009495973587036e-06, -2.2836029529571533e-06, -2.166256308555603e-06, -2.0489096641540527e-06, -1.9315630197525024e-06, -1.8142163753509521e-06, -1.6968697309494019e-06, -1.5795230865478516e-06, -1.4621764421463013e-06, -1.344829797744751e-06, -1.2274831533432007e-06, -1.1101365089416504e-06, -9.927898645401e-07, -8.754432201385498e-07, -7.580965757369995e-07, -6.407499313354492e-07, -5.234032869338989e-07, -4.0605664253234863e-07, -2.8870999813079834e-07, -1.7136335372924805e-07, -5.4016709327697754e-08, 6.332993507385254e-08, 1.8067657947540283e-07, 2.980232238769531e-07, 4.153698682785034e-07, 5.327165126800537e-07, 6.50063157081604e-07, 7.674098014831543e-07, 8.847564458847046e-07, 1.0021030902862549e-06, 1.1194497346878052e-06, 1.2367963790893555e-06, 1.3541430234909058e-06, 1.471489667892456e-06, 1.5888363122940063e-06, 1.7061829566955566e-06, 1.823529601097107e-06, 1.9408762454986572e-06, 2.0582228899002075e-06, 2.175569534301758e-06, 2.292916178703308e-06, 2.4102628231048584e-06, 2.5276094675064087e-06, 2.644956111907959e-06, 2.7623027563095093e-06, 2.8796494007110596e-06, 2.99699604511261e-06, 3.11434268951416e-06, 3.2316893339157104e-06, 3.3490359783172607e-06, 3.466382622718811e-06, 3.5837292671203613e-06, 3.7010759115219116e-06, 3.818422555923462e-06, 3.935769200325012e-06, 4.0531158447265625e-06]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 21.0, 34.0, 132.0, 511.0, 199.0, 50.0, 25.0, 8.0, 12.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11132108420133591, -0.10858423262834549, -0.10584738105535507, -0.10311053693294525, -0.10037368535995483, -0.09763683378696442, -0.094899982213974, -0.09216313064098358, -0.08942627906799316, -0.08668942749500275, -0.08395257592201233, -0.08121572434902191, -0.07847888022661209, -0.07574202865362167, -0.07300517708063126, -0.07026832550764084, -0.06753148138523102, -0.0647946298122406, -0.06205778196454048, -0.059320930391550064, -0.056584082543849945, -0.05384723097085953, -0.05111037939786911, -0.04837352782487869, -0.045636679977178574, -0.042899828404188156, -0.04016298055648804, -0.03742612898349762, -0.0346892774105072, -0.03195242956280708, -0.029215577989816666, -0.026478728279471397, -0.023741871118545532, -0.021005021408200264, -0.018268171697854996, -0.015531320124864578, -0.01279447041451931, -0.010057620704174042, -0.007320769131183624, -0.004583919420838356, -0.0018470697104930878, 0.0008897804655134678, 0.0036266306415200233, 0.006363481283187866, 0.009100330993533134, 0.011837180703878403, 0.01457403227686882, 0.01731088198721409, 0.020047731697559357, 0.022784581407904625, 0.025521431118249893, 0.02825828269124031, 0.03099513240158558, 0.03373198211193085, 0.036468833684921265, 0.03920568525791168, 0.0419425331056118, 0.04467938467860222, 0.04741623252630234, 0.050153084099292755, 0.05288993567228317, 0.05562678351998329, 0.05836363509297371, 0.06110048294067383, 0.06383733451366425]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 11.0, 21.0, 18.0, 43.0, 79.0, 102.0, 118.0, 155.0, 111.0, 125.0, 83.0, 59.0, 39.0, 23.0, 17.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009400900453329086, -0.008539849892258644, -0.007678799331188202, -0.00681774877011776, -0.0059566982090473175, -0.005095647182315588, -0.004234596621245146, -0.0033735460601747036, -0.0025124954991042614, -0.0016514449380338192, -0.0007903942605480552, 7.065641693770885e-05, 0.0009317069780081511, 0.001792757771909237, 0.002653808332979679, 0.0035148588940501213, 0.0043759094551205635, 0.005236960016191006, 0.006098010577261448, 0.00695906113833189, 0.007820111699402332, 0.008681163191795349, 0.009542213752865791, 0.010403264313936234, 0.011264314875006676, 0.012125365436077118, 0.01298641599714756, 0.013847466558218002, 0.014708517119288445, 0.015569567680358887, 0.01643061824142933, 0.01729166880249977, 0.018152719363570213, 0.019013769924640656, 0.019874820485711098, 0.02073587104678154, 0.021596921607851982, 0.022457972168922424, 0.023319022729992867, 0.02418007329106331, 0.02504112385213375, 0.025902174413204193, 0.026763224974274635, 0.027624275535345078, 0.02848532609641552, 0.029346376657485962, 0.030207427218556404, 0.031068477779626846, 0.03192953020334244, 0.03279058262705803, 0.03365163132548332, 0.034512683749198914, 0.03537373244762421, 0.0362347848713398, 0.03709583356976509, 0.03795688599348068, 0.038817934691905975, 0.03967898711562157, 0.04054003581404686, 0.04140108823776245, 0.042262136936187744, 0.043123189359903336, 0.04398423805832863, 0.04484529048204422, 0.04570633918046951]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 15.0, 13.0, 13.0, 23.0, 18.0, 19.0, 24.0, 32.0, 35.0, 38.0, 52.0, 137.0, 15497.0, 1027444.0, 4759.0, 88.0, 38.0, 48.0, 46.0, 33.0, 39.0, 20.0, 20.0, 18.0, 13.0, 14.0, 5.0, 9.0, 2.0, 8.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.120849609375, -0.11673927307128906, -0.11262893676757812, -0.10851860046386719, -0.10440826416015625, -0.10029792785644531, -0.09618759155273438, -0.09207725524902344, -0.0879669189453125, -0.08385658264160156, -0.07974624633789062, -0.07563591003417969, -0.07152557373046875, -0.06741523742675781, -0.06330490112304688, -0.05919456481933594, -0.055084228515625, -0.05097389221191406, -0.046863555908203125, -0.04275321960449219, -0.03864288330078125, -0.03453254699707031, -0.030422210693359375, -0.026311874389648438, -0.0222015380859375, -0.018091201782226562, -0.013980865478515625, -0.009870529174804688, -0.00576019287109375, -0.0016498565673828125, 0.002460479736328125, 0.0065708160400390625, 0.01068115234375, 0.014791488647460938, 0.018901824951171875, 0.023012161254882812, 0.02712249755859375, 0.031232833862304688, 0.035343170166015625, 0.03945350646972656, 0.0435638427734375, 0.04767417907714844, 0.051784515380859375, 0.05589485168457031, 0.06000518798828125, 0.06411552429199219, 0.06822586059570312, 0.07233619689941406, 0.076446533203125, 0.08055686950683594, 0.08466720581054688, 0.08877754211425781, 0.09288787841796875, 0.09699821472167969, 0.10110855102539062, 0.10521888732910156, 0.1093292236328125, 0.11343955993652344, 0.11754989624023438, 0.12166023254394531, 0.12577056884765625, 0.1298809051513672, 0.13399124145507812, 0.13810157775878906, 0.1422119140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [6.0, 26.0, 132.0, 359.0, 344.0, 121.0, 28.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010957717895507812, -0.0008264034986495972, -0.0005570352077484131, -0.000287666916847229, -1.8298625946044922e-05, 0.00025106966495513916, 0.0005204379558563232, 0.0007898062467575073, 0.0010591745376586914, 0.0013285428285598755, 0.0015979111194610596, 0.0018672794103622437, 0.0021366477012634277, 0.002406015992164612, 0.002675384283065796, 0.00294475257396698, 0.003214120864868164, 0.003483489155769348, 0.0037528574466705322, 0.004022225737571716, 0.0042915940284729, 0.0045609623193740845, 0.0048303306102752686, 0.005099698901176453, 0.005369067192077637, 0.005638435482978821, 0.005907803773880005, 0.006177172064781189, 0.006446540355682373, 0.006715908646583557, 0.006985276937484741, 0.007254645228385925, 0.007524013519287109, 0.0077933818101882935, 0.008062750101089478, 0.008332118391990662, 0.008601486682891846, 0.00887085497379303, 0.009140223264694214, 0.009409591555595398, 0.009678959846496582, 0.009948328137397766, 0.01021769642829895, 0.010487064719200134, 0.010756433010101318, 0.011025801301002502, 0.011295169591903687, 0.01156453788280487, 0.011833906173706055, 0.012103274464607239, 0.012372642755508423, 0.012642011046409607, 0.012911379337310791, 0.013180747628211975, 0.01345011591911316, 0.013719484210014343, 0.013988852500915527, 0.014258220791816711, 0.014527589082717896, 0.01479695737361908, 0.015066325664520264, 0.015335693955421448, 0.015605062246322632, 0.015874430537223816, 0.016143798828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 3.0, 6.0, 7.0, 10.0, 10.0, 13.0, 32.0, 30.0, 44.0, 50.0, 84.0, 131.0, 178.0, 251.0, 352.0, 541.0, 870.0, 1347.0, 2005.0, 3322.0, 5529.0, 9540.0, 17114.0, 32223.0, 66600.0, 170290.0, 455965.0, 151236.0, 61709.0, 29706.0, 16088.0, 8888.0, 5333.0, 3182.0, 2037.0, 1307.0, 793.0, 557.0, 391.0, 241.0, 181.0, 109.0, 73.0, 57.0, 40.0, 25.0, 14.0, 14.0, 17.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.0052490234375, -0.00508725643157959, -0.00492548942565918, -0.0047637224197387695, -0.004601955413818359, -0.004440188407897949, -0.004278421401977539, -0.004116654396057129, -0.003954887390136719, -0.0037931203842163086, -0.0036313533782958984, -0.0034695863723754883, -0.003307819366455078, -0.003146052360534668, -0.002984285354614258, -0.0028225183486938477, -0.0026607513427734375, -0.0024989843368530273, -0.002337217330932617, -0.002175450325012207, -0.002013683319091797, -0.0018519163131713867, -0.0016901493072509766, -0.0015283823013305664, -0.0013666152954101562, -0.001204848289489746, -0.001043081283569336, -0.0008813142776489258, -0.0007195472717285156, -0.0005577802658081055, -0.0003960132598876953, -0.00023424625396728516, -7.2479248046875e-05, 8.928775787353516e-05, 0.0002510547637939453, 0.00041282176971435547, 0.0005745887756347656, 0.0007363557815551758, 0.0008981227874755859, 0.001059889793395996, 0.0012216567993164062, 0.0013834238052368164, 0.0015451908111572266, 0.0017069578170776367, 0.0018687248229980469, 0.002030491828918457, 0.002192258834838867, 0.0023540258407592773, 0.0025157928466796875, 0.0026775598526000977, 0.002839326858520508, 0.003001093864440918, 0.003162860870361328, 0.0033246278762817383, 0.0034863948822021484, 0.0036481618881225586, 0.0038099288940429688, 0.003971695899963379, 0.004133462905883789, 0.004295229911804199, 0.004456996917724609, 0.0046187639236450195, 0.00478053092956543, 0.00494229793548584, 0.00510406494140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 3.0, 5.0, 1.0, 11.0, 6.0, 19.0, 15.0, 27.0, 25.0, 31.0, 32.0, 40.0, 45.0, 63.0, 65.0, 76.0, 75.0, 69.0, 56.0, 54.0, 36.0, 40.0, 39.0, 35.0, 34.0, 13.0, 24.0, 15.0, 13.0, 5.0, 4.0, 8.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036468505859375, -0.003534287214279175, -0.0034217238426208496, -0.0033091604709625244, -0.0031965970993041992, -0.003084033727645874, -0.002971470355987549, -0.0028589069843292236, -0.0027463436126708984, -0.0026337802410125732, -0.002521216869354248, -0.002408653497695923, -0.0022960901260375977, -0.0021835267543792725, -0.0020709633827209473, -0.001958400011062622, -0.0018458366394042969, -0.0017332732677459717, -0.0016207098960876465, -0.0015081465244293213, -0.001395583152770996, -0.001283019781112671, -0.0011704564094543457, -0.0010578930377960205, -0.0009453296661376953, -0.0008327662944793701, -0.0007202029228210449, -0.0006076395511627197, -0.0004950761795043945, -0.00038251280784606934, -0.00026994943618774414, -0.00015738606452941895, -4.482269287109375e-05, 6.774067878723145e-05, 0.00018030405044555664, 0.00029286742210388184, 0.00040543079376220703, 0.0005179941654205322, 0.0006305575370788574, 0.0007431209087371826, 0.0008556842803955078, 0.000968247652053833, 0.0010808110237121582, 0.0011933743953704834, 0.0013059377670288086, 0.0014185011386871338, 0.001531064510345459, 0.0016436278820037842, 0.0017561912536621094, 0.0018687546253204346, 0.0019813179969787598, 0.002093881368637085, 0.00220644474029541, 0.0023190081119537354, 0.0024315714836120605, 0.0025441348552703857, 0.002656698226928711, 0.002769261598587036, 0.0028818249702453613, 0.0029943883419036865, 0.0031069517135620117, 0.003219515085220337, 0.003332078456878662, 0.0034446418285369873, 0.0035572052001953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 18.0, 11.0, 23.0, 26.0, 28.0, 51.0, 50.0, 64.0, 85.0, 125.0, 153.0, 229.0, 314.0, 453.0, 643.0, 1125.0, 2356.0, 6917.0, 45218.0, 964621.0, 17149.0, 4269.0, 1723.0, 919.0, 552.0, 370.0, 247.0, 205.0, 128.0, 121.0, 72.0, 54.0, 47.0, 40.0, 30.0, 29.0, 16.0, 14.0, 13.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.038116455078125, -0.03689861297607422, -0.03568077087402344, -0.034462928771972656, -0.033245086669921875, -0.032027244567871094, -0.030809402465820312, -0.02959156036376953, -0.02837371826171875, -0.02715587615966797, -0.025938034057617188, -0.024720191955566406, -0.023502349853515625, -0.022284507751464844, -0.021066665649414062, -0.01984882354736328, -0.0186309814453125, -0.01741313934326172, -0.016195297241210938, -0.014977455139160156, -0.013759613037109375, -0.012541770935058594, -0.011323928833007812, -0.010106086730957031, -0.00888824462890625, -0.007670402526855469, -0.0064525604248046875, -0.005234718322753906, -0.004016876220703125, -0.0027990341186523438, -0.0015811920166015625, -0.00036334991455078125, 0.0008544921875, 0.0020723342895507812, 0.0032901763916015625, 0.004508018493652344, 0.005725860595703125, 0.006943702697753906, 0.008161544799804688, 0.009379386901855469, 0.01059722900390625, 0.011815071105957031, 0.013032913208007812, 0.014250755310058594, 0.015468597412109375, 0.016686439514160156, 0.017904281616210938, 0.01912212371826172, 0.0203399658203125, 0.02155780792236328, 0.022775650024414062, 0.023993492126464844, 0.025211334228515625, 0.026429176330566406, 0.027647018432617188, 0.02886486053466797, 0.03008270263671875, 0.03130054473876953, 0.03251838684082031, 0.033736228942871094, 0.034954071044921875, 0.036171913146972656, 0.03738975524902344, 0.03860759735107422, 0.039825439453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 4.0, 8.0, 16.0, 31.0, 81.0, 620.0, 149.0, 34.0, 15.0, 7.0, 5.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.233816146850586e-05, -1.1934898793697357e-05, -1.1531636118888855e-05, -1.1128373444080353e-05, -1.072511076927185e-05, -1.0321848094463348e-05, -9.918585419654846e-06, -9.515322744846344e-06, -9.112060070037842e-06, -8.70879739522934e-06, -8.305534720420837e-06, -7.902272045612335e-06, -7.499009370803833e-06, -7.095746695995331e-06, -6.692484021186829e-06, -6.289221346378326e-06, -5.885958671569824e-06, -5.482695996761322e-06, -5.07943332195282e-06, -4.676170647144318e-06, -4.2729079723358154e-06, -3.869645297527313e-06, -3.466382622718811e-06, -3.063119947910309e-06, -2.6598572731018066e-06, -2.2565945982933044e-06, -1.8533319234848022e-06, -1.4500692486763e-06, -1.0468065738677979e-06, -6.435438990592957e-07, -2.4028122425079346e-07, 1.6298145055770874e-07, 5.662441253662109e-07, 9.695068001747131e-07, 1.3727694749832153e-06, 1.7760321497917175e-06, 2.1792948246002197e-06, 2.582557499408722e-06, 2.985820174217224e-06, 3.3890828490257263e-06, 3.7923455238342285e-06, 4.195608198642731e-06, 4.598870873451233e-06, 5.002133548259735e-06, 5.405396223068237e-06, 5.8086588978767395e-06, 6.211921572685242e-06, 6.615184247493744e-06, 7.018446922302246e-06, 7.421709597110748e-06, 7.82497227191925e-06, 8.228234946727753e-06, 8.631497621536255e-06, 9.034760296344757e-06, 9.43802297115326e-06, 9.841285645961761e-06, 1.0244548320770264e-05, 1.0647810995578766e-05, 1.1051073670387268e-05, 1.145433634519577e-05, 1.1857599020004272e-05, 1.2260861694812775e-05, 1.2664124369621277e-05, 1.3067387044429779e-05, 1.3470649719238281e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 6.0, 5.0, 10.0, 18.0, 26.0, 36.0, 35.0, 41.0, 58.0, 78.0, 114.0, 161.0, 173.0, 278.0, 379.0, 515.0, 726.0, 994.0, 1570.0, 2535.0, 4636.0, 11104.0, 45467.0, 910771.0, 45187.0, 11350.0, 4644.0, 2526.0, 1501.0, 971.0, 730.0, 461.0, 368.0, 265.0, 212.0, 125.0, 110.0, 90.0, 62.0, 56.0, 43.0, 22.0, 16.0, 21.0, 14.0, 16.0, 10.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.009674072265625, -0.0093461275100708, -0.009018182754516602, -0.008690237998962402, -0.008362293243408203, -0.008034348487854004, -0.007706403732299805, -0.0073784589767456055, -0.007050514221191406, -0.006722569465637207, -0.006394624710083008, -0.006066679954528809, -0.005738735198974609, -0.00541079044342041, -0.005082845687866211, -0.004754900932312012, -0.0044269561767578125, -0.004099011421203613, -0.003771066665649414, -0.003443121910095215, -0.0031151771545410156, -0.0027872323989868164, -0.002459287643432617, -0.002131342887878418, -0.0018033981323242188, -0.0014754533767700195, -0.0011475086212158203, -0.0008195638656616211, -0.0004916191101074219, -0.00016367435455322266, 0.00016427040100097656, 0.0004922151565551758, 0.000820159912109375, 0.0011481046676635742, 0.0014760494232177734, 0.0018039941787719727, 0.002131938934326172, 0.002459883689880371, 0.0027878284454345703, 0.0031157732009887695, 0.0034437179565429688, 0.003771662712097168, 0.004099607467651367, 0.004427552223205566, 0.004755496978759766, 0.005083441734313965, 0.005411386489868164, 0.005739331245422363, 0.0060672760009765625, 0.006395220756530762, 0.006723165512084961, 0.00705111026763916, 0.007379055023193359, 0.007706999778747559, 0.008034944534301758, 0.008362889289855957, 0.008690834045410156, 0.009018778800964355, 0.009346723556518555, 0.009674668312072754, 0.010002613067626953, 0.010330557823181152, 0.010658502578735352, 0.01098644733428955, 0.01131439208984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 4.0, 5.0, 4.0, 11.0, 8.0, 19.0, 25.0, 42.0, 253.0, 459.0, 68.0, 41.0, 23.0, 8.0, 9.0, 4.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0060272216796875, -0.005813121795654297, -0.005599021911621094, -0.005384922027587891, -0.0051708221435546875, -0.004956722259521484, -0.004742622375488281, -0.004528522491455078, -0.004314422607421875, -0.004100322723388672, -0.0038862228393554688, -0.0036721229553222656, -0.0034580230712890625, -0.0032439231872558594, -0.0030298233032226562, -0.002815723419189453, -0.00260162353515625, -0.002387523651123047, -0.0021734237670898438, -0.0019593238830566406, -0.0017452239990234375, -0.0015311241149902344, -0.0013170242309570312, -0.0011029243469238281, -0.000888824462890625, -0.0006747245788574219, -0.00046062469482421875, -0.0002465248107910156, -3.24249267578125e-05, 0.00018167495727539062, 0.00039577484130859375, 0.0006098747253417969, 0.000823974609375, 0.0010380744934082031, 0.0012521743774414062, 0.0014662742614746094, 0.0016803741455078125, 0.0018944740295410156, 0.0021085739135742188, 0.002322673797607422, 0.002536773681640625, 0.002750873565673828, 0.0029649734497070312, 0.0031790733337402344, 0.0033931732177734375, 0.0036072731018066406, 0.0038213729858398438, 0.004035472869873047, 0.00424957275390625, 0.004463672637939453, 0.004677772521972656, 0.004891872406005859, 0.0051059722900390625, 0.005320072174072266, 0.005534172058105469, 0.005748271942138672, 0.005962371826171875, 0.006176471710205078, 0.006390571594238281, 0.006604671478271484, 0.0068187713623046875, 0.007032871246337891, 0.007246971130371094, 0.007461071014404297, 0.0076751708984375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 9.0, 10.0, 6.0, 14.0, 29.0, 35.0, 40.0, 100.0, 178.0, 225.0, 155.0, 70.0, 49.0, 19.0, 16.0, 13.0, 9.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06038687378168106, -0.05856429785490036, -0.05674172192811966, -0.05491914600133896, -0.053096573799848557, -0.051273997873067856, -0.049451421946287155, -0.047628846019506454, -0.04580627381801605, -0.04398369789123535, -0.04216112196445465, -0.04033854603767395, -0.03851597383618355, -0.03669339790940285, -0.03487082198262215, -0.033048246055841446, -0.031225670129060745, -0.029403094202280045, -0.027580520138144493, -0.025757944211363792, -0.02393537014722824, -0.02211279422044754, -0.02029021829366684, -0.01846764236688614, -0.016645068302750587, -0.014822493307292461, -0.012999918311834335, -0.011177342385053635, -0.009354767389595509, -0.0075321923941373825, -0.005709616467356682, -0.0038870414718985558, -0.0020644664764404297, -0.00024189124815165997, 0.0015806839801371098, 0.003403259441256523, 0.005225834436714649, 0.007048409432172775, 0.008870985358953476, 0.010693560354411602, 0.012516135349869728, 0.014338710345327854, 0.01616128534078598, 0.01798386126756668, 0.01980643719434738, 0.021629011258482933, 0.023451587185263634, 0.025274161249399185, 0.027096737176179886, 0.028919313102960587, 0.030741887167096138, 0.03256446123123169, 0.03438703715801239, 0.03620961308479309, 0.03803218901157379, 0.03985476493835449, 0.04167734086513519, 0.043499916791915894, 0.045322492718696594, 0.047145068645477295, 0.0489676408469677, 0.0507902167737484, 0.0526127927005291, 0.0544353686273098, 0.0562579408288002]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 2.0, 6.0, 7.0, 12.0, 11.0, 13.0, 15.0, 16.0, 21.0, 25.0, 34.0, 28.0, 38.0, 47.0, 42.0, 42.0, 45.0, 46.0, 48.0, 39.0, 42.0, 38.0, 43.0, 33.0, 34.0, 39.0, 23.0, 35.0, 26.0, 25.0, 16.0, 16.0, 20.0, 13.0, 10.0, 7.0, 8.0, 4.0, 5.0, 5.0, 5.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007344689220190048, -0.007059444207698107, -0.006774199195206165, -0.0064889537170529366, -0.006203708704560995, -0.005918463692069054, -0.005633218213915825, -0.0053479732014238834, -0.005062728188931942, -0.0047774831764400005, -0.004492238163948059, -0.00420699268579483, -0.003921747673302889, -0.0036365026608109474, -0.0033512574154883623, -0.003066012170165777, -0.0027807671576738358, -0.0024955221451818943, -0.002210276899859309, -0.001925031770952046, -0.0016397866420447826, -0.0013545415131375194, -0.001069296384230256, -0.000784051138907671, -0.0004988061264157295, -0.00021356099750846624, 7.168413139879704e-05, 0.0003569292603060603, 0.0006421743892133236, 0.0009274195181205869, 0.0012126646470278502, 0.0014979098923504353, 0.0017831549048423767, 0.002068399917334318, 0.0023536451626569033, 0.0026388904079794884, 0.00292413542047143, 0.0032093804329633713, 0.0034946256782859564, 0.0037798709236085415, 0.004065115936100483, 0.004350360948592424, 0.004635605961084366, 0.004920851439237595, 0.005206096451729536, 0.0054913414642214775, 0.005776586942374706, 0.006061831954866648, 0.006347076967358589, 0.006632321979850531, 0.006917566992342472, 0.007202812470495701, 0.007488057482987642, 0.007773302495479584, 0.008058547973632812, 0.008343793451786041, 0.008629037998616695, 0.008914283476769924, 0.009199528023600578, 0.009484773501753807, 0.009770018979907036, 0.01005526352673769, 0.010340509004890919, 0.010625753551721573, 0.010910999029874802]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 10.0, 14.0, 15.0, 24.0, 36.0, 35.0, 45.0, 86.0, 124.0, 177.0, 266.0, 377.0, 627.0, 1017.0, 1817.0, 3684.0, 8444.0, 26860.0, 4086077.0, 42114.0, 11829.0, 4832.0, 2406.0, 1236.0, 740.0, 459.0, 281.0, 199.0, 146.0, 97.0, 59.0, 45.0, 29.0, 21.0, 12.0, 16.0, 5.0, 9.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0498046875, -0.0483245849609375, -0.046844482421875, -0.0453643798828125, -0.04388427734375, -0.0424041748046875, -0.040924072265625, -0.0394439697265625, -0.0379638671875, -0.0364837646484375, -0.035003662109375, -0.0335235595703125, -0.03204345703125, -0.0305633544921875, -0.029083251953125, -0.0276031494140625, -0.026123046875, -0.0246429443359375, -0.023162841796875, -0.0216827392578125, -0.02020263671875, -0.0187225341796875, -0.017242431640625, -0.0157623291015625, -0.0142822265625, -0.0128021240234375, -0.011322021484375, -0.0098419189453125, -0.00836181640625, -0.0068817138671875, -0.005401611328125, -0.0039215087890625, -0.00244140625, -0.0009613037109375, 0.000518798828125, 0.0019989013671875, 0.00347900390625, 0.0049591064453125, 0.006439208984375, 0.0079193115234375, 0.0093994140625, 0.0108795166015625, 0.012359619140625, 0.0138397216796875, 0.01531982421875, 0.0167999267578125, 0.018280029296875, 0.0197601318359375, 0.021240234375, 0.0227203369140625, 0.024200439453125, 0.0256805419921875, 0.02716064453125, 0.0286407470703125, 0.030120849609375, 0.0316009521484375, 0.0330810546875, 0.0345611572265625, 0.036041259765625, 0.0375213623046875, 0.03900146484375, 0.0404815673828125, 0.041961669921875, 0.0434417724609375, 0.044921875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 9.0, 8.0, 7.0, 9.0, 14.0, 18.0, 23.0, 42.0, 62.0, 93.0, 122.0, 139.0, 117.0, 86.0, 57.0, 39.0, 36.0, 23.0, 21.0, 14.0, 10.0, 10.0, 4.0, 7.0, 4.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002803802490234375, -0.002717941999435425, -0.0026320815086364746, -0.0025462210178375244, -0.0024603605270385742, -0.002374500036239624, -0.002288639545440674, -0.0022027790546417236, -0.0021169185638427734, -0.0020310580730438232, -0.001945197582244873, -0.0018593370914459229, -0.0017734766006469727, -0.0016876161098480225, -0.0016017556190490723, -0.001515895128250122, -0.0014300346374511719, -0.0013441741466522217, -0.0012583136558532715, -0.0011724531650543213, -0.001086592674255371, -0.001000732183456421, -0.0009148716926574707, -0.0008290112018585205, -0.0007431507110595703, -0.0006572902202606201, -0.0005714297294616699, -0.0004855692386627197, -0.00039970874786376953, -0.00031384825706481934, -0.00022798776626586914, -0.00014212727546691895, -5.626678466796875e-05, 2.9593706130981445e-05, 0.00011545419692993164, 0.00020131468772888184, 0.00028717517852783203, 0.0003730356693267822, 0.0004588961601257324, 0.0005447566509246826, 0.0006306171417236328, 0.000716477632522583, 0.0008023381233215332, 0.0008881986141204834, 0.0009740591049194336, 0.0010599195957183838, 0.001145780086517334, 0.0012316405773162842, 0.0013175010681152344, 0.0014033615589141846, 0.0014892220497131348, 0.001575082540512085, 0.0016609430313110352, 0.0017468035221099854, 0.0018326640129089355, 0.0019185245037078857, 0.002004384994506836, 0.002090245485305786, 0.0021761059761047363, 0.0022619664669036865, 0.0023478269577026367, 0.002433687448501587, 0.002519547939300537, 0.0026054084300994873, 0.0026912689208984375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 6.0, 7.0, 3.0, 22.0, 29.0, 48.0, 72.0, 123.0, 213.0, 324.0, 650.0, 1291.0, 2890.0, 8589.0, 39111.0, 4088905.0, 38056.0, 8338.0, 2893.0, 1227.0, 684.0, 329.0, 199.0, 101.0, 58.0, 45.0, 21.0, 11.0, 5.0, 13.0, 8.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0183868408203125, -0.01763606071472168, -0.01688528060913086, -0.01613450050354004, -0.015383720397949219, -0.014632940292358398, -0.013882160186767578, -0.013131380081176758, -0.012380599975585938, -0.011629819869995117, -0.010879039764404297, -0.010128259658813477, -0.009377479553222656, -0.008626699447631836, -0.007875919342041016, -0.007125139236450195, -0.006374359130859375, -0.005623579025268555, -0.004872798919677734, -0.004122018814086914, -0.0033712387084960938, -0.0026204586029052734, -0.0018696784973144531, -0.0011188983917236328, -0.0003681182861328125, 0.0003826618194580078, 0.0011334419250488281, 0.0018842220306396484, 0.0026350021362304688, 0.003385782241821289, 0.004136562347412109, 0.00488734245300293, 0.00563812255859375, 0.00638890266418457, 0.007139682769775391, 0.007890462875366211, 0.008641242980957031, 0.009392023086547852, 0.010142803192138672, 0.010893583297729492, 0.011644363403320312, 0.012395143508911133, 0.013145923614501953, 0.013896703720092773, 0.014647483825683594, 0.015398263931274414, 0.016149044036865234, 0.016899824142456055, 0.017650604248046875, 0.018401384353637695, 0.019152164459228516, 0.019902944564819336, 0.020653724670410156, 0.021404504776000977, 0.022155284881591797, 0.022906064987182617, 0.023656845092773438, 0.024407625198364258, 0.025158405303955078, 0.0259091854095459, 0.02665996551513672, 0.02741074562072754, 0.02816152572631836, 0.02891230583190918, 0.0296630859375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 14.0, 20.0, 31.0, 105.0, 2110.0, 1611.0, 78.0, 23.0, 16.0, 10.0, 11.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00450897216796875, -0.004335522651672363, -0.0041620731353759766, -0.00398862361907959, -0.003815174102783203, -0.0036417245864868164, -0.0034682750701904297, -0.003294825553894043, -0.0031213760375976562, -0.0029479265213012695, -0.002774477005004883, -0.002601027488708496, -0.0024275779724121094, -0.0022541284561157227, -0.002080678939819336, -0.0019072294235229492, -0.0017337799072265625, -0.0015603303909301758, -0.001386880874633789, -0.0012134313583374023, -0.0010399818420410156, -0.0008665323257446289, -0.0006930828094482422, -0.0005196332931518555, -0.00034618377685546875, -0.00017273426055908203, 7.152557373046875e-07, 0.0001741647720336914, 0.0003476142883300781, 0.0005210638046264648, 0.0006945133209228516, 0.0008679628372192383, 0.001041412353515625, 0.0012148618698120117, 0.0013883113861083984, 0.0015617609024047852, 0.0017352104187011719, 0.0019086599349975586, 0.0020821094512939453, 0.002255558967590332, 0.0024290084838867188, 0.0026024580001831055, 0.002775907516479492, 0.002949357032775879, 0.0031228065490722656, 0.0032962560653686523, 0.003469705581665039, 0.0036431550979614258, 0.0038166046142578125, 0.003990054130554199, 0.004163503646850586, 0.004336953163146973, 0.004510402679443359, 0.004683852195739746, 0.004857301712036133, 0.0050307512283325195, 0.005204200744628906, 0.005377650260925293, 0.00555109977722168, 0.005724549293518066, 0.005897998809814453, 0.00607144832611084, 0.0062448978424072266, 0.006418347358703613, 0.006591796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 6.0, 19.0, 10.0, 27.0, 62.0, 124.0, 261.0, 254.0, 120.0, 54.0, 34.0, 11.0, 10.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006153257098048925, -0.0055395811796188354, -0.004925905726850033, -0.004312229808419943, -0.003698553889989853, -0.003084877971559763, -0.0024712022859603167, -0.0018575266003608704, -0.0012438506819307804, -0.0006301748799160123, -1.6499077901244164e-05, 0.000597176724113524, 0.001210852526128292, 0.001824528444558382, 0.0024382041301578283, 0.0030518798157572746, 0.0036655557341873646, 0.0042792316526174545, 0.004892907105386257, 0.005506583023816347, 0.006120258942246437, 0.006733934860676527, 0.007347610779106617, 0.00796128623187542, 0.008574962615966797, 0.0091886380687356, 0.009802314452826977, 0.01041598990559578, 0.011029666289687157, 0.01164334174245596, 0.012257017195224762, 0.01287069357931614, 0.013484369963407516, 0.014098045416176319, 0.014711721800267696, 0.015325397253036499, 0.015939073637127876, 0.016552750021219254, 0.01716642454266548, 0.01778010092675686, 0.018393777310848236, 0.019007453694939613, 0.01962112821638584, 0.02023480460047722, 0.020848480984568596, 0.021462157368659973, 0.0220758318901062, 0.02268950827419758, 0.023303182795643806, 0.023916859179735184, 0.024530533701181412, 0.02514421008527279, 0.025757886469364166, 0.026371560990810394, 0.02698523737490177, 0.02759891375899315, 0.028212588280439377, 0.028826264664530754, 0.029439939185976982, 0.03005361557006836, 0.030667291954159737, 0.031280968338251114, 0.03189464285969734, 0.03250831738114357, 0.033121995627880096]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 8.0, 9.0, 4.0, 14.0, 10.0, 19.0, 21.0, 25.0, 33.0, 30.0, 35.0, 33.0, 36.0, 33.0, 45.0, 35.0, 44.0, 39.0, 46.0, 39.0, 37.0, 37.0, 33.0, 43.0, 27.0, 29.0, 28.0, 28.0, 13.0, 22.0, 16.0, 23.0, 14.0, 12.0, 10.0, 7.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00344871892593801, -0.0033506317995488644, -0.0032525446731597185, -0.0031544575467705727, -0.0030563706532120705, -0.002958283293992281, -0.0028601964004337788, -0.002762109274044633, -0.002664022147655487, -0.002565935021266341, -0.0024678478948771954, -0.0023697607684880495, -0.0022716736420989037, -0.0021735867485404015, -0.0020754996221512556, -0.0019774124957621098, -0.001879325369372964, -0.001781238242983818, -0.0016831511165946722, -0.0015850641066208482, -0.0014869769802317023, -0.0013888898538425565, -0.0012908028438687325, -0.0011927157174795866, -0.0010946285910904408, -0.000996541464701295, -0.00089845439651981, -0.000800367328338325, -0.0007022802019491792, -0.0006041930755600333, -0.0005061060073785484, -0.00040801893919706345, -0.00030993157997727394, -0.00021184448269195855, -0.00011375738540664315, -1.5670288121327758e-05, 8.241680916398764e-05, 0.0001805039355531335, 0.0002785910037346184, 0.00037667807191610336, 0.0004747651983052492, 0.0005728523246943951, 0.00067093939287588, 0.0007690264610573649, 0.0008671135874465108, 0.0009652007138356566, 0.0010632877238094807, 0.0011613748501986265, 0.0012594619765877724, 0.0013575491029769182, 0.001455636229366064, 0.001553723239339888, 0.001651810365729034, 0.0017498974921181798, 0.0018479845020920038, 0.0019460716284811497, 0.0020441587548702955, 0.0021422458812594414, 0.0022403330076485872, 0.002338420134037733, 0.0024365070275962353, 0.0025345943868160248, 0.002632681280374527, 0.002730768406763673, 0.0028288555331528187]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 19.0, 21.0, 29.0, 38.0, 73.0, 86.0, 166.0, 383.0, 857.0, 2229.0, 8163.0, 51563.0, 829153.0, 135188.0, 14964.0, 3328.0, 1216.0, 503.0, 216.0, 135.0, 72.0, 45.0, 40.0, 19.0, 9.0, 11.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011129379272460938, -0.0010817497968673706, -0.0010505616664886475, -0.0010193735361099243, -0.0009881854057312012, -0.000956997275352478, -0.0009258091449737549, -0.0008946210145950317, -0.0008634328842163086, -0.0008322447538375854, -0.0008010566234588623, -0.0007698684930801392, -0.000738680362701416, -0.0007074922323226929, -0.0006763041019439697, -0.0006451159715652466, -0.0006139278411865234, -0.0005827397108078003, -0.0005515515804290771, -0.000520363450050354, -0.0004891753196716309, -0.0004579871892929077, -0.00042679905891418457, -0.0003956109285354614, -0.0003644227981567383, -0.00033323466777801514, -0.000302046537399292, -0.00027085840702056885, -0.0002396702766418457, -0.00020848214626312256, -0.00017729401588439941, -0.00014610588550567627, -0.00011491775512695312, -8.372962474822998e-05, -5.2541494369506836e-05, -2.135336399078369e-05, 9.834766387939453e-06, 4.10228967666626e-05, 7.221102714538574e-05, 0.00010339915752410889, 0.00013458728790283203, 0.00016577541828155518, 0.00019696354866027832, 0.00022815167903900146, 0.0002593398094177246, 0.00029052793979644775, 0.0003217160701751709, 0.00035290420055389404, 0.0003840923309326172, 0.00041528046131134033, 0.0004464685916900635, 0.0004776567220687866, 0.0005088448524475098, 0.0005400329828262329, 0.0005712211132049561, 0.0006024092435836792, 0.0006335973739624023, 0.0006647855043411255, 0.0006959736347198486, 0.0007271617650985718, 0.0007583498954772949, 0.0007895380258560181, 0.0008207261562347412, 0.0008519142866134644, 0.0008831024169921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 11.0, 12.0, 20.0, 22.0, 21.0, 31.0, 45.0, 61.0, 82.0, 63.0, 79.0, 88.0, 70.0, 80.0, 61.0, 47.0, 31.0, 38.0, 32.0, 17.0, 18.0, 13.0, 9.0, 10.0, 12.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004360198974609375, -0.004212379455566406, -0.0040645599365234375, -0.003916740417480469, -0.0037689208984375, -0.0036211013793945312, -0.0034732818603515625, -0.0033254623413085938, -0.003177642822265625, -0.0030298233032226562, -0.0028820037841796875, -0.0027341842651367188, -0.00258636474609375, -0.0024385452270507812, -0.0022907257080078125, -0.0021429061889648438, -0.001995086669921875, -0.0018472671508789062, -0.0016994476318359375, -0.0015516281127929688, -0.00140380859375, -0.0012559890747070312, -0.0011081695556640625, -0.0009603500366210938, -0.000812530517578125, -0.0006647109985351562, -0.0005168914794921875, -0.00036907196044921875, -0.00022125244140625, -7.343292236328125e-05, 7.43865966796875e-05, 0.00022220611572265625, 0.000370025634765625, 0.0005178451538085938, 0.0006656646728515625, 0.0008134841918945312, 0.0009613037109375, 0.0011091232299804688, 0.0012569427490234375, 0.0014047622680664062, 0.001552581787109375, 0.0017004013061523438, 0.0018482208251953125, 0.0019960403442382812, 0.00214385986328125, 0.0022916793823242188, 0.0024394989013671875, 0.0025873184204101562, 0.002735137939453125, 0.0028829574584960938, 0.0030307769775390625, 0.0031785964965820312, 0.003326416015625, 0.0034742355346679688, 0.0036220550537109375, 0.0037698745727539062, 0.003917694091796875, 0.004065513610839844, 0.0042133331298828125, 0.004361152648925781, 0.00450897216796875, 0.004656791687011719, 0.0048046112060546875, 0.004952430725097656, 0.005100250244140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 15.0, 10.0, 14.0, 22.0, 29.0, 39.0, 45.0, 52.0, 65.0, 103.0, 105.0, 143.0, 265.0, 458.0, 1300.0, 4797.0, 25813.0, 503044.0, 479525.0, 25423.0, 4559.0, 1322.0, 495.0, 243.0, 142.0, 99.0, 87.0, 61.0, 46.0, 40.0, 34.0, 38.0, 20.0, 14.0, 17.0, 13.0, 10.0, 5.0, 9.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002551078796386719, -0.00024737603962421417, -0.00023964419960975647, -0.00023191235959529877, -0.00022418051958084106, -0.00021644867956638336, -0.00020871683955192566, -0.00020098499953746796, -0.00019325315952301025, -0.00018552131950855255, -0.00017778947949409485, -0.00017005763947963715, -0.00016232579946517944, -0.00015459395945072174, -0.00014686211943626404, -0.00013913027942180634, -0.00013139843940734863, -0.00012366659939289093, -0.00011593475937843323, -0.00010820291936397552, -0.00010047107934951782, -9.273923933506012e-05, -8.500739932060242e-05, -7.727555930614471e-05, -6.954371929168701e-05, -6.181187927722931e-05, -5.4080039262771606e-05, -4.6348199248313904e-05, -3.86163592338562e-05, -3.08845192193985e-05, -2.3152679204940796e-05, -1.5420839190483093e-05, -7.68899917602539e-06, 4.284083843231201e-08, 7.774680852890015e-06, 1.5506520867347717e-05, 2.323836088180542e-05, 3.097020089626312e-05, 3.8702040910720825e-05, 4.643388092517853e-05, 5.416572093963623e-05, 6.189756095409393e-05, 6.962940096855164e-05, 7.736124098300934e-05, 8.509308099746704e-05, 9.282492101192474e-05, 0.00010055676102638245, 0.00010828860104084015, 0.00011602044105529785, 0.00012375228106975555, 0.00013148412108421326, 0.00013921596109867096, 0.00014694780111312866, 0.00015467964112758636, 0.00016241148114204407, 0.00017014332115650177, 0.00017787516117095947, 0.00018560700118541718, 0.00019333884119987488, 0.00020107068121433258, 0.00020880252122879028, 0.00021653436124324799, 0.0002242662012577057, 0.0002319980412721634, 0.0002397298812866211]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 10.0, 5.0, 11.0, 13.0, 20.0, 21.0, 23.0, 22.0, 19.0, 32.0, 27.0, 31.0, 50.0, 39.0, 43.0, 38.0, 35.0, 45.0, 43.0, 48.0, 43.0, 42.0, 29.0, 42.0, 40.0, 34.0, 26.0, 22.0, 23.0, 15.0, 16.0, 20.0, 11.0, 6.0, 6.0, 12.0, 4.0, 7.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006664276123046875, -0.006462395191192627, -0.006260514259338379, -0.006058633327484131, -0.005856752395629883, -0.005654871463775635, -0.005452990531921387, -0.005251109600067139, -0.005049228668212891, -0.004847347736358643, -0.0046454668045043945, -0.0044435858726501465, -0.0042417049407958984, -0.00403982400894165, -0.0038379430770874023, -0.0036360621452331543, -0.0034341812133789062, -0.003232300281524658, -0.00303041934967041, -0.002828538417816162, -0.002626657485961914, -0.002424776554107666, -0.002222895622253418, -0.00202101469039917, -0.0018191337585449219, -0.0016172528266906738, -0.0014153718948364258, -0.0012134909629821777, -0.0010116100311279297, -0.0008097290992736816, -0.0006078481674194336, -0.00040596723556518555, -0.0002040863037109375, -2.205371856689453e-06, 0.0001996755599975586, 0.00040155649185180664, 0.0006034374237060547, 0.0008053183555603027, 0.0010071992874145508, 0.0012090802192687988, 0.0014109611511230469, 0.001612842082977295, 0.001814723014831543, 0.002016603946685791, 0.002218484878540039, 0.002420365810394287, 0.002622246742248535, 0.002824127674102783, 0.0030260086059570312, 0.0032278895378112793, 0.0034297704696655273, 0.0036316514015197754, 0.0038335323333740234, 0.0040354132652282715, 0.0042372941970825195, 0.004439175128936768, 0.004641056060791016, 0.004842936992645264, 0.005044817924499512, 0.00524669885635376, 0.005448579788208008, 0.005650460720062256, 0.005852341651916504, 0.006054222583770752, 0.006256103515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 98.0, 0.0, 0.0, 388.0, 0.0, 0.0, 0.0, 1481.0, 0.0, 0.0, 0.0, 5910.0, 0.0, 0.0, 0.0, 33008.0, 0.0, 0.0, 967297.0, 0.0, 0.0, 0.0, 32936.0, 0.0, 0.0, 0.0, 5567.0, 0.0, 0.0, 0.0, 1370.0, 0.0, 0.0, 355.0, 0.0, 0.0, 0.0, 98.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0], "bins": [-5.364418029785156e-07, -5.206093192100525e-07, -5.047768354415894e-07, -4.889443516731262e-07, -4.731118679046631e-07, -4.5727938413619995e-07, -4.414469003677368e-07, -4.256144165992737e-07, -4.0978193283081055e-07, -3.939494490623474e-07, -3.781169652938843e-07, -3.6228448152542114e-07, -3.46451997756958e-07, -3.3061951398849487e-07, -3.1478703022003174e-07, -2.989545464515686e-07, -2.8312206268310547e-07, -2.6728957891464233e-07, -2.514570951461792e-07, -2.3562461137771606e-07, -2.1979212760925293e-07, -2.039596438407898e-07, -1.8812716007232666e-07, -1.7229467630386353e-07, -1.564621925354004e-07, -1.4062970876693726e-07, -1.2479722499847412e-07, -1.0896474123001099e-07, -9.313225746154785e-08, -7.729977369308472e-08, -6.146728992462158e-08, -4.563480615615845e-08, -2.9802322387695312e-08, -1.3969838619232178e-08, 1.862645149230957e-09, 1.7695128917694092e-08, 3.3527612686157227e-08, 4.936009645462036e-08, 6.51925802230835e-08, 8.102506399154663e-08, 9.685754776000977e-08, 1.126900315284729e-07, 1.2852251529693604e-07, 1.4435499906539917e-07, 1.601874828338623e-07, 1.7601996660232544e-07, 1.9185245037078857e-07, 2.076849341392517e-07, 2.2351741790771484e-07, 2.39349901676178e-07, 2.551823854446411e-07, 2.7101486921310425e-07, 2.868473529815674e-07, 3.026798367500305e-07, 3.1851232051849365e-07, 3.343448042869568e-07, 3.501772880554199e-07, 3.6600977182388306e-07, 3.818422555923462e-07, 3.976747393608093e-07, 4.1350722312927246e-07, 4.293397068977356e-07, 4.4517219066619873e-07, 4.6100467443466187e-07, 4.76837158203125e-07]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 10.0, 0.0, 0.0, 19.0, 0.0, 0.0, 36.0, 0.0, 0.0, 61.0, 0.0, 0.0, 79.0, 0.0, 107.0, 0.0, 0.0, 104.0, 0.0, 0.0, 127.0, 0.0, 0.0, 134.0, 0.0, 114.0, 0.0, 0.0, 85.0, 0.0, 0.0, 53.0, 0.0, 0.0, 28.0, 0.0, 0.0, 19.0, 0.0, 17.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 2.0, 0.0, 4.0], "bins": [-7.152557373046875e-07, -6.938353180885315e-07, -6.724148988723755e-07, -6.509944796562195e-07, -6.295740604400635e-07, -6.081536412239075e-07, -5.867332220077515e-07, -5.653128027915955e-07, -5.438923835754395e-07, -5.224719643592834e-07, -5.010515451431274e-07, -4.796311259269714e-07, -4.5821070671081543e-07, -4.367902874946594e-07, -4.153698682785034e-07, -3.939494490623474e-07, -3.725290298461914e-07, -3.511086106300354e-07, -3.296881914138794e-07, -3.082677721977234e-07, -2.868473529815674e-07, -2.654269337654114e-07, -2.4400651454925537e-07, -2.2258609533309937e-07, -2.0116567611694336e-07, -1.7974525690078735e-07, -1.5832483768463135e-07, -1.3690441846847534e-07, -1.1548399925231934e-07, -9.406358003616333e-08, -7.264316082000732e-08, -5.122274160385132e-08, -2.9802322387695312e-08, -8.381903171539307e-09, 1.30385160446167e-08, 3.4458935260772705e-08, 5.587935447692871e-08, 7.729977369308472e-08, 9.872019290924072e-08, 1.2014061212539673e-07, 1.4156103134155273e-07, 1.6298145055770874e-07, 1.8440186977386475e-07, 2.0582228899002075e-07, 2.2724270820617676e-07, 2.4866312742233276e-07, 2.7008354663848877e-07, 2.915039658546448e-07, 3.129243850708008e-07, 3.343448042869568e-07, 3.557652235031128e-07, 3.771856427192688e-07, 3.986060619354248e-07, 4.200264811515808e-07, 4.414469003677368e-07, 4.628673195838928e-07, 4.842877388000488e-07, 5.057081580162048e-07, 5.271285772323608e-07, 5.485489964485168e-07, 5.699694156646729e-07, 5.913898348808289e-07, 6.128102540969849e-07, 6.342306733131409e-07, 6.556510925292969e-07]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 25.0, 0.0, 40.0, 0.0, 122.0, 0.0, 0.0, 325.0, 0.0, 1238.0, 0.0, 0.0, 5998.0, 0.0, 32215.0, 0.0, 968513.0, 0.0, 0.0, 32142.0, 0.0, 6244.0, 0.0, 1201.0, 0.0, 0.0, 317.0, 0.0, 111.0, 0.0, 0.0, 37.0, 0.0, 22.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.497146725654602e-07, -7.245689630508423e-07, -6.994232535362244e-07, -6.742775440216064e-07, -6.491318345069885e-07, -6.239861249923706e-07, -5.988404154777527e-07, -5.736947059631348e-07, -5.485489964485168e-07, -5.234032869338989e-07, -4.98257577419281e-07, -4.731118679046631e-07, -4.4796615839004517e-07, -4.2282044887542725e-07, -3.976747393608093e-07, -3.725290298461914e-07, -3.473833203315735e-07, -3.2223761081695557e-07, -2.9709190130233765e-07, -2.7194619178771973e-07, -2.468004822731018e-07, -2.2165477275848389e-07, -1.9650906324386597e-07, -1.7136335372924805e-07, -1.4621764421463013e-07, -1.210719347000122e-07, -9.592622518539429e-08, -7.078051567077637e-08, -4.563480615615845e-08, -2.0489096641540527e-08, 4.6566128730773926e-09, 2.9802322387695312e-08, 5.494803190231323e-08, 8.009374141693115e-08, 1.0523945093154907e-07, 1.30385160446167e-07, 1.555308699607849e-07, 1.8067657947540283e-07, 2.0582228899002075e-07, 2.3096799850463867e-07, 2.561137080192566e-07, 2.812594175338745e-07, 3.0640512704849243e-07, 3.3155083656311035e-07, 3.5669654607772827e-07, 3.818422555923462e-07, 4.069879651069641e-07, 4.3213367462158203e-07, 4.5727938413619995e-07, 4.824250936508179e-07, 5.075708031654358e-07, 5.327165126800537e-07, 5.578622221946716e-07, 5.830079317092896e-07, 6.081536412239075e-07, 6.332993507385254e-07, 6.584450602531433e-07, 6.835907697677612e-07, 7.087364792823792e-07, 7.338821887969971e-07, 7.59027898311615e-07, 7.841736078262329e-07, 8.093193173408508e-07, 8.344650268554688e-07]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 878.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0], "bins": [-2.384185791015625e-07, -2.3283064365386963e-07, -2.2724270820617676e-07, -2.2165477275848389e-07, -2.1606683731079102e-07, -2.1047890186309814e-07, -2.0489096641540527e-07, -1.993030309677124e-07, -1.9371509552001953e-07, -1.8812716007232666e-07, -1.825392246246338e-07, -1.7695128917694092e-07, -1.7136335372924805e-07, -1.6577541828155518e-07, -1.601874828338623e-07, -1.5459954738616943e-07, -1.4901161193847656e-07, -1.434236764907837e-07, -1.3783574104309082e-07, -1.3224780559539795e-07, -1.2665987014770508e-07, -1.210719347000122e-07, -1.1548399925231934e-07, -1.0989606380462646e-07, -1.043081283569336e-07, -9.872019290924072e-08, -9.313225746154785e-08, -8.754432201385498e-08, -8.195638656616211e-08, -7.636845111846924e-08, -7.078051567077637e-08, -6.51925802230835e-08, -5.960464477539063e-08, -5.4016709327697754e-08, -4.842877388000488e-08, -4.284083843231201e-08, -3.725290298461914e-08, -3.166496753692627e-08, -2.60770320892334e-08, -2.0489096641540527e-08, -1.4901161193847656e-08, -9.313225746154785e-09, -3.725290298461914e-09, 1.862645149230957e-09, 7.450580596923828e-09, 1.30385160446167e-08, 1.862645149230957e-08, 2.421438694000244e-08, 2.9802322387695312e-08, 3.5390257835388184e-08, 4.0978193283081055e-08, 4.6566128730773926e-08, 5.21540641784668e-08, 5.774199962615967e-08, 6.332993507385254e-08, 6.891787052154541e-08, 7.450580596923828e-08, 8.009374141693115e-08, 8.568167686462402e-08, 9.12696123123169e-08, 9.685754776000977e-08, 1.0244548320770264e-07, 1.0803341865539551e-07, 1.1362135410308838e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 6.0, 10.0, 10.0, 17.0, 31.0, 82.0, 151.0, 319.0, 207.0, 94.0, 36.0, 26.0, 6.0, 8.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004593722987920046, -0.004201252944767475, -0.0038087833672761917, -0.003416313324123621, -0.003023843513801694, -0.002631373703479767, -0.002238903660327196, -0.001846433850005269, -0.001453964039683342, -0.001061494229361415, -0.000669024302624166, -0.0002765543758869171, 0.00011591543443500996, 0.000508385244756937, 0.0009008552879095078, 0.0012933250982314348, 0.001685794908553362, 0.002078264718875289, 0.002470734529197216, 0.0028632045723497868, 0.003255674382671714, 0.003648144192993641, 0.004040614236146212, 0.004433084279298782, 0.004825553856790066, 0.0052180238999426365, 0.00561049347743392, 0.006002963520586491, 0.006395433098077774, 0.006787903141230345, 0.0071803731843829155, 0.007572842761874199, 0.007965313270688057, 0.00835778284817934, 0.008750253356993198, 0.009142722934484482, 0.009535192511975765, 0.009927662089467049, 0.010320132598280907, 0.01071260217577219, 0.011105071753263474, 0.011497541330754757, 0.011890011839568615, 0.012282481417059898, 0.012674950994551182, 0.013067420572042465, 0.013459891080856323, 0.013852360658347607, 0.014244831167161465, 0.014637300744652748, 0.015029771253466606, 0.01542224083095789, 0.015814710408449173, 0.01620718091726303, 0.01659965142607689, 0.016992120072245598, 0.017384590581059456, 0.017777061089873314, 0.018169529736042023, 0.01856200024485588, 0.01895447075366974, 0.019346939399838448, 0.019739409908652306, 0.020131880417466164, 0.020524349063634872]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 5.0, 10.0, 4.0, 6.0, 10.0, 13.0, 18.0, 22.0, 24.0, 32.0, 38.0, 43.0, 40.0, 36.0, 45.0, 53.0, 40.0, 52.0, 49.0, 52.0, 40.0, 32.0, 56.0, 38.0, 27.0, 38.0, 28.0, 18.0, 25.0, 17.0, 19.0, 8.0, 17.0, 11.0, 10.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.002756757428869605, -0.002689383225515485, -0.0026220090221613646, -0.0025546348188072443, -0.002487260615453124, -0.002419886412099004, -0.0023525122087448835, -0.0022851380053907633, -0.002217763802036643, -0.0021503895986825228, -0.0020830153953284025, -0.0020156411919742823, -0.001948266988620162, -0.0018808927852660418, -0.0018135185819119215, -0.0017461443785578012, -0.0016787700587883592, -0.001611395855434239, -0.0015440216520801187, -0.0014766474487259984, -0.0014092732453718781, -0.001341899042017758, -0.0012745247222483158, -0.0012071505188941956, -0.0011397763155400753, -0.001072402112185955, -0.0010050279088318348, -0.0009376537054777145, -0.0008702795021235943, -0.000802905298769474, -0.0007355310372076929, -0.0006681568338535726, -0.0006007828051224351, -0.0005334086017683148, -0.0004660343984141946, -0.00039866016595624387, -0.0003312859626021236, -0.00026391175924800336, -0.00019653752679005265, -0.0001291633234359324, -6.178912008181214e-05, 5.585090548265725e-06, 7.29593011783436e-05, 0.00014033351908437908, 0.00020770772243849933, 0.0002750819257926196, 0.0003424561582505703, 0.00040983036160469055, 0.0004772045649588108, 0.0005445787683129311, 0.0006119529716670513, 0.0006793271750211716, 0.0007467013783752918, 0.0008140755817294121, 0.0008814498432911932, 0.0009488240466453135, 0.0010161981917917728, 0.001083572395145893, 0.0011509465985000134, 0.0012183208018541336, 0.0012856950052082539, 0.0013530692085623741, 0.0014204434119164944, 0.0014878176152706146, 0.0015551919350400567]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 10.0, 18.0, 19.0, 36.0, 45.0, 70.0, 104.0, 199.0, 298.0, 537.0, 950.0, 1676.0, 3190.0, 6449.0, 14196.0, 36541.0, 125991.0, 601926.0, 177504.0, 45587.0, 17214.0, 7645.0, 3741.0, 1990.0, 1070.0, 579.0, 382.0, 220.0, 114.0, 98.0, 54.0, 33.0, 15.0, 15.0, 9.0, 7.0, 9.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0055084228515625, -0.005334138870239258, -0.005159854888916016, -0.0049855709075927734, -0.004811286926269531, -0.004637002944946289, -0.004462718963623047, -0.004288434982299805, -0.0041141510009765625, -0.00393986701965332, -0.003765583038330078, -0.003591299057006836, -0.0034170150756835938, -0.0032427310943603516, -0.0030684471130371094, -0.002894163131713867, -0.002719879150390625, -0.002545595169067383, -0.0023713111877441406, -0.0021970272064208984, -0.0020227432250976562, -0.001848459243774414, -0.0016741752624511719, -0.0014998912811279297, -0.0013256072998046875, -0.0011513233184814453, -0.0009770393371582031, -0.0008027553558349609, -0.0006284713745117188, -0.00045418739318847656, -0.0002799034118652344, -0.00010561943054199219, 6.866455078125e-05, 0.0002429485321044922, 0.0004172325134277344, 0.0005915164947509766, 0.0007658004760742188, 0.0009400844573974609, 0.0011143684387207031, 0.0012886524200439453, 0.0014629364013671875, 0.0016372203826904297, 0.0018115043640136719, 0.001985788345336914, 0.0021600723266601562, 0.0023343563079833984, 0.0025086402893066406, 0.002682924270629883, 0.002857208251953125, 0.003031492233276367, 0.0032057762145996094, 0.0033800601959228516, 0.0035543441772460938, 0.003728628158569336, 0.003902912139892578, 0.00407719612121582, 0.0042514801025390625, 0.004425764083862305, 0.004600048065185547, 0.004774332046508789, 0.004948616027832031, 0.0051229000091552734, 0.005297183990478516, 0.005471467971801758, 0.005645751953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 9.0, 16.0, 20.0, 32.0, 38.0, 62.0, 64.0, 94.0, 101.0, 89.0, 103.0, 92.0, 64.0, 60.0, 48.0, 25.0, 22.0, 23.0, 13.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008788108825683594, -0.0008571147918701172, -0.000835418701171875, -0.0008137226104736328, -0.0007920265197753906, -0.0007703304290771484, -0.0007486343383789062, -0.0007269382476806641, -0.0007052421569824219, -0.0006835460662841797, -0.0006618499755859375, -0.0006401538848876953, -0.0006184577941894531, -0.0005967617034912109, -0.0005750656127929688, -0.0005533695220947266, -0.0005316734313964844, -0.0005099773406982422, -0.00048828125, -0.0004665851593017578, -0.0004448890686035156, -0.00042319297790527344, -0.00040149688720703125, -0.00037980079650878906, -0.0003581047058105469, -0.0003364086151123047, -0.0003147125244140625, -0.0002930164337158203, -0.0002713203430175781, -0.00024962425231933594, -0.00022792816162109375, -0.00020623207092285156, -0.00018453598022460938, -0.0001628398895263672, -0.000141143798828125, -0.00011944770812988281, -9.775161743164062e-05, -7.605552673339844e-05, -5.435943603515625e-05, -3.266334533691406e-05, -1.0967254638671875e-05, 1.0728836059570312e-05, 3.24249267578125e-05, 5.412101745605469e-05, 7.581710815429688e-05, 9.751319885253906e-05, 0.00011920928955078125, 0.00014090538024902344, 0.00016260147094726562, 0.0001842975616455078, 0.00020599365234375, 0.0002276897430419922, 0.0002493858337402344, 0.00027108192443847656, 0.00029277801513671875, 0.00031447410583496094, 0.0003361701965332031, 0.0003578662872314453, 0.0003795623779296875, 0.0004012584686279297, 0.0004229545593261719, 0.00044465065002441406, 0.00046634674072265625, 0.00048804283142089844, 0.0005097389221191406]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 2.0, 3.0, 6.0, 7.0, 13.0, 19.0, 32.0, 30.0, 48.0, 83.0, 115.0, 166.0, 218.0, 305.0, 434.0, 629.0, 900.0, 1449.0, 2202.0, 3646.0, 5753.0, 9809.0, 17367.0, 33135.0, 69133.0, 176710.0, 418208.0, 167304.0, 66444.0, 32396.0, 16877.0, 9585.0, 5751.0, 3415.0, 2042.0, 1371.0, 947.0, 616.0, 402.0, 305.0, 212.0, 141.0, 99.0, 66.0, 57.0, 30.0, 28.0, 15.0, 15.0, 11.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00115203857421875, -0.0011129528284072876, -0.0010738670825958252, -0.0010347813367843628, -0.0009956955909729004, -0.000956609845161438, -0.0009175240993499756, -0.0008784383535385132, -0.0008393526077270508, -0.0008002668619155884, -0.000761181116104126, -0.0007220953702926636, -0.0006830096244812012, -0.0006439238786697388, -0.0006048381328582764, -0.000565752387046814, -0.0005266666412353516, -0.00048758089542388916, -0.00044849514961242676, -0.00040940940380096436, -0.00037032365798950195, -0.00033123791217803955, -0.00029215216636657715, -0.00025306642055511475, -0.00021398067474365234, -0.00017489492893218994, -0.00013580918312072754, -9.672343730926514e-05, -5.7637691497802734e-05, -1.8551945686340332e-05, 2.053380012512207e-05, 5.961954593658447e-05, 9.870529174804688e-05, 0.00013779103755950928, 0.00017687678337097168, 0.00021596252918243408, 0.0002550482749938965, 0.0002941340208053589, 0.0003332197666168213, 0.0003723055124282837, 0.0004113912582397461, 0.0004504770040512085, 0.0004895627498626709, 0.0005286484956741333, 0.0005677342414855957, 0.0006068199872970581, 0.0006459057331085205, 0.0006849914789199829, 0.0007240772247314453, 0.0007631629705429077, 0.0008022487163543701, 0.0008413344621658325, 0.0008804202079772949, 0.0009195059537887573, 0.0009585916996002197, 0.0009976774454116821, 0.0010367631912231445, 0.001075848937034607, 0.0011149346828460693, 0.0011540204286575317, 0.0011931061744689941, 0.0012321919202804565, 0.001271277666091919, 0.0013103634119033813, 0.0013494491577148438]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 12.0, 16.0, 10.0, 23.0, 13.0, 34.0, 35.0, 41.0, 57.0, 49.0, 58.0, 65.0, 79.0, 76.0, 71.0, 60.0, 51.0, 47.0, 26.0, 32.0, 26.0, 18.0, 22.0, 19.0, 15.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000827789306640625, -0.0007990747690200806, -0.0007703602313995361, -0.0007416456937789917, -0.0007129311561584473, -0.0006842166185379028, -0.0006555020809173584, -0.000626787543296814, -0.0005980730056762695, -0.0005693584680557251, -0.0005406439304351807, -0.0005119293928146362, -0.0004832148551940918, -0.00045450031757354736, -0.00042578577995300293, -0.0003970712423324585, -0.00036835670471191406, -0.00033964216709136963, -0.0003109276294708252, -0.00028221309185028076, -0.00025349855422973633, -0.0002247840166091919, -0.00019606947898864746, -0.00016735494136810303, -0.0001386404037475586, -0.00010992586612701416, -8.121132850646973e-05, -5.249679088592529e-05, -2.378225326538086e-05, 4.932284355163574e-06, 3.364682197570801e-05, 6.236135959625244e-05, 9.107589721679688e-05, 0.00011979043483734131, 0.00014850497245788574, 0.00017721951007843018, 0.0002059340476989746, 0.00023464858531951904, 0.0002633631229400635, 0.0002920776605606079, 0.00032079219818115234, 0.0003495067358016968, 0.0003782212734222412, 0.00040693581104278564, 0.0004356503486633301, 0.0004643648862838745, 0.0004930794239044189, 0.0005217939615249634, 0.0005505084991455078, 0.0005792230367660522, 0.0006079375743865967, 0.0006366521120071411, 0.0006653666496276855, 0.00069408118724823, 0.0007227957248687744, 0.0007515102624893188, 0.0007802248001098633, 0.0008089393377304077, 0.0008376538753509521, 0.0008663684129714966, 0.000895082950592041, 0.0009237974882125854, 0.0009525120258331299, 0.0009812265634536743, 0.0010099411010742188]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 16.0, 13.0, 7.0, 10.0, 19.0, 25.0, 28.0, 43.0, 58.0, 62.0, 83.0, 129.0, 149.0, 258.0, 406.0, 792.0, 1736.0, 5341.0, 173753.0, 855587.0, 5980.0, 1854.0, 812.0, 414.0, 270.0, 192.0, 129.0, 105.0, 61.0, 51.0, 27.0, 24.0, 32.0, 25.0, 17.0, 8.0, 6.0, 10.0, 7.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004180908203125, -0.004046201705932617, -0.003911495208740234, -0.0037767887115478516, -0.0036420822143554688, -0.003507375717163086, -0.003372669219970703, -0.0032379627227783203, -0.0031032562255859375, -0.0029685497283935547, -0.002833843231201172, -0.002699136734008789, -0.0025644302368164062, -0.0024297237396240234, -0.0022950172424316406, -0.002160310745239258, -0.002025604248046875, -0.0018908977508544922, -0.0017561912536621094, -0.0016214847564697266, -0.0014867782592773438, -0.001352071762084961, -0.0012173652648925781, -0.0010826587677001953, -0.0009479522705078125, -0.0008132457733154297, -0.0006785392761230469, -0.0005438327789306641, -0.00040912628173828125, -0.00027441978454589844, -0.00013971328735351562, -5.0067901611328125e-06, 0.00012969970703125, 0.0002644062042236328, 0.0003991127014160156, 0.0005338191986083984, 0.0006685256958007812, 0.0008032321929931641, 0.0009379386901855469, 0.0010726451873779297, 0.0012073516845703125, 0.0013420581817626953, 0.0014767646789550781, 0.001611471176147461, 0.0017461776733398438, 0.0018808841705322266, 0.0020155906677246094, 0.002150297164916992, 0.002285003662109375, 0.002419710159301758, 0.0025544166564941406, 0.0026891231536865234, 0.0028238296508789062, 0.002958536148071289, 0.003093242645263672, 0.0032279491424560547, 0.0033626556396484375, 0.0034973621368408203, 0.003632068634033203, 0.003766775131225586, 0.0039014816284179688, 0.0040361881256103516, 0.004170894622802734, 0.004305601119995117, 0.0044403076171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 7.0, 13.0, 0.0, 26.0, 0.0, 93.0, 232.0, 0.0, 288.0, 0.0, 207.0, 0.0, 96.0, 31.0, 0.0, 8.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.192153811454773e-07, -8.847564458847046e-07, -8.502975106239319e-07, -8.158385753631592e-07, -7.813796401023865e-07, -7.469207048416138e-07, -7.124617695808411e-07, -6.780028343200684e-07, -6.435438990592957e-07, -6.09084963798523e-07, -5.746260285377502e-07, -5.401670932769775e-07, -5.057081580162048e-07, -4.7124922275543213e-07, -4.367902874946594e-07, -4.023313522338867e-07, -3.67872416973114e-07, -3.334134817123413e-07, -2.989545464515686e-07, -2.644956111907959e-07, -2.300366759300232e-07, -1.955777406692505e-07, -1.6111880540847778e-07, -1.2665987014770508e-07, -9.220093488693237e-08, -5.774199962615967e-08, -2.3283064365386963e-08, 1.1175870895385742e-08, 4.563480615615845e-08, 8.009374141693115e-08, 1.1455267667770386e-07, 1.4901161193847656e-07, 1.8347054719924927e-07, 2.1792948246002197e-07, 2.523884177207947e-07, 2.868473529815674e-07, 3.213062882423401e-07, 3.557652235031128e-07, 3.902241587638855e-07, 4.246830940246582e-07, 4.591420292854309e-07, 4.936009645462036e-07, 5.280598998069763e-07, 5.62518835067749e-07, 5.969777703285217e-07, 6.314367055892944e-07, 6.658956408500671e-07, 7.003545761108398e-07, 7.348135113716125e-07, 7.692724466323853e-07, 8.03731381893158e-07, 8.381903171539307e-07, 8.726492524147034e-07, 9.071081876754761e-07, 9.415671229362488e-07, 9.760260581970215e-07, 1.0104849934577942e-06, 1.044943928718567e-06, 1.0794028639793396e-06, 1.1138617992401123e-06, 1.148320734500885e-06, 1.1827796697616577e-06, 1.2172386050224304e-06, 1.2516975402832031e-06]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 8.0, 8.0, 24.0, 18.0, 32.0, 38.0, 45.0, 70.0, 96.0, 117.0, 137.0, 198.0, 275.0, 326.0, 433.0, 549.0, 810.0, 1140.0, 1558.0, 2366.0, 4357.0, 13735.0, 790192.0, 209676.0, 10618.0, 3803.0, 2279.0, 1540.0, 1086.0, 775.0, 542.0, 419.0, 310.0, 229.0, 177.0, 136.0, 115.0, 82.0, 56.0, 51.0, 33.0, 35.0, 14.0, 17.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.001140594482421875, -0.0011059492826461792, -0.0010713040828704834, -0.0010366588830947876, -0.0010020136833190918, -0.000967368483543396, -0.0009327232837677002, -0.0008980780839920044, -0.0008634328842163086, -0.0008287876844406128, -0.000794142484664917, -0.0007594972848892212, -0.0007248520851135254, -0.0006902068853378296, -0.0006555616855621338, -0.000620916485786438, -0.0005862712860107422, -0.0005516260862350464, -0.0005169808864593506, -0.0004823356866836548, -0.000447690486907959, -0.0004130452871322632, -0.0003784000873565674, -0.0003437548875808716, -0.0003091096878051758, -0.00027446448802948, -0.00023981928825378418, -0.00020517408847808838, -0.00017052888870239258, -0.00013588368892669678, -0.00010123848915100098, -6.659328937530518e-05, -3.1948089599609375e-05, 2.6971101760864258e-06, 3.7342309951782227e-05, 7.198750972747803e-05, 0.00010663270950317383, 0.00014127790927886963, 0.00017592310905456543, 0.00021056830883026123, 0.00024521350860595703, 0.00027985870838165283, 0.00031450390815734863, 0.00034914910793304443, 0.00038379430770874023, 0.00041843950748443604, 0.00045308470726013184, 0.00048772990703582764, 0.0005223751068115234, 0.0005570203065872192, 0.000591665506362915, 0.0006263107061386108, 0.0006609559059143066, 0.0006956011056900024, 0.0007302463054656982, 0.000764891505241394, 0.0007995367050170898, 0.0008341819047927856, 0.0008688271045684814, 0.0009034723043441772, 0.000938117504119873, 0.0009727627038955688, 0.0010074079036712646, 0.0010420531034469604, 0.0010766983032226562]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 5.0, 15.0, 16.0, 80.0, 416.0, 343.0, 69.0, 26.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007772445678710938, -0.0007536560297012329, -0.0007300674915313721, -0.0007064789533615112, -0.0006828904151916504, -0.0006593018770217896, -0.0006357133388519287, -0.0006121248006820679, -0.000588536262512207, -0.0005649477243423462, -0.0005413591861724854, -0.0005177706480026245, -0.0004941821098327637, -0.00047059357166290283, -0.000447005033493042, -0.00042341649532318115, -0.0003998279571533203, -0.00037623941898345947, -0.00035265088081359863, -0.0003290623426437378, -0.00030547380447387695, -0.0002818852663040161, -0.0002582967281341553, -0.00023470818996429443, -0.0002111196517944336, -0.00018753111362457275, -0.00016394257545471191, -0.00014035403728485107, -0.00011676549911499023, -9.31769609451294e-05, -6.958842277526855e-05, -4.5999884605407715e-05, -2.2411346435546875e-05, 1.1771917343139648e-06, 2.4765729904174805e-05, 4.8354268074035645e-05, 7.194280624389648e-05, 9.553134441375732e-05, 0.00011911988258361816, 0.000142708420753479, 0.00016629695892333984, 0.00018988549709320068, 0.00021347403526306152, 0.00023706257343292236, 0.0002606511116027832, 0.00028423964977264404, 0.0003078281879425049, 0.0003314167261123657, 0.00035500526428222656, 0.0003785938024520874, 0.00040218234062194824, 0.0004257708787918091, 0.0004493594169616699, 0.00047294795513153076, 0.0004965364933013916, 0.0005201250314712524, 0.0005437135696411133, 0.0005673021078109741, 0.000590890645980835, 0.0006144791841506958, 0.0006380677223205566, 0.0006616562604904175, 0.0006852447986602783, 0.0007088333368301392, 0.000732421875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 7.0, 18.0, 30.0, 35.0, 55.0, 113.0, 150.0, 202.0, 130.0, 90.0, 56.0, 22.0, 27.0, 14.0, 6.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0040842583402991295, -0.0039343987591564655, -0.003784538945183158, -0.0036346791312098503, -0.0034848195500671864, -0.0033349597360938787, -0.003185099922120571, -0.003035240340977907, -0.0028853805270045996, -0.002735520713031292, -0.002585661131888628, -0.0024358013179153204, -0.002285941503942013, -0.002136081922799349, -0.0019862221088260412, -0.0018363624112680554, -0.0016865027137100697, -0.0015366430161520839, -0.001386783318594098, -0.0012369235046207905, -0.0010870638070628047, -0.0009372041095048189, -0.0007873443537391722, -0.0006374845979735255, -0.00048762490041553974, -0.0003377651737537235, -0.00018790544709190726, -3.8045720430091023e-05, 0.00011181400623172522, 0.000261673703789711, 0.0004115334595553577, 0.0005613932153210044, 0.0007112524472177029, 0.0008611121447756886, 0.0010109718423336744, 0.001160831656306982, 0.0013106913538649678, 0.0014605510514229536, 0.0016104108653962612, 0.001760270562954247, 0.0019101302605122328, 0.0020599900744855404, 0.0022098496556282043, 0.002359709469601512, 0.0025095692835748196, 0.0026594288647174835, 0.002809288678690791, 0.0029591484926640987, 0.0031090080738067627, 0.0032588678877800703, 0.0034087274689227343, 0.003558587282896042, 0.003708446864038706, 0.0038583066780120134, 0.004008166491985321, 0.004158026073127985, 0.004307885654270649, 0.004457745235413313, 0.004607605282217264, 0.004757464863359928, 0.004907324444502592, 0.005057184025645256, 0.005207044072449207, 0.005356903653591871, 0.0055067637003958225]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [6.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 9.0, 4.0, 3.0, 16.0, 16.0, 15.0, 13.0, 17.0, 21.0, 28.0, 33.0, 30.0, 29.0, 22.0, 30.0, 46.0, 50.0, 36.0, 30.0, 40.0, 43.0, 28.0, 32.0, 41.0, 26.0, 39.0, 44.0, 30.0, 25.0, 26.0, 22.0, 24.0, 23.0, 18.0, 10.0, 12.0, 6.0, 12.0, 14.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009674841421656311, -0.0009320353274233639, -0.0008965865708887577, -0.0008611377561464906, -0.0008256889996118844, -0.0007902401848696172, -0.000754791428335011, -0.0007193426135927439, -0.0006838937988504767, -0.0006484449841082096, -0.0006129962275736034, -0.0005775474128313363, -0.00054209865629673, -0.0005066498415544629, -0.00047120105591602623, -0.00043575227027758956, -0.00040030351374298334, -0.00036485472810454667, -0.00032940594246611, -0.00029395712772384286, -0.00025850837118923664, -0.00022305957099888474, -0.00018761077080853283, -0.00015216198517009616, -0.00011671319953165948, -8.126441389322281e-05, -4.581562097882852e-05, -1.036682806443423e-05, 2.5081957574002445e-05, 6.053074321243912e-05, 9.597954340279102e-05, 0.0001314283290412277, 0.0001668771728873253, 0.00020232595852576196, 0.00023777474416419864, 0.00027322355890646577, 0.000308672315441072, 0.0003441211301833391, 0.0003795699158217758, 0.00041501870146021247, 0.00045046748709864914, 0.0004859162727370858, 0.000521365087479353, 0.0005568138440139592, 0.0005922626587562263, 0.0006277114152908325, 0.0006631602300330997, 0.0006986090447753668, 0.000734057801309973, 0.0007695066160522401, 0.0008049553725868464, 0.0008404041873291135, 0.0008758529438637197, 0.0009113017586059868, 0.000946750515140593, 0.0009821993298828602, 0.0010176481446251273, 0.0010530969593673944, 0.0010885457741096616, 0.0011239944724366069, 0.001159443287178874, 0.0011948921019211411, 0.0012303409166634083, 0.0012657896149903536, 0.0013012384297326207]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 5.0, 12.0, 12.0, 27.0, 41.0, 60.0, 59.0, 101.0, 183.0, 263.0, 357.0, 564.0, 893.0, 1593.0, 2703.0, 5385.0, 12706.0, 62439.0, 4053838.0, 32640.0, 9820.0, 4447.0, 2280.0, 1313.0, 861.0, 465.0, 375.0, 245.0, 175.0, 116.0, 76.0, 61.0, 41.0, 27.0, 18.0, 21.0, 18.0, 13.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003772735595703125, -0.0036443471908569336, -0.003515958786010742, -0.0033875703811645508, -0.0032591819763183594, -0.003130793571472168, -0.0030024051666259766, -0.002874016761779785, -0.0027456283569335938, -0.0026172399520874023, -0.002488851547241211, -0.0023604631423950195, -0.002232074737548828, -0.0021036863327026367, -0.0019752979278564453, -0.001846909523010254, -0.0017185211181640625, -0.001590132713317871, -0.0014617443084716797, -0.0013333559036254883, -0.0012049674987792969, -0.0010765790939331055, -0.0009481906890869141, -0.0008198022842407227, -0.0006914138793945312, -0.0005630254745483398, -0.00043463706970214844, -0.00030624866485595703, -0.00017786026000976562, -4.947185516357422e-05, 7.891654968261719e-05, 0.0002073049545288086, 0.000335693359375, 0.0004640817642211914, 0.0005924701690673828, 0.0007208585739135742, 0.0008492469787597656, 0.000977635383605957, 0.0011060237884521484, 0.0012344121932983398, 0.0013628005981445312, 0.0014911890029907227, 0.001619577407836914, 0.0017479658126831055, 0.0018763542175292969, 0.0020047426223754883, 0.0021331310272216797, 0.002261519432067871, 0.0023899078369140625, 0.002518296241760254, 0.0026466846466064453, 0.0027750730514526367, 0.002903461456298828, 0.0030318498611450195, 0.003160238265991211, 0.0032886266708374023, 0.0034170150756835938, 0.003545403480529785, 0.0036737918853759766, 0.003802180290222168, 0.003930568695068359, 0.004058957099914551, 0.004187345504760742, 0.004315733909606934, 0.004444122314453125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 19.0, 14.0, 9.0, 22.0, 29.0, 41.0, 48.0, 54.0, 65.0, 57.0, 62.0, 75.0, 72.0, 65.0, 57.0, 64.0, 49.0, 43.0, 35.0, 32.0, 16.0, 18.0, 10.0, 8.0, 7.0, 2.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0003910064697265625, -0.0003774799406528473, -0.0003639534115791321, -0.00035042688250541687, -0.00033690035343170166, -0.00032337382435798645, -0.00030984729528427124, -0.00029632076621055603, -0.0002827942371368408, -0.0002692677080631256, -0.0002557411789894104, -0.0002422146499156952, -0.00022868812084197998, -0.00021516159176826477, -0.00020163506269454956, -0.00018810853362083435, -0.00017458200454711914, -0.00016105547547340393, -0.00014752894639968872, -0.0001340024173259735, -0.0001204758882522583, -0.00010694935917854309, -9.342283010482788e-05, -7.989630103111267e-05, -6.636977195739746e-05, -5.284324288368225e-05, -3.931671380996704e-05, -2.579018473625183e-05, -1.2263655662536621e-05, 1.2628734111785889e-06, 1.4789402484893799e-05, 2.831593155860901e-05, 4.184246063232422e-05, 5.536898970603943e-05, 6.889551877975464e-05, 8.242204785346985e-05, 9.594857692718506e-05, 0.00010947510600090027, 0.00012300163507461548, 0.0001365281641483307, 0.0001500546932220459, 0.0001635812222957611, 0.00017710775136947632, 0.00019063428044319153, 0.00020416080951690674, 0.00021768733859062195, 0.00023121386766433716, 0.00024474039673805237, 0.0002582669258117676, 0.0002717934548854828, 0.000285319983959198, 0.0002988465130329132, 0.0003123730421066284, 0.00032589957118034363, 0.00033942610025405884, 0.00035295262932777405, 0.00036647915840148926, 0.00038000568747520447, 0.0003935322165489197, 0.0004070587456226349, 0.0004205852746963501, 0.0004341118037700653, 0.0004476383328437805, 0.00046116486191749573, 0.00047469139099121094]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 9.0, 13.0, 16.0, 24.0, 45.0, 81.0, 215.0, 945.0, 8844.0, 4116371.0, 64292.0, 2674.0, 413.0, 131.0, 71.0, 35.0, 28.0, 21.0, 10.0, 4.0, 2.0, 8.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00595855712890625, -0.0057648420333862305, -0.005571126937866211, -0.005377411842346191, -0.005183696746826172, -0.004989981651306152, -0.004796266555786133, -0.004602551460266113, -0.004408836364746094, -0.004215121269226074, -0.004021406173706055, -0.003827691078186035, -0.0036339759826660156, -0.003440260887145996, -0.0032465457916259766, -0.003052830696105957, -0.0028591156005859375, -0.002665400505065918, -0.0024716854095458984, -0.002277970314025879, -0.0020842552185058594, -0.0018905401229858398, -0.0016968250274658203, -0.0015031099319458008, -0.0013093948364257812, -0.0011156797409057617, -0.0009219646453857422, -0.0007282495498657227, -0.0005345344543457031, -0.0003408193588256836, -0.00014710426330566406, 4.661083221435547e-05, 0.000240325927734375, 0.00043404102325439453, 0.0006277561187744141, 0.0008214712142944336, 0.0010151863098144531, 0.0012089014053344727, 0.0014026165008544922, 0.0015963315963745117, 0.0017900466918945312, 0.0019837617874145508, 0.0021774768829345703, 0.00237119197845459, 0.0025649070739746094, 0.002758622169494629, 0.0029523372650146484, 0.003146052360534668, 0.0033397674560546875, 0.003533482551574707, 0.0037271976470947266, 0.003920912742614746, 0.004114627838134766, 0.004308342933654785, 0.004502058029174805, 0.004695773124694824, 0.004889488220214844, 0.005083203315734863, 0.005276918411254883, 0.005470633506774902, 0.005664348602294922, 0.005858063697814941, 0.006051778793334961, 0.0062454938888549805, 0.006439208984375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 18.0, 21.0, 40.0, 94.0, 479.0, 2738.0, 461.0, 92.0, 44.0, 20.0, 22.0, 15.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010738372802734375, -0.0010491609573364258, -0.001024484634399414, -0.0009998083114624023, -0.0009751319885253906, -0.0009504556655883789, -0.0009257793426513672, -0.0009011030197143555, -0.0008764266967773438, -0.000851750373840332, -0.0008270740509033203, -0.0008023977279663086, -0.0007777214050292969, -0.0007530450820922852, -0.0007283687591552734, -0.0007036924362182617, -0.00067901611328125, -0.0006543397903442383, -0.0006296634674072266, -0.0006049871444702148, -0.0005803108215332031, -0.0005556344985961914, -0.0005309581756591797, -0.000506281852722168, -0.00048160552978515625, -0.00045692920684814453, -0.0004322528839111328, -0.0004075765609741211, -0.0003829002380371094, -0.00035822391510009766, -0.00033354759216308594, -0.0003088712692260742, -0.0002841949462890625, -0.0002595186233520508, -0.00023484230041503906, -0.00021016597747802734, -0.00018548965454101562, -0.0001608133316040039, -0.0001361370086669922, -0.00011146068572998047, -8.678436279296875e-05, -6.210803985595703e-05, -3.743171691894531e-05, -1.2755393981933594e-05, 1.1920928955078125e-05, 3.6597251892089844e-05, 6.127357482910156e-05, 8.594989776611328e-05, 0.000110626220703125, 0.00013530254364013672, 0.00015997886657714844, 0.00018465518951416016, 0.00020933151245117188, 0.0002340078353881836, 0.0002586841583251953, 0.00028336048126220703, 0.00030803680419921875, 0.00033271312713623047, 0.0003573894500732422, 0.0003820657730102539, 0.0004067420959472656, 0.00043141841888427734, 0.00045609474182128906, 0.0004807710647583008, 0.0005054473876953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 9.0, 12.0, 14.0, 15.0, 20.0, 37.0, 48.0, 76.0, 97.0, 101.0, 148.0, 108.0, 92.0, 56.0, 52.0, 22.0, 18.0, 10.0, 11.0, 6.0, 4.0, 6.0, 3.0, 4.0, 8.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009207038674503565, -0.00088558963034302, -0.0008504753932356834, -0.0008153612143360078, -0.0007802469772286713, -0.0007451327401213348, -0.0007100185612216592, -0.0006749043241143227, -0.0006397900870069861, -0.0006046758498996496, -0.0005695616127923131, -0.0005344474338926375, -0.000499333196785301, -0.00046421895967796445, -0.0004291047516744584, -0.0003939905436709523, -0.0003588763065636158, -0.0003237620694562793, -0.0002886478614527732, -0.00025353365344926715, -0.00021841941634193063, -0.00018330519378650934, -0.00014819097123108804, -0.00011307676322758198, -7.796252612024546e-05, -4.2848303564824164e-05, -7.734081009402871e-06, 2.738014154601842e-05, 6.249436410143971e-05, 9.760858665686101e-05, 0.0001327228092122823, 0.00016783701721578836, 0.00020295125432312489, 0.00023806547687854618, 0.00027317969943396747, 0.00030829390743747354, 0.00034340814454481006, 0.0003785223816521466, 0.00041363658965565264, 0.0004487507976591587, 0.00048386503476649523, 0.0005189792718738317, 0.0005540935089811683, 0.0005892076878808439, 0.0006243219249881804, 0.0006594361620955169, 0.0006945503409951925, 0.000729664578102529, 0.0007647788152098656, 0.0007998930523172021, 0.0008350072894245386, 0.0008701214683242142, 0.0009052357054315507, 0.0009403499425388873, 0.0009754641214385629, 0.0010105783585458994, 0.001045692595653236, 0.0010808068327605724, 0.001115921069867909, 0.0011510353069752455, 0.0011861494276672602, 0.0012212636647745967, 0.0012563779018819332, 0.0012914921389892697, 0.0013266063760966063]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 17.0, 10.0, 14.0, 17.0, 17.0, 31.0, 35.0, 33.0, 23.0, 30.0, 52.0, 44.0, 38.0, 50.0, 57.0, 50.0, 48.0, 52.0, 46.0, 40.0, 41.0, 32.0, 45.0, 34.0, 22.0, 23.0, 17.0, 18.0, 16.0, 12.0, 7.0, 9.0, 7.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041233206866309047, -0.00039586066850461066, -0.00037938926834613085, -0.0003629178972914815, -0.0003464464971330017, -0.0003299750969745219, -0.0003135037259198725, -0.0002970323257613927, -0.0002805609256029129, -0.0002640895254444331, -0.0002476181252859533, -0.00023114675423130393, -0.00021467535407282412, -0.0001982039539143443, -0.00018173256830777973, -0.00016526118270121515, -0.00014878978254273534, -0.00013231838238425553, -0.00011584699677769095, -9.937560389516875e-05, -8.290421101264656e-05, -6.643281813012436e-05, -4.9961425247602165e-05, -3.349003236507997e-05, -1.7018639482557774e-05, -5.47246600035578e-07, 1.5924146282486618e-05, 3.239553916500881e-05, 4.886693204753101e-05, 6.53383249300532e-05, 8.18097178125754e-05, 9.82811106950976e-05, 0.00011475244536995888, 0.0001312238455284387, 0.00014769523113500327, 0.00016416661674156785, 0.00018063801690004766, 0.00019710941705852747, 0.00021358080266509205, 0.00023005218827165663, 0.00024652358843013644, 0.00026299498858861625, 0.00027946638874709606, 0.0002959377598017454, 0.0003124091599602252, 0.00032888056011870503, 0.0003453519311733544, 0.0003618233313318342, 0.000378294731490314, 0.0003947661316487938, 0.0004112375318072736, 0.000427708902861923, 0.0004441803030204028, 0.0004606517031788826, 0.00047712307423353195, 0.0004935945034958422, 0.0005100658745504916, 0.0005265372456051409, 0.0005430086748674512, 0.0005594800459221005, 0.0005759514169767499, 0.0005924228462390602, 0.0006088942172937095, 0.0006253656465560198, 0.0006418370176106691]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 9.0, 5.0, 10.0, 18.0, 19.0, 16.0, 33.0, 38.0, 49.0, 60.0, 89.0, 106.0, 148.0, 228.0, 363.0, 601.0, 1197.0, 3117.0, 11394.0, 69564.0, 809643.0, 128176.0, 16116.0, 4006.0, 1529.0, 739.0, 395.0, 245.0, 163.0, 122.0, 87.0, 67.0, 51.0, 39.0, 22.0, 21.0, 22.0, 13.0, 9.0, 8.0, 2.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.006261825561523e-05, -8.66791233420372e-05, -8.329562842845917e-05, -7.991213351488113e-05, -7.65286386013031e-05, -7.314514368772507e-05, -6.976164877414703e-05, -6.6378153860569e-05, -6.299465894699097e-05, -5.961116403341293e-05, -5.62276691198349e-05, -5.2844174206256866e-05, -4.946067929267883e-05, -4.60771843791008e-05, -4.2693689465522766e-05, -3.931019455194473e-05, -3.59266996383667e-05, -3.2543204724788666e-05, -2.9159709811210632e-05, -2.57762148976326e-05, -2.2392719984054565e-05, -1.9009225070476532e-05, -1.56257301568985e-05, -1.2242235243320465e-05, -8.858740329742432e-06, -5.475245416164398e-06, -2.0917505025863647e-06, 1.2917444109916687e-06, 4.675239324569702e-06, 8.058734238147736e-06, 1.1442229151725769e-05, 1.4825724065303802e-05, 1.8209218978881836e-05, 2.159271389245987e-05, 2.4976208806037903e-05, 2.8359703719615936e-05, 3.174319863319397e-05, 3.5126693546772e-05, 3.851018846035004e-05, 4.189368337392807e-05, 4.5277178287506104e-05, 4.866067320108414e-05, 5.204416811466217e-05, 5.5427663028240204e-05, 5.881115794181824e-05, 6.219465285539627e-05, 6.55781477689743e-05, 6.896164268255234e-05, 7.234513759613037e-05, 7.57286325097084e-05, 7.911212742328644e-05, 8.249562233686447e-05, 8.58791172504425e-05, 8.926261216402054e-05, 9.264610707759857e-05, 9.60296019911766e-05, 9.941309690475464e-05, 0.00010279659181833267, 0.0001061800867319107, 0.00010956358164548874, 0.00011294707655906677, 0.0001163305714726448, 0.00011971406638622284, 0.00012309756129980087, 0.0001264810562133789]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 6.0, 6.0, 11.0, 16.0, 12.0, 20.0, 19.0, 29.0, 37.0, 32.0, 39.0, 36.0, 53.0, 38.0, 64.0, 55.0, 53.0, 56.0, 47.0, 41.0, 45.0, 48.0, 47.0, 41.0, 33.0, 24.0, 12.0, 12.0, 11.0, 11.0, 14.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003762245178222656, -0.0003623291850090027, -0.00034843385219573975, -0.0003345385193824768, -0.00032064318656921387, -0.00030674785375595093, -0.000292852520942688, -0.00027895718812942505, -0.0002650618553161621, -0.00025116652250289917, -0.00023727118968963623, -0.0002233758568763733, -0.00020948052406311035, -0.0001955851912498474, -0.00018168985843658447, -0.00016779452562332153, -0.0001538991928100586, -0.00014000385999679565, -0.00012610852718353271, -0.00011221319437026978, -9.831786155700684e-05, -8.44225287437439e-05, -7.052719593048096e-05, -5.663186311721802e-05, -4.273653030395508e-05, -2.884119749069214e-05, -1.49458646774292e-05, -1.0505318641662598e-06, 1.284480094909668e-05, 2.674013376235962e-05, 4.063546657562256e-05, 5.45307993888855e-05, 6.842613220214844e-05, 8.232146501541138e-05, 9.621679782867432e-05, 0.00011011213064193726, 0.0001240074634552002, 0.00013790279626846313, 0.00015179812908172607, 0.00016569346189498901, 0.00017958879470825195, 0.0001934841275215149, 0.00020737946033477783, 0.00022127479314804077, 0.0002351701259613037, 0.00024906545877456665, 0.0002629607915878296, 0.00027685612440109253, 0.00029075145721435547, 0.0003046467900276184, 0.00031854212284088135, 0.0003324374556541443, 0.0003463327884674072, 0.00036022812128067017, 0.0003741234540939331, 0.00038801878690719604, 0.000401914119720459, 0.0004158094525337219, 0.00042970478534698486, 0.0004436001181602478, 0.00045749545097351074, 0.0004713907837867737, 0.0004852861166000366, 0.0004991814494132996, 0.0005130767822265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 5.0, 16.0, 21.0, 30.0, 38.0, 73.0, 97.0, 104.0, 198.0, 320.0, 1002.0, 6254.0, 101999.0, 911023.0, 23183.0, 2649.0, 709.0, 268.0, 177.0, 120.0, 61.0, 71.0, 42.0, 23.0, 16.0, 18.0, 12.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6776065826416016e-05, -3.526173532009125e-05, -3.374740481376648e-05, -3.223307430744171e-05, -3.071874380111694e-05, -2.9204413294792175e-05, -2.7690082788467407e-05, -2.617575228214264e-05, -2.466142177581787e-05, -2.3147091269493103e-05, -2.1632760763168335e-05, -2.0118430256843567e-05, -1.86040997505188e-05, -1.708976924419403e-05, -1.5575438737869263e-05, -1.4061108231544495e-05, -1.2546777725219727e-05, -1.1032447218894958e-05, -9.51811671257019e-06, -8.003786206245422e-06, -6.489455699920654e-06, -4.975125193595886e-06, -3.460794687271118e-06, -1.94646418094635e-06, -4.3213367462158203e-07, 1.082196831703186e-06, 2.596527338027954e-06, 4.110857844352722e-06, 5.62518835067749e-06, 7.139518857002258e-06, 8.653849363327026e-06, 1.0168179869651794e-05, 1.1682510375976562e-05, 1.319684088230133e-05, 1.4711171388626099e-05, 1.6225501894950867e-05, 1.7739832401275635e-05, 1.9254162907600403e-05, 2.076849341392517e-05, 2.228282392024994e-05, 2.3797154426574707e-05, 2.5311484932899475e-05, 2.6825815439224243e-05, 2.834014594554901e-05, 2.985447645187378e-05, 3.136880695819855e-05, 3.2883137464523315e-05, 3.4397467970848083e-05, 3.591179847717285e-05, 3.742612898349762e-05, 3.894045948982239e-05, 4.0454789996147156e-05, 4.1969120502471924e-05, 4.348345100879669e-05, 4.499778151512146e-05, 4.651211202144623e-05, 4.8026442527770996e-05, 4.9540773034095764e-05, 5.105510354042053e-05, 5.25694340467453e-05, 5.408376455307007e-05, 5.5598095059394836e-05, 5.7112425565719604e-05, 5.862675607204437e-05, 6.014108657836914e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 5.0, 13.0, 18.0, 17.0, 20.0, 36.0, 31.0, 31.0, 44.0, 64.0, 72.0, 56.0, 54.0, 75.0, 65.0, 54.0, 75.0, 52.0, 49.0, 36.0, 26.0, 29.0, 27.0, 11.0, 11.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009632110595703125, -0.0009235888719558716, -0.0008839666843414307, -0.0008443444967269897, -0.0008047223091125488, -0.0007651001214981079, -0.000725477933883667, -0.0006858557462692261, -0.0006462335586547852, -0.0006066113710403442, -0.0005669891834259033, -0.0005273669958114624, -0.0004877448081970215, -0.00044812262058258057, -0.00040850043296813965, -0.00036887824535369873, -0.0003292560577392578, -0.0002896338701248169, -0.000250011682510376, -0.00021038949489593506, -0.00017076730728149414, -0.00013114511966705322, -9.15229320526123e-05, -5.190074443817139e-05, -1.2278556823730469e-05, 2.734363079071045e-05, 6.696581840515137e-05, 0.00010658800601959229, 0.0001462101936340332, 0.00018583238124847412, 0.00022545456886291504, 0.00026507675647735596, 0.0003046989440917969, 0.0003443211317062378, 0.0003839433193206787, 0.00042356550693511963, 0.00046318769454956055, 0.0005028098821640015, 0.0005424320697784424, 0.0005820542573928833, 0.0006216764450073242, 0.0006612986326217651, 0.0007009208202362061, 0.000740543007850647, 0.0007801651954650879, 0.0008197873830795288, 0.0008594095706939697, 0.0008990317583084106, 0.0009386539459228516, 0.0009782761335372925, 0.0010178983211517334, 0.0010575205087661743, 0.0010971426963806152, 0.0011367648839950562, 0.001176387071609497, 0.001216009259223938, 0.001255631446838379, 0.0012952536344528198, 0.0013348758220672607, 0.0013744980096817017, 0.0014141201972961426, 0.0014537423849105835, 0.0014933645725250244, 0.0015329867601394653, 0.0015726089477539062]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1948.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1044605.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 17.0, 0.0, 20.0, 0.0, 0.0, 34.0, 0.0, 48.0, 0.0, 0.0, 90.0, 0.0, 111.0, 0.0, 0.0, 128.0, 0.0, 135.0, 0.0, 117.0, 0.0, 0.0, 101.0, 0.0, 67.0, 0.0, 0.0, 71.0, 0.0, 36.0, 0.0, 0.0, 23.0, 0.0, 8.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.102506399154663e-07, -7.860362529754639e-07, -7.618218660354614e-07, -7.37607479095459e-07, -7.133930921554565e-07, -6.891787052154541e-07, -6.649643182754517e-07, -6.407499313354492e-07, -6.165355443954468e-07, -5.923211574554443e-07, -5.681067705154419e-07, -5.438923835754395e-07, -5.19677996635437e-07, -4.954636096954346e-07, -4.7124922275543213e-07, -4.470348358154297e-07, -4.2282044887542725e-07, -3.986060619354248e-07, -3.7439167499542236e-07, -3.501772880554199e-07, -3.259629011154175e-07, -3.0174851417541504e-07, -2.775341272354126e-07, -2.5331974029541016e-07, -2.2910535335540771e-07, -2.0489096641540527e-07, -1.8067657947540283e-07, -1.564621925354004e-07, -1.3224780559539795e-07, -1.0803341865539551e-07, -8.381903171539307e-08, -5.960464477539063e-08, -3.5390257835388184e-08, -1.1175870895385742e-08, 1.30385160446167e-08, 3.725290298461914e-08, 6.146728992462158e-08, 8.568167686462402e-08, 1.0989606380462646e-07, 1.341104507446289e-07, 1.5832483768463135e-07, 1.825392246246338e-07, 2.0675361156463623e-07, 2.3096799850463867e-07, 2.551823854446411e-07, 2.7939677238464355e-07, 3.03611159324646e-07, 3.2782554626464844e-07, 3.520399332046509e-07, 3.762543201446533e-07, 4.0046870708465576e-07, 4.246830940246582e-07, 4.4889748096466064e-07, 4.731118679046631e-07, 4.973262548446655e-07, 5.21540641784668e-07, 5.457550287246704e-07, 5.699694156646729e-07, 5.941838026046753e-07, 6.183981895446777e-07, 6.426125764846802e-07, 6.668269634246826e-07, 6.910413503646851e-07, 7.152557373046875e-07]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 5.0, 19.0, 15.0, 26.0, 43.0, 59.0, 84.0, 124.0, 159.0, 151.0, 92.0, 81.0, 41.0, 22.0, 20.0, 10.0, 5.0, 7.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008186378399841487, -0.0007920170901343226, -0.0007653962820768356, -0.0007387755322270095, -0.0007121547823771834, -0.0006855339743196964, -0.0006589132244698703, -0.0006322924746200442, -0.0006056717247702181, -0.000579050974920392, -0.000552430166862905, -0.0005258094170130789, -0.0004991886671632528, -0.0004725678882095963, -0.0004459471092559397, -0.0004193263594061136, -0.00039270558045245707, -0.0003660848014988005, -0.0003394640516489744, -0.00031284327269531786, -0.00028622252284549177, -0.0002596017438918352, -0.0002329809794900939, -0.00020636021508835256, -0.00017973945068661124, -0.0001531186862848699, -0.00012649792188312858, -9.987715020542964e-05, -7.325638580368832e-05, -4.663561412598938e-05, -2.001484972424805e-05, 6.605914677493274e-06, 3.32266790792346e-05, 5.9847443480975926e-05, 8.646820788271725e-05, 0.00011308897956041619, 0.0001397097366861999, 0.00016633051563985646, 0.00019295128004159778, 0.0002195720444433391, 0.0002461927942931652, 0.00027281357324682176, 0.00029943432309664786, 0.0003260551020503044, 0.0003526758519001305, 0.00037929663085378706, 0.0004059174098074436, 0.0004325381596572697, 0.00045915893861092627, 0.0004857797175645828, 0.0005124004674144089, 0.000539021217264235, 0.000565642025321722, 0.0005922627751715481, 0.0006188835250213742, 0.0006455043330788612, 0.0006721250829286873, 0.0006987458327785134, 0.0007253666408360004, 0.0007519873906858265, 0.0007786081405356526, 0.0008052289485931396, 0.0008318496984429657, 0.0008584704482927918, 0.0008850911981426179]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 10.0, 17.0, 20.0, 24.0, 42.0, 41.0, 21.0, 36.0, 59.0, 46.0, 52.0, 57.0, 69.0, 54.0, 62.0, 50.0, 53.0, 44.0, 40.0, 38.0, 26.0, 30.0, 21.0, 13.0, 17.0, 13.0, 13.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003279922530055046, -0.00031572103034704924, -0.00030344980768859386, -0.0002911785850301385, -0.0002789073623716831, -0.00026663613971322775, -0.0002543648879509419, -0.00024209366529248655, -0.00022982244263403118, -0.0002175512199755758, -0.00020527999731712043, -0.00019300876010674983, -0.00018073753744829446, -0.0001684663147898391, -0.0001561950775794685, -0.00014392385492101312, -0.00013165263226255774, -0.00011938140960410237, -0.00010711017966968939, -9.48389497352764e-05, -8.256772707682103e-05, -7.029650441836566e-05, -5.802527448395267e-05, -4.5754044549539685e-05, -3.3482821891084313e-05, -2.1211595594650134e-05, -8.940369298215955e-06, 3.3308569982182235e-06, 1.5602083294652402e-05, 2.7873305953107774e-05, 4.014453588752076e-05, 5.2415765821933746e-05, 6.468695937655866e-05, 7.695818203501403e-05, 8.922941196942702e-05, 0.00010150064190384, 0.00011377186456229538, 0.00012604308722075075, 0.00013831432443112135, 0.00015058554708957672, 0.0001628567697480321, 0.00017512799240648746, 0.00018739921506494284, 0.00019967045227531344, 0.0002119416749337688, 0.00022421289759222418, 0.00023648413480259478, 0.00024875535746105015, 0.0002610265801195055, 0.0002732978027779609, 0.00028556902543641627, 0.00029784024809487164, 0.00031011149985715747, 0.00032238272251561284, 0.0003346539451740682, 0.0003469251678325236, 0.00035919639049097896, 0.00037146761314943433, 0.0003837388358078897, 0.00039601005846634507, 0.00040828128112480044, 0.0004205525037832558, 0.00043282375554554164, 0.000445094978203997, 0.0004573662008624524]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 7.0, 7.0, 7.0, 15.0, 21.0, 25.0, 41.0, 67.0, 101.0, 137.0, 229.0, 304.0, 514.0, 841.0, 1260.0, 2211.0, 3789.0, 7109.0, 13653.0, 31421.0, 88447.0, 405079.0, 354373.0, 80651.0, 29308.0, 12964.0, 6740.0, 3668.0, 2081.0, 1265.0, 760.0, 533.0, 315.0, 190.0, 139.0, 91.0, 49.0, 48.0, 28.0, 24.0, 17.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00074005126953125, -0.0007188841700553894, -0.0006977170705795288, -0.0006765499711036682, -0.0006553828716278076, -0.000634215772151947, -0.0006130486726760864, -0.0005918815732002258, -0.0005707144737243652, -0.0005495473742485046, -0.000528380274772644, -0.0005072131752967834, -0.00048604607582092285, -0.00046487897634506226, -0.00044371187686920166, -0.00042254477739334106, -0.00040137767791748047, -0.0003802105784416199, -0.0003590434789657593, -0.0003378763794898987, -0.0003167092800140381, -0.0002955421805381775, -0.0002743750810623169, -0.0002532079815864563, -0.0002320408821105957, -0.0002108737826347351, -0.0001897066831588745, -0.00016853958368301392, -0.00014737248420715332, -0.00012620538473129272, -0.00010503828525543213, -8.387118577957153e-05, -6.270408630371094e-05, -4.153698682785034e-05, -2.0369887351989746e-05, 7.972121238708496e-07, 2.1964311599731445e-05, 4.313141107559204e-05, 6.429851055145264e-05, 8.546561002731323e-05, 0.00010663270950317383, 0.00012779980897903442, 0.00014896690845489502, 0.00017013400793075562, 0.0001913011074066162, 0.0002124682068824768, 0.0002336353063583374, 0.000254802405834198, 0.0002759695053100586, 0.0002971366047859192, 0.0003183037042617798, 0.0003394708037376404, 0.000360637903213501, 0.00038180500268936157, 0.00040297210216522217, 0.00042413920164108276, 0.00044530630111694336, 0.00046647340059280396, 0.00048764050006866455, 0.0005088075995445251, 0.0005299746990203857, 0.0005511417984962463, 0.0005723088979721069, 0.0005934759974479675, 0.0006146430969238281]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 10.0, 12.0, 20.0, 21.0, 35.0, 27.0, 38.0, 34.0, 48.0, 57.0, 58.0, 70.0, 77.0, 63.0, 72.0, 57.0, 56.0, 45.0, 38.0, 25.0, 28.0, 23.0, 22.0, 6.0, 14.0, 4.0, 5.0, 10.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001373291015625, -0.0001328159123659134, -0.00012830272316932678, -0.00012378953397274017, -0.00011927634477615356, -0.00011476315557956696, -0.00011024996638298035, -0.00010573677718639374, -0.00010122358798980713, -9.671039879322052e-05, -9.219720959663391e-05, -8.76840204000473e-05, -8.31708312034607e-05, -7.865764200687408e-05, -7.414445281028748e-05, -6.963126361370087e-05, -6.511807441711426e-05, -6.060488522052765e-05, -5.609169602394104e-05, -5.157850682735443e-05, -4.706531763076782e-05, -4.255212843418121e-05, -3.8038939237594604e-05, -3.3525750041007996e-05, -2.9012560844421387e-05, -2.4499371647834778e-05, -1.998618245124817e-05, -1.547299325466156e-05, -1.0959804058074951e-05, -6.446614861488342e-06, -1.9334256649017334e-06, 2.5797635316848755e-06, 7.092952728271484e-06, 1.1606141924858093e-05, 1.6119331121444702e-05, 2.063252031803131e-05, 2.514570951461792e-05, 2.965889871120453e-05, 3.417208790779114e-05, 3.8685277104377747e-05, 4.3198466300964355e-05, 4.7711655497550964e-05, 5.222484469413757e-05, 5.673803389072418e-05, 6.125122308731079e-05, 6.57644122838974e-05, 7.027760148048401e-05, 7.479079067707062e-05, 7.930397987365723e-05, 8.381716907024384e-05, 8.833035826683044e-05, 9.284354746341705e-05, 9.735673666000366e-05, 0.00010186992585659027, 0.00010638311505317688, 0.00011089630424976349, 0.0001154094934463501, 0.0001199226826429367, 0.00012443587183952332, 0.00012894906103610992, 0.00013346225023269653, 0.00013797543942928314, 0.00014248862862586975, 0.00014700181782245636, 0.00015151500701904297]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 10.0, 14.0, 15.0, 14.0, 24.0, 39.0, 56.0, 77.0, 127.0, 252.0, 519.0, 1182.0, 2942.0, 8024.0, 25004.0, 93618.0, 450946.0, 356662.0, 76362.0, 21275.0, 6819.0, 2515.0, 1043.0, 462.0, 224.0, 115.0, 73.0, 39.0, 35.0, 19.0, 12.0, 6.0, 6.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0006322860717773438, -0.0006156153976917267, -0.0005989447236061096, -0.0005822740495204926, -0.0005656033754348755, -0.0005489327013492584, -0.0005322620272636414, -0.0005155913531780243, -0.0004989206790924072, -0.00048225000500679016, -0.0004655793309211731, -0.00044890865683555603, -0.00043223798274993896, -0.0004155673086643219, -0.00039889663457870483, -0.00038222596049308777, -0.0003655552864074707, -0.00034888461232185364, -0.00033221393823623657, -0.0003155432641506195, -0.00029887259006500244, -0.0002822019159793854, -0.0002655312418937683, -0.00024886056780815125, -0.00023218989372253418, -0.00021551921963691711, -0.00019884854555130005, -0.00018217787146568298, -0.00016550719738006592, -0.00014883652329444885, -0.0001321658492088318, -0.00011549517512321472, -9.882450103759766e-05, -8.215382695198059e-05, -6.548315286636353e-05, -4.881247878074646e-05, -3.2141804695129395e-05, -1.547113060951233e-05, 1.1995434761047363e-06, 1.7870217561721802e-05, 3.454089164733887e-05, 5.121156573295593e-05, 6.7882239818573e-05, 8.455291390419006e-05, 0.00010122358798980713, 0.0001178942620754242, 0.00013456493616104126, 0.00015123561024665833, 0.0001679062843322754, 0.00018457695841789246, 0.00020124763250350952, 0.0002179183065891266, 0.00023458898067474365, 0.0002512596547603607, 0.0002679303288459778, 0.00028460100293159485, 0.0003012716770172119, 0.000317942351102829, 0.00033461302518844604, 0.0003512836992740631, 0.0003679543733596802, 0.00038462504744529724, 0.0004012957215309143, 0.00041796639561653137, 0.00043463706970214844]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 12.0, 3.0, 11.0, 14.0, 23.0, 34.0, 32.0, 37.0, 45.0, 36.0, 38.0, 44.0, 55.0, 66.0, 57.0, 70.0, 61.0, 49.0, 46.0, 40.0, 43.0, 41.0, 15.0, 27.0, 26.0, 13.0, 13.0, 15.0, 6.0, 5.0, 8.0, 4.0, 1.0, 2.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017499923706054688, -0.00016838312149047852, -0.00016176700592041016, -0.0001551508903503418, -0.00014853477478027344, -0.00014191865921020508, -0.00013530254364013672, -0.00012868642807006836, -0.0001220703125, -0.00011545419692993164, -0.00010883808135986328, -0.00010222196578979492, -9.560585021972656e-05, -8.89897346496582e-05, -8.237361907958984e-05, -7.575750350952148e-05, -6.914138793945312e-05, -6.252527236938477e-05, -5.5909156799316406e-05, -4.929304122924805e-05, -4.267692565917969e-05, -3.606081008911133e-05, -2.944469451904297e-05, -2.282857894897461e-05, -1.621246337890625e-05, -9.59634780883789e-06, -2.9802322387695312e-06, 3.635883331298828e-06, 1.0251998901367188e-05, 1.6868114471435547e-05, 2.3484230041503906e-05, 3.0100345611572266e-05, 3.6716461181640625e-05, 4.3332576751708984e-05, 4.9948692321777344e-05, 5.65648078918457e-05, 6.318092346191406e-05, 6.979703903198242e-05, 7.641315460205078e-05, 8.302927017211914e-05, 8.96453857421875e-05, 9.626150131225586e-05, 0.00010287761688232422, 0.00010949373245239258, 0.00011610984802246094, 0.0001227259635925293, 0.00012934207916259766, 0.00013595819473266602, 0.00014257431030273438, 0.00014919042587280273, 0.0001558065414428711, 0.00016242265701293945, 0.0001690387725830078, 0.00017565488815307617, 0.00018227100372314453, 0.0001888871192932129, 0.00019550323486328125, 0.0002021193504333496, 0.00020873546600341797, 0.00021535158157348633, 0.0002219676971435547, 0.00022858381271362305, 0.0002351999282836914, 0.00024181604385375977, 0.0002484321594238281]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 11.0, 7.0, 12.0, 19.0, 24.0, 48.0, 52.0, 71.0, 124.0, 220.0, 442.0, 987.0, 2689.0, 15194.0, 1003931.0, 19468.0, 3052.0, 1088.0, 472.0, 227.0, 150.0, 68.0, 64.0, 38.0, 25.0, 19.0, 13.0, 11.0, 7.0, 6.0, 7.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.00023587793111801147, -0.00022761523723602295, -0.00021935254335403442, -0.0002110898494720459, -0.00020282715559005737, -0.00019456446170806885, -0.00018630176782608032, -0.0001780390739440918, -0.00016977638006210327, -0.00016151368618011475, -0.00015325099229812622, -0.0001449882984161377, -0.00013672560453414917, -0.00012846291065216064, -0.00012020021677017212, -0.0001119375228881836, -0.00010367482900619507, -9.541213512420654e-05, -8.714944124221802e-05, -7.888674736022949e-05, -7.062405347824097e-05, -6.236135959625244e-05, -5.4098665714263916e-05, -4.583597183227539e-05, -3.7573277950286865e-05, -2.931058406829834e-05, -2.1047890186309814e-05, -1.2785196304321289e-05, -4.522502422332764e-06, 3.7401914596557617e-06, 1.2002885341644287e-05, 2.0265579223632812e-05, 2.8528273105621338e-05, 3.679096698760986e-05, 4.505366086959839e-05, 5.3316354751586914e-05, 6.157904863357544e-05, 6.984174251556396e-05, 7.810443639755249e-05, 8.636713027954102e-05, 9.462982416152954e-05, 0.00010289251804351807, 0.00011115521192550659, 0.00011941790580749512, 0.00012768059968948364, 0.00013594329357147217, 0.0001442059874534607, 0.00015246868133544922, 0.00016073137521743774, 0.00016899406909942627, 0.0001772567629814148, 0.00018551945686340332, 0.00019378215074539185, 0.00020204484462738037, 0.0002103075385093689, 0.00021857023239135742, 0.00022683292627334595, 0.00023509562015533447, 0.000243358314037323, 0.0002516210079193115, 0.00025988370180130005, 0.0002681463956832886, 0.0002764090895652771, 0.0002846717834472656]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 207.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 539.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 206.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 7.0, 6.0, 11.0, 13.0, 13.0, 34.0, 47.0, 83.0, 143.0, 282.0, 519.0, 1072.0, 2353.0, 5692.0, 19962.0, 961802.0, 42699.0, 7883.0, 3142.0, 1420.0, 626.0, 330.0, 169.0, 89.0, 57.0, 45.0, 20.0, 5.0, 7.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.739398956298828e-05, -9.441189467906952e-05, -9.142979979515076e-05, -8.8447704911232e-05, -8.546561002731323e-05, -8.248351514339447e-05, -7.950142025947571e-05, -7.651932537555695e-05, -7.353723049163818e-05, -7.055513560771942e-05, -6.757304072380066e-05, -6.45909458398819e-05, -6.160885095596313e-05, -5.862675607204437e-05, -5.564466118812561e-05, -5.266256630420685e-05, -4.9680471420288086e-05, -4.6698376536369324e-05, -4.371628165245056e-05, -4.07341867685318e-05, -3.775209188461304e-05, -3.4769997000694275e-05, -3.178790211677551e-05, -2.880580723285675e-05, -2.5823712348937988e-05, -2.2841617465019226e-05, -1.9859522581100464e-05, -1.68774276971817e-05, -1.389533281326294e-05, -1.0913237929344177e-05, -7.931143045425415e-06, -4.949048161506653e-06, -1.9669532775878906e-06, 1.0151416063308716e-06, 3.997236490249634e-06, 6.979331374168396e-06, 9.961426258087158e-06, 1.294352114200592e-05, 1.5925616025924683e-05, 1.8907710909843445e-05, 2.1889805793762207e-05, 2.487190067768097e-05, 2.785399556159973e-05, 3.0836090445518494e-05, 3.3818185329437256e-05, 3.680028021335602e-05, 3.978237509727478e-05, 4.276446998119354e-05, 4.5746564865112305e-05, 4.872865974903107e-05, 5.171075463294983e-05, 5.469284951686859e-05, 5.7674944400787354e-05, 6.0657039284706116e-05, 6.363913416862488e-05, 6.662122905254364e-05, 6.96033239364624e-05, 7.258541882038116e-05, 7.556751370429993e-05, 7.854960858821869e-05, 8.153170347213745e-05, 8.451379835605621e-05, 8.749589323997498e-05, 9.047798812389374e-05, 9.34600830078125e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 10.0, 11.0, 22.0, 28.0, 144.0, 368.0, 260.0, 71.0, 23.0, 8.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4749507904052734e-05, -3.365706652402878e-05, -3.256462514400482e-05, -3.1472183763980865e-05, -3.037974238395691e-05, -2.9287301003932953e-05, -2.8194859623908997e-05, -2.710241824388504e-05, -2.6009976863861084e-05, -2.4917535483837128e-05, -2.382509410381317e-05, -2.2732652723789215e-05, -2.164021134376526e-05, -2.0547769963741302e-05, -1.9455328583717346e-05, -1.836288720369339e-05, -1.7270445823669434e-05, -1.6178004443645477e-05, -1.5085563063621521e-05, -1.3993121683597565e-05, -1.2900680303573608e-05, -1.1808238923549652e-05, -1.0715797543525696e-05, -9.62335616350174e-06, -8.530914783477783e-06, -7.438473403453827e-06, -6.346032023429871e-06, -5.253590643405914e-06, -4.161149263381958e-06, -3.0687078833580017e-06, -1.9762665033340454e-06, -8.838251233100891e-07, 2.086162567138672e-07, 1.3010576367378235e-06, 2.3934990167617798e-06, 3.485940396785736e-06, 4.578381776809692e-06, 5.670823156833649e-06, 6.763264536857605e-06, 7.855705916881561e-06, 8.948147296905518e-06, 1.0040588676929474e-05, 1.113303005695343e-05, 1.2225471436977386e-05, 1.3317912817001343e-05, 1.4410354197025299e-05, 1.5502795577049255e-05, 1.659523695707321e-05, 1.7687678337097168e-05, 1.8780119717121124e-05, 1.987256109714508e-05, 2.0965002477169037e-05, 2.2057443857192993e-05, 2.314988523721695e-05, 2.4242326617240906e-05, 2.5334767997264862e-05, 2.642720937728882e-05, 2.7519650757312775e-05, 2.861209213733673e-05, 2.9704533517360687e-05, 3.0796974897384644e-05, 3.18894162774086e-05, 3.2981857657432556e-05, 3.407429903745651e-05, 3.516674041748047e-05]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 8.0, 16.0, 21.0, 30.0, 34.0, 54.0, 77.0, 108.0, 127.0, 146.0, 110.0, 81.0, 51.0, 33.0, 25.0, 22.0, 13.0, 16.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000589753151871264, -0.000569464173167944, -0.0005491751944646239, -0.0005288862157613039, -0.0005085972370579839, -0.0004883082583546638, -0.0004680193087551743, -0.00044773033005185425, -0.0004274413513485342, -0.0004071523726452142, -0.0003868633939418942, -0.00036657441523857415, -0.0003462854656390846, -0.00032599648693576455, -0.0003057075082324445, -0.0002854185295291245, -0.00026512955082580447, -0.00024484057212248445, -0.00022455159341916442, -0.00020426262926775962, -0.0001839736505644396, -0.00016368467186111957, -0.00014339570770971477, -0.00012310672900639474, -0.00010281775030307472, -8.252877159975469e-05, -6.223980017239228e-05, -4.195082510705106e-05, -2.166185004170984e-05, -1.372871338389814e-06, 1.89161000889726e-05, 3.920507151633501e-05, 5.949410842731595e-05, 7.978308713063598e-05, 0.00010007205855799839, 0.0001203610299853608, 0.00014065000868868083, 0.00016093898739200085, 0.00018122795154340565, 0.00020151693024672568, 0.0002218059089500457, 0.00024209488765336573, 0.00026238386635668576, 0.0002826728450600058, 0.00030296179465949535, 0.0003232507733628154, 0.0003435397520661354, 0.00036382873076945543, 0.00038411770947277546, 0.0004044066881760955, 0.0004246956668794155, 0.00044498464558273554, 0.00046527362428605556, 0.0004855626029893756, 0.0005058515816926956, 0.0005261405603960156, 0.0005464295390993357, 0.0005667185178026557, 0.0005870074965059757, 0.0006072964752092957, 0.0006275854539126158, 0.0006478744326159358, 0.0006681634113192558, 0.0006884523900225759, 0.000708741310518235]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 7.0, 16.0, 11.0, 5.0, 18.0, 17.0, 16.0, 18.0, 19.0, 35.0, 35.0, 37.0, 38.0, 47.0, 59.0, 43.0, 46.0, 54.0, 58.0, 53.0, 49.0, 30.0, 47.0, 47.0, 38.0, 25.0, 18.0, 19.0, 14.0, 19.0, 11.0, 18.0, 9.0, 11.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004166070430073887, -0.0004056436591781676, -0.000394680246245116, -0.00038371686241589487, -0.00037275347858667374, -0.00036179006565362215, -0.000350826681824401, -0.0003398632979951799, -0.0003288998850621283, -0.0003179365012329072, -0.0003069730882998556, -0.00029600970447063446, -0.00028504632064141333, -0.0002740829368121922, -0.0002631195238791406, -0.0002521561400499195, -0.00024119275622069836, -0.000230229357839562, -0.00021926597401034087, -0.0002083025756292045, -0.00019733919179998338, -0.00018637579341884702, -0.00017541239503771067, -0.00016444901120848954, -0.00015348561282735318, -0.00014252221444621682, -0.0001315588306169957, -0.00012059543223585933, -0.00010963204113068059, -9.866865002550185e-05, -8.770525164436549e-05, -7.674186053918675e-05, -6.577849853783846e-05, -5.4815107432659715e-05, -4.3851712689502165e-05, -3.2888317946344614e-05, -2.192492684116587e-05, -1.0961535735987127e-05, 1.862645149230957e-09, 1.0965253750327975e-05, 2.1928644855506718e-05, 3.289203596068546e-05, 4.385543070384301e-05, 5.481882544700056e-05, 6.57822165521793e-05, 7.674560765735805e-05, 8.770900603849441e-05, 9.867239714367315e-05, 0.0001096357882488519, 0.00012059917935403064, 0.00013156257045920938, 0.00014252596884034574, 0.00015348935266956687, 0.00016445275105070323, 0.00017541614943183959, 0.00018637953326106071, 0.00019734293164219707, 0.00020830633002333343, 0.00021926971385255456, 0.00023023311223369092, 0.00024119651061482728, 0.0002521598944440484, 0.0002631233073771, 0.0002740866912063211, 0.00028505007503554225]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 5.0, 6.0, 10.0, 9.0, 17.0, 12.0, 37.0, 48.0, 57.0, 81.0, 187.0, 319.0, 520.0, 858.0, 1654.0, 3421.0, 17996.0, 4112754.0, 47884.0, 4047.0, 1896.0, 1017.0, 666.0, 326.0, 185.0, 98.0, 53.0, 42.0, 26.0, 19.0, 9.0, 8.0, 6.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00093841552734375, -0.0009066909551620483, -0.0008749663829803467, -0.000843241810798645, -0.0008115172386169434, -0.0007797926664352417, -0.00074806809425354, -0.0007163435220718384, -0.0006846189498901367, -0.0006528943777084351, -0.0006211698055267334, -0.0005894452333450317, -0.0005577206611633301, -0.0005259960889816284, -0.0004942715167999268, -0.0004625469446182251, -0.00043082237243652344, -0.0003990978002548218, -0.0003673732280731201, -0.00033564865589141846, -0.0003039240837097168, -0.00027219951152801514, -0.00024047493934631348, -0.00020875036716461182, -0.00017702579498291016, -0.0001453012228012085, -0.00011357665061950684, -8.185207843780518e-05, -5.0127506256103516e-05, -1.8402934074401855e-05, 1.3321638107299805e-05, 4.5046210289001465e-05, 7.677078247070312e-05, 0.00010849535465240479, 0.00014021992683410645, 0.0001719444990158081, 0.00020366907119750977, 0.00023539364337921143, 0.0002671182155609131, 0.00029884278774261475, 0.0003305673599243164, 0.00036229193210601807, 0.0003940165042877197, 0.0004257410764694214, 0.00045746564865112305, 0.0004891902208328247, 0.0005209147930145264, 0.000552639365196228, 0.0005843639373779297, 0.0006160885095596313, 0.000647813081741333, 0.0006795376539230347, 0.0007112622261047363, 0.000742986798286438, 0.0007747113704681396, 0.0008064359426498413, 0.000838160514831543, 0.0008698850870132446, 0.0009016096591949463, 0.000933334231376648, 0.0009650588035583496, 0.0009967833757400513, 0.001028507947921753, 0.0010602325201034546, 0.0010919570922851562]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 6.0, 6.0, 10.0, 8.0, 7.0, 15.0, 12.0, 9.0, 21.0, 25.0, 27.0, 34.0, 34.0, 31.0, 55.0, 45.0, 43.0, 46.0, 65.0, 51.0, 44.0, 42.0, 41.0, 39.0, 46.0, 32.0, 40.0, 24.0, 22.0, 21.0, 14.0, 17.0, 20.0, 11.0, 11.0, 4.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00021791458129882812, -0.00021186843514442444, -0.00020582228899002075, -0.00019977614283561707, -0.00019372999668121338, -0.0001876838505268097, -0.000181637704372406, -0.00017559155821800232, -0.00016954541206359863, -0.00016349926590919495, -0.00015745311975479126, -0.00015140697360038757, -0.0001453608274459839, -0.0001393146812915802, -0.00013326853513717651, -0.00012722238898277283, -0.00012117624282836914, -0.00011513009667396545, -0.00010908395051956177, -0.00010303780436515808, -9.69916582107544e-05, -9.094551205635071e-05, -8.489936590194702e-05, -7.885321974754333e-05, -7.280707359313965e-05, -6.676092743873596e-05, -6.0714781284332275e-05, -5.466863512992859e-05, -4.86224889755249e-05, -4.2576342821121216e-05, -3.653019666671753e-05, -3.0484050512313843e-05, -2.4437904357910156e-05, -1.839175820350647e-05, -1.2345612049102783e-05, -6.299465894699097e-06, -2.5331974029541016e-07, 5.792826414108276e-06, 1.1838972568511963e-05, 1.788511872291565e-05, 2.3931264877319336e-05, 2.9977411031723022e-05, 3.602355718612671e-05, 4.2069703340530396e-05, 4.811584949493408e-05, 5.416199564933777e-05, 6.0208141803741455e-05, 6.625428795814514e-05, 7.230043411254883e-05, 7.834658026695251e-05, 8.43927264213562e-05, 9.043887257575989e-05, 9.648501873016357e-05, 0.00010253116488456726, 0.00010857731103897095, 0.00011462345719337463, 0.00012066960334777832, 0.000126715749502182, 0.0001327618956565857, 0.00013880804181098938, 0.00014485418796539307, 0.00015090033411979675, 0.00015694648027420044, 0.00016299262642860413, 0.0001690387725830078]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 7.0, 8.0, 12.0, 19.0, 28.0, 51.0, 79.0, 159.0, 467.0, 1555.0, 5845.0, 87038.0, 4080443.0, 14304.0, 2711.0, 907.0, 327.0, 135.0, 68.0, 50.0, 23.0, 16.0, 11.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010080337524414062, -0.0009785965085029602, -0.0009491592645645142, -0.0009197220206260681, -0.0008902847766876221, -0.000860847532749176, -0.00083141028881073, -0.0008019730448722839, -0.0007725358009338379, -0.0007430985569953918, -0.0007136613130569458, -0.0006842240691184998, -0.0006547868251800537, -0.0006253495812416077, -0.0005959123373031616, -0.0005664750933647156, -0.0005370378494262695, -0.0005076006054878235, -0.00047816336154937744, -0.0004487261176109314, -0.00041928887367248535, -0.0003898516297340393, -0.00036041438579559326, -0.0003309771418571472, -0.00030153989791870117, -0.0002721026539802551, -0.00024266541004180908, -0.00021322816610336304, -0.000183790922164917, -0.00015435367822647095, -0.0001249164342880249, -9.547919034957886e-05, -6.604194641113281e-05, -3.660470247268677e-05, -7.167458534240723e-06, 2.2269785404205322e-05, 5.170702934265137e-05, 8.114427328109741e-05, 0.00011058151721954346, 0.0001400187611579895, 0.00016945600509643555, 0.0001988932490348816, 0.00022833049297332764, 0.0002577677369117737, 0.0002872049808502197, 0.00031664222478866577, 0.0003460794687271118, 0.00037551671266555786, 0.0004049539566040039, 0.00043439120054244995, 0.000463828444480896, 0.000493265688419342, 0.0005227029323577881, 0.0005521401762962341, 0.0005815774202346802, 0.0006110146641731262, 0.0006404519081115723, 0.0006698891520500183, 0.0006993263959884644, 0.0007287636399269104, 0.0007582008838653564, 0.0007876381278038025, 0.0008170753717422485, 0.0008465126156806946, 0.0008759498596191406]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 7.0, 10.0, 9.0, 22.0, 30.0, 118.0, 451.0, 2244.0, 795.0, 219.0, 61.0, 39.0, 21.0, 8.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001957416534423828, -0.0001910543069243431, -0.0001863669604063034, -0.0001816796138882637, -0.000176992267370224, -0.0001723049208521843, -0.0001676175743341446, -0.0001629302278161049, -0.00015824288129806519, -0.00015355553478002548, -0.00014886818826198578, -0.00014418084174394608, -0.00013949349522590637, -0.00013480614870786667, -0.00013011880218982697, -0.00012543145567178726, -0.00012074410915374756, -0.00011605676263570786, -0.00011136941611766815, -0.00010668206959962845, -0.00010199472308158875, -9.730737656354904e-05, -9.262003004550934e-05, -8.793268352746964e-05, -8.324533700942993e-05, -7.855799049139023e-05, -7.387064397335052e-05, -6.918329745531082e-05, -6.449595093727112e-05, -5.9808604419231415e-05, -5.512125790119171e-05, -5.043391138315201e-05, -4.5746564865112305e-05, -4.10592183470726e-05, -3.63718718290329e-05, -3.1684525310993195e-05, -2.699717879295349e-05, -2.2309832274913788e-05, -1.7622485756874084e-05, -1.2935139238834381e-05, -8.247792720794678e-06, -3.5604462027549744e-06, 1.126900315284729e-06, 5.814246833324432e-06, 1.0501593351364136e-05, 1.5188939869403839e-05, 1.9876286387443542e-05, 2.4563632905483246e-05, 2.925097942352295e-05, 3.393832594156265e-05, 3.8625672459602356e-05, 4.331301897764206e-05, 4.800036549568176e-05, 5.2687712013721466e-05, 5.737505853176117e-05, 6.206240504980087e-05, 6.674975156784058e-05, 7.143709808588028e-05, 7.612444460391998e-05, 8.081179112195969e-05, 8.549913763999939e-05, 9.018648415803909e-05, 9.48738306760788e-05, 9.95611771941185e-05, 0.0001042485237121582]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 11.0, 3.0, 15.0, 17.0, 21.0, 25.0, 45.0, 78.0, 96.0, 144.0, 153.0, 127.0, 76.0, 54.0, 39.0, 32.0, 7.0, 19.0, 9.0, 13.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003225227410439402, -0.0003102122573181987, -0.0002979017735924572, -0.0002855913189705461, -0.0002732808352448046, -0.0002609703515190631, -0.0002486598677933216, -0.00023634939861949533, -0.00022403892944566905, -0.00021172844571992755, -0.00019941797654610127, -0.00018710749282035977, -0.0001747970236465335, -0.00016248653992079198, -0.00015017605619505048, -0.0001378655870212242, -0.0001255551032954827, -0.0001132446268456988, -0.00010093415039591491, -8.86236666701734e-05, -7.631319749634713e-05, -6.400271377060562e-05, -5.169223732082173e-05, -3.938176087103784e-05, -2.707128442125395e-05, -1.4760807061975356e-05, -2.450329702696763e-06, 9.860148566076532e-06, 2.2170625015860423e-05, 3.448110510362312e-05, 4.6791581553407013e-05, 5.9102058003190905e-05, 7.14125344529748e-05, 8.372301090275869e-05, 9.603348735254258e-05, 0.00010834397107828408, 0.00012065444025211036, 0.00013296492397785187, 0.00014527540770359337, 0.00015758587687741965, 0.00016989634605124593, 0.00018220682977698743, 0.0001945172989508137, 0.00020682778267655522, 0.0002191382518503815, 0.000231448735576123, 0.0002437592193018645, 0.000256069703027606, 0.00026838015764951706, 0.00028069064137525856, 0.00029300112510100007, 0.0003053115797229111, 0.0003176220634486526, 0.00032993254717439413, 0.00034224303090013564, 0.00035455351462587714, 0.00036686399835161865, 0.00037917448207736015, 0.00039148496580310166, 0.0004037954204250127, 0.0004161059041507542, 0.0004284163878764957, 0.0004407268716022372, 0.0004530373262241483, 0.0004653478099498898]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 11.0, 18.0, 11.0, 11.0, 22.0, 24.0, 33.0, 28.0, 27.0, 43.0, 45.0, 50.0, 53.0, 44.0, 41.0, 46.0, 49.0, 48.0, 49.0, 39.0, 56.0, 35.0, 35.0, 42.0, 17.0, 21.0, 13.0, 11.0, 13.0, 13.0, 6.0, 12.0, 5.0, 9.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00022118148626759648, -0.00021492889209184796, -0.00020867629791609943, -0.0002024237037403509, -0.00019617110956460238, -0.00018991851538885385, -0.00018366592121310532, -0.0001774133270373568, -0.00017116073286160827, -0.00016490813868585974, -0.0001586555445101112, -0.00015240295033436269, -0.00014615035615861416, -0.00013989776198286563, -0.0001336451678071171, -0.00012739257363136858, -0.00012113998673157766, -0.00011488739255582914, -0.00010863479838008061, -0.00010238220420433208, -9.612961002858356e-05, -8.987702312879264e-05, -8.362442895304412e-05, -7.737183477729559e-05, -7.111924060154706e-05, -6.486664642579854e-05, -5.861405225005001e-05, -5.236145807430148e-05, -4.6108863898552954e-05, -3.9856273360783234e-05, -3.360367918503471e-05, -2.735108500928618e-05, -2.1098487195558846e-05, -1.4845893019810319e-05, -8.593299753556494e-06, -2.3407064873026684e-06, 3.911887688445859e-06, 1.0164480045204982e-05, 1.641707422095351e-05, 2.2669668396702036e-05, 2.8922262572450563e-05, 3.517485674819909e-05, 4.142745092394762e-05, 4.768004146171734e-05, 5.3932635637465864e-05, 6.018522981321439e-05, 6.643782398896292e-05, 7.269041816471145e-05, 7.894301234045997e-05, 8.51956065162085e-05, 9.144820069195703e-05, 9.770079486770555e-05, 0.00010395338904345408, 0.000110205975943245, 0.00011645857011899352, 0.00012271116429474205, 0.00012896375847049057, 0.0001352163526462391, 0.00014146894682198763, 0.00014772154099773616, 0.00015397413517348468, 0.0001602267293492332, 0.00016647932352498174, 0.00017273191770073026, 0.0001789845118764788]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 10.0, 12.0, 13.0, 11.0, 35.0, 57.0, 84.0, 107.0, 165.0, 300.0, 474.0, 920.0, 1768.0, 3546.0, 9036.0, 28090.0, 308158.0, 636326.0, 40474.0, 10737.0, 3941.0, 1898.0, 945.0, 594.0, 282.0, 184.0, 136.0, 69.0, 59.0, 34.0, 18.0, 21.0, 12.0, 8.0, 10.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.445148468017578e-05, -3.334321081638336e-05, -3.223493695259094e-05, -3.112666308879852e-05, -3.0018389225006104e-05, -2.8910115361213684e-05, -2.7801841497421265e-05, -2.6693567633628845e-05, -2.5585293769836426e-05, -2.4477019906044006e-05, -2.3368746042251587e-05, -2.2260472178459167e-05, -2.1152198314666748e-05, -2.004392445087433e-05, -1.893565058708191e-05, -1.782737672328949e-05, -1.671910285949707e-05, -1.561082899570465e-05, -1.4502555131912231e-05, -1.3394281268119812e-05, -1.2286007404327393e-05, -1.1177733540534973e-05, -1.0069459676742554e-05, -8.961185812950134e-06, -7.852911949157715e-06, -6.744638085365295e-06, -5.636364221572876e-06, -4.5280903577804565e-06, -3.419816493988037e-06, -2.3115426301956177e-06, -1.2032687664031982e-06, -9.499490261077881e-08, 1.0132789611816406e-06, 2.12155282497406e-06, 3.2298266887664795e-06, 4.338100552558899e-06, 5.446374416351318e-06, 6.554648280143738e-06, 7.662922143936157e-06, 8.771196007728577e-06, 9.879469871520996e-06, 1.0987743735313416e-05, 1.2096017599105835e-05, 1.3204291462898254e-05, 1.4312565326690674e-05, 1.5420839190483093e-05, 1.6529113054275513e-05, 1.7637386918067932e-05, 1.874566078186035e-05, 1.985393464565277e-05, 2.096220850944519e-05, 2.207048237323761e-05, 2.317875623703003e-05, 2.428703010082245e-05, 2.5395303964614868e-05, 2.6503577828407288e-05, 2.7611851692199707e-05, 2.8720125555992126e-05, 2.9828399419784546e-05, 3.0936673283576965e-05, 3.2044947147369385e-05, 3.3153221011161804e-05, 3.4261494874954224e-05, 3.536976873874664e-05, 3.647804260253906e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 18.0, 12.0, 24.0, 17.0, 36.0, 29.0, 46.0, 41.0, 59.0, 65.0, 58.0, 54.0, 53.0, 55.0, 47.0, 53.0, 52.0, 47.0, 41.0, 34.0, 26.0, 20.0, 17.0, 16.0, 8.0, 17.0, 5.0, 8.0, 5.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001697540283203125, -0.00016495771706104279, -0.00016016140580177307, -0.00015536509454250336, -0.00015056878328323364, -0.00014577247202396393, -0.00014097616076469421, -0.0001361798495054245, -0.00013138353824615479, -0.00012658722698688507, -0.00012179091572761536, -0.00011699460446834564, -0.00011219829320907593, -0.00010740198194980621, -0.0001026056706905365, -9.780935943126678e-05, -9.301304817199707e-05, -8.821673691272736e-05, -8.342042565345764e-05, -7.862411439418793e-05, -7.382780313491821e-05, -6.90314918756485e-05, -6.423518061637878e-05, -5.943886935710907e-05, -5.4642558097839355e-05, -4.984624683856964e-05, -4.504993557929993e-05, -4.025362432003021e-05, -3.54573130607605e-05, -3.0661001801490784e-05, -2.586469054222107e-05, -2.1068379282951355e-05, -1.627206802368164e-05, -1.1475756764411926e-05, -6.679445505142212e-06, -1.8831342458724976e-06, 2.913177013397217e-06, 7.709488272666931e-06, 1.2505799531936646e-05, 1.730211079120636e-05, 2.2098422050476074e-05, 2.689473330974579e-05, 3.16910445690155e-05, 3.648735582828522e-05, 4.128366708755493e-05, 4.6079978346824646e-05, 5.087628960609436e-05, 5.5672600865364075e-05, 6.046891212463379e-05, 6.52652233839035e-05, 7.006153464317322e-05, 7.485784590244293e-05, 7.965415716171265e-05, 8.445046842098236e-05, 8.924677968025208e-05, 9.404309093952179e-05, 9.88394021987915e-05, 0.00010363571345806122, 0.00010843202471733093, 0.00011322833597660065, 0.00011802464723587036, 0.00012282095849514008, 0.0001276172697544098, 0.0001324135810136795, 0.00013720989227294922]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 10.0, 18.0, 24.0, 26.0, 26.0, 43.0, 84.0, 62.0, 107.0, 150.0, 187.0, 373.0, 900.0, 3321.0, 18953.0, 290935.0, 697182.0, 28967.0, 4692.0, 1148.0, 415.0, 226.0, 153.0, 115.0, 91.0, 67.0, 62.0, 60.0, 37.0, 22.0, 19.0, 12.0, 9.0, 15.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.357929229736328e-06, -9.057112038135529e-06, -8.756294846534729e-06, -8.45547765493393e-06, -8.15466046333313e-06, -7.85384327173233e-06, -7.553026080131531e-06, -7.252208888530731e-06, -6.951391696929932e-06, -6.650574505329132e-06, -6.3497573137283325e-06, -6.048940122127533e-06, -5.748122930526733e-06, -5.447305738925934e-06, -5.146488547325134e-06, -4.845671355724335e-06, -4.544854164123535e-06, -4.244036972522736e-06, -3.943219780921936e-06, -3.6424025893211365e-06, -3.341585397720337e-06, -3.0407682061195374e-06, -2.739951014518738e-06, -2.4391338229179382e-06, -2.1383166313171387e-06, -1.8374994397163391e-06, -1.5366822481155396e-06, -1.23586505651474e-06, -9.350478649139404e-07, -6.342306733131409e-07, -3.334134817123413e-07, -3.259629011154175e-08, 2.682209014892578e-07, 5.690380930900574e-07, 8.698552846908569e-07, 1.1706724762916565e-06, 1.471489667892456e-06, 1.7723068594932556e-06, 2.073124051094055e-06, 2.3739412426948547e-06, 2.6747584342956543e-06, 2.975575625896454e-06, 3.2763928174972534e-06, 3.577210009098053e-06, 3.8780272006988525e-06, 4.178844392299652e-06, 4.479661583900452e-06, 4.780478775501251e-06, 5.081295967102051e-06, 5.38211315870285e-06, 5.68293035030365e-06, 5.9837475419044495e-06, 6.284564733505249e-06, 6.585381925106049e-06, 6.886199116706848e-06, 7.187016308307648e-06, 7.487833499908447e-06, 7.788650691509247e-06, 8.089467883110046e-06, 8.390285074710846e-06, 8.691102266311646e-06, 8.991919457912445e-06, 9.292736649513245e-06, 9.593553841114044e-06, 9.894371032714844e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 13.0, 15.0, 12.0, 13.0, 26.0, 33.0, 22.0, 39.0, 37.0, 42.0, 47.0, 30.0, 42.0, 35.0, 43.0, 57.0, 50.0, 56.0, 41.0, 31.0, 27.0, 33.0, 41.0, 31.0, 25.0, 25.0, 21.0, 20.0, 18.0, 11.0, 12.0, 11.0, 9.0, 6.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0002460479736328125, -0.00023815780878067017, -0.00023026764392852783, -0.0002223774790763855, -0.00021448731422424316, -0.00020659714937210083, -0.0001987069845199585, -0.00019081681966781616, -0.00018292665481567383, -0.0001750364899635315, -0.00016714632511138916, -0.00015925616025924683, -0.0001513659954071045, -0.00014347583055496216, -0.00013558566570281982, -0.0001276955008506775, -0.00011980533599853516, -0.00011191517114639282, -0.00010402500629425049, -9.613484144210815e-05, -8.824467658996582e-05, -8.035451173782349e-05, -7.246434688568115e-05, -6.457418203353882e-05, -5.6684017181396484e-05, -4.879385232925415e-05, -4.0903687477111816e-05, -3.301352262496948e-05, -2.512335777282715e-05, -1.7233192920684814e-05, -9.34302806854248e-06, -1.4528632164001465e-06, 6.4373016357421875e-06, 1.4327466487884521e-05, 2.2217631340026855e-05, 3.010779619216919e-05, 3.7997961044311523e-05, 4.588812589645386e-05, 5.377829074859619e-05, 6.166845560073853e-05, 6.955862045288086e-05, 7.74487853050232e-05, 8.533895015716553e-05, 9.322911500930786e-05, 0.0001011192798614502, 0.00010900944471359253, 0.00011689960956573486, 0.0001247897744178772, 0.00013267993927001953, 0.00014057010412216187, 0.0001484602689743042, 0.00015635043382644653, 0.00016424059867858887, 0.0001721307635307312, 0.00018002092838287354, 0.00018791109323501587, 0.0001958012580871582, 0.00020369142293930054, 0.00021158158779144287, 0.0002194717526435852, 0.00022736191749572754, 0.00023525208234786987, 0.0002431422472000122, 0.00025103241205215454, 0.0002589225769042969]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048551.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 8.0, 0.0, 11.0, 0.0, 20.0, 33.0, 0.0, 43.0, 77.0, 0.0, 101.0, 0.0, 136.0, 127.0, 0.0, 127.0, 109.0, 0.0, 82.0, 0.0, 59.0, 32.0, 0.0, 13.0, 6.0, 0.0, 8.0, 0.0, 5.0, 9.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.214444637298584e-06, -1.1771917343139648e-06, -1.1399388313293457e-06, -1.1026859283447266e-06, -1.0654330253601074e-06, -1.0281801223754883e-06, -9.909272193908691e-07, -9.5367431640625e-07, -9.164214134216309e-07, -8.791685104370117e-07, -8.419156074523926e-07, -8.046627044677734e-07, -7.674098014831543e-07, -7.301568984985352e-07, -6.92903995513916e-07, -6.556510925292969e-07, -6.183981895446777e-07, -5.811452865600586e-07, -5.438923835754395e-07, -5.066394805908203e-07, -4.6938657760620117e-07, -4.3213367462158203e-07, -3.948807716369629e-07, -3.5762786865234375e-07, -3.203749656677246e-07, -2.8312206268310547e-07, -2.4586915969848633e-07, -2.086162567138672e-07, -1.7136335372924805e-07, -1.341104507446289e-07, -9.685754776000977e-08, -5.960464477539063e-08, -2.2351741790771484e-08, 1.4901161193847656e-08, 5.21540641784668e-08, 8.940696716308594e-08, 1.2665987014770508e-07, 1.6391277313232422e-07, 2.0116567611694336e-07, 2.384185791015625e-07, 2.7567148208618164e-07, 3.129243850708008e-07, 3.501772880554199e-07, 3.8743019104003906e-07, 4.246830940246582e-07, 4.6193599700927734e-07, 4.991888999938965e-07, 5.364418029785156e-07, 5.736947059631348e-07, 6.109476089477539e-07, 6.48200511932373e-07, 6.854534149169922e-07, 7.227063179016113e-07, 7.599592208862305e-07, 7.972121238708496e-07, 8.344650268554688e-07, 8.717179298400879e-07, 9.08970832824707e-07, 9.462237358093262e-07, 9.834766387939453e-07, 1.0207295417785645e-06, 1.0579824447631836e-06, 1.0952353477478027e-06, 1.1324882507324219e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 6.0, 14.0, 18.0, 15.0, 35.0, 54.0, 77.0, 98.0, 146.0, 168.0, 121.0, 87.0, 41.0, 41.0, 13.0, 16.0, 14.0, 13.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022119141067378223, -0.00021303765242919326, -0.0002048838941846043, -0.00019673013594001532, -0.00018857637769542634, -0.00018042261945083737, -0.0001722688612062484, -0.00016411510296165943, -0.00015596134471707046, -0.0001478075864724815, -0.00013965382822789252, -0.00013150006998330355, -0.00012334631173871458, -0.0001151925534941256, -0.00010703879524953663, -9.888503700494766e-05, -9.073127876035869e-05, -8.257752051576972e-05, -7.442376227118075e-05, -6.627000402659178e-05, -5.811624578200281e-05, -4.9962487537413836e-05, -4.1808729292824864e-05, -3.365497104823589e-05, -2.5501212803646922e-05, -1.734745455905795e-05, -9.19369631446898e-06, -1.0399380698800087e-06, 7.1138201747089624e-06, 1.5267578419297934e-05, 2.3421336663886905e-05, 3.1575094908475876e-05, 3.972885315306485e-05, 4.788261139765382e-05, 5.603636964224279e-05, 6.419012788683176e-05, 7.234388613142073e-05, 8.04976443760097e-05, 8.865140262059867e-05, 9.680516086518764e-05, 0.00010495891910977662, 0.00011311267735436559, 0.00012126643559895456, 0.00012942019384354353, 0.0001375739520881325, 0.00014572771033272147, 0.00015388146857731044, 0.00016203522682189941, 0.00017018898506648839, 0.00017834274331107736, 0.00018649650155566633, 0.0001946502598002553, 0.00020280401804484427, 0.00021095777628943324, 0.0002191115345340222, 0.00022726529277861118, 0.00023541905102320015, 0.00024357280926778913, 0.0002517265675123781, 0.00025988032575696707, 0.00026803408400155604, 0.000276187842246145, 0.000284341600490734, 0.00029249535873532295, 0.0003006491169799119]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 9.0, 13.0, 13.0, 18.0, 26.0, 17.0, 35.0, 30.0, 34.0, 40.0, 46.0, 63.0, 51.0, 52.0, 41.0, 58.0, 49.0, 51.0, 56.0, 52.0, 39.0, 42.0, 29.0, 25.0, 19.0, 10.0, 18.0, 13.0, 15.0, 4.0, 7.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00014838608331046999, -0.00014413964527193457, -0.00013989320723339915, -0.0001356467546429485, -0.0001314003166044131, -0.00012715387856587768, -0.00012290742597542703, -0.00011866098793689162, -0.0001144145498983562, -0.00011016811185982078, -0.00010592166654532775, -0.00010167522123083472, -9.74287831922993e-05, -9.318234515376389e-05, -8.893589983927086e-05, -8.468945452477783e-05, -8.044301648624241e-05, -7.6196578447707e-05, -7.195013313321397e-05, -6.770368781872094e-05, -6.345724978018552e-05, -5.92108081036713e-05, -5.4964366427157074e-05, -5.071792475064285e-05, -4.647148307412863e-05, -4.2225041397614405e-05, -3.797859972110018e-05, -3.373215804458596e-05, -2.9485716368071735e-05, -2.523927469155751e-05, -2.099283301504329e-05, -1.6746391338529065e-05, -1.249996421393007e-05, -8.253522537415847e-06, -4.007080860901624e-06, 2.3936081561259925e-07, 4.4858024921268225e-06, 8.732244168641046e-06, 1.2978685845155269e-05, 1.7225127521669492e-05, 2.1471569198183715e-05, 2.571801087469794e-05, 2.9964452551212162e-05, 3.4210894227726385e-05, 3.845733590424061e-05, 4.270377758075483e-05, 4.6950219257269055e-05, 5.119666093378328e-05, 5.54431026102975e-05, 5.9689544286811724e-05, 6.393598596332595e-05, 6.818243127781898e-05, 7.24288693163544e-05, 7.667530735488981e-05, 8.092175266938284e-05, 8.516819798387587e-05, 8.941463602241129e-05, 9.36610740609467e-05, 9.790751937543973e-05, 0.00010215396468993276, 0.00010640040272846818, 0.0001106468407670036, 0.00011489328608149663, 0.00011913973139598966, 0.00012338616943452507]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 7.0, 3.0, 7.0, 7.0, 18.0, 15.0, 21.0, 39.0, 48.0, 63.0, 120.0, 145.0, 251.0, 394.0, 677.0, 1043.0, 1854.0, 3591.0, 6947.0, 14277.0, 33694.0, 95400.0, 382711.0, 357859.0, 89232.0, 31757.0, 13535.0, 6644.0, 3481.0, 1911.0, 1088.0, 646.0, 366.0, 238.0, 157.0, 116.0, 67.0, 48.0, 26.0, 25.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00018835067749023438, -0.00018245913088321686, -0.00017656758427619934, -0.00017067603766918182, -0.0001647844910621643, -0.0001588929444551468, -0.00015300139784812927, -0.00014710985124111176, -0.00014121830463409424, -0.00013532675802707672, -0.0001294352114200592, -0.0001235436648130417, -0.00011765211820602417, -0.00011176057159900665, -0.00010586902499198914, -9.997747838497162e-05, -9.40859317779541e-05, -8.819438517093658e-05, -8.230283856391907e-05, -7.641129195690155e-05, -7.051974534988403e-05, -6.462819874286652e-05, -5.8736652135849e-05, -5.284510552883148e-05, -4.6953558921813965e-05, -4.106201231479645e-05, -3.517046570777893e-05, -2.9278919100761414e-05, -2.3387372493743896e-05, -1.749582588672638e-05, -1.1604279279708862e-05, -5.712732672691345e-06, 1.7881393432617188e-07, 6.070360541343689e-06, 1.1961907148361206e-05, 1.7853453755378723e-05, 2.374500036239624e-05, 2.9636546969413757e-05, 3.5528093576431274e-05, 4.141964018344879e-05, 4.731118679046631e-05, 5.3202733397483826e-05, 5.909428000450134e-05, 6.498582661151886e-05, 7.087737321853638e-05, 7.67689198255539e-05, 8.266046643257141e-05, 8.855201303958893e-05, 9.444355964660645e-05, 0.00010033510625362396, 0.00010622665286064148, 0.000112118199467659, 0.00011800974607467651, 0.00012390129268169403, 0.00012979283928871155, 0.00013568438589572906, 0.00014157593250274658, 0.0001474674791097641, 0.00015335902571678162, 0.00015925057232379913, 0.00016514211893081665, 0.00017103366553783417, 0.00017692521214485168, 0.0001828167587518692, 0.00018870830535888672]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 12.0, 21.0, 26.0, 38.0, 36.0, 45.0, 41.0, 45.0, 56.0, 61.0, 50.0, 56.0, 63.0, 58.0, 56.0, 65.0, 43.0, 36.0, 45.0, 18.0, 22.0, 19.0, 16.0, 5.0, 9.0, 10.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000385284423828125, -0.0003749430179595947, -0.00036460161209106445, -0.0003542602062225342, -0.0003439188003540039, -0.00033357739448547363, -0.00032323598861694336, -0.0003128945827484131, -0.0003025531768798828, -0.00029221177101135254, -0.00028187036514282227, -0.000271528959274292, -0.0002611875534057617, -0.00025084614753723145, -0.00024050474166870117, -0.0002301633358001709, -0.00021982192993164062, -0.00020948052406311035, -0.00019913911819458008, -0.0001887977123260498, -0.00017845630645751953, -0.00016811490058898926, -0.00015777349472045898, -0.0001474320888519287, -0.00013709068298339844, -0.00012674927711486816, -0.00011640787124633789, -0.00010606646537780762, -9.572505950927734e-05, -8.538365364074707e-05, -7.50422477722168e-05, -6.470084190368652e-05, -5.435943603515625e-05, -4.4018030166625977e-05, -3.36766242980957e-05, -2.333521842956543e-05, -1.2993812561035156e-05, -2.652406692504883e-06, 7.68899917602539e-06, 1.8030405044555664e-05, 2.8371810913085938e-05, 3.871321678161621e-05, 4.9054622650146484e-05, 5.939602851867676e-05, 6.973743438720703e-05, 8.00788402557373e-05, 9.042024612426758e-05, 0.00010076165199279785, 0.00011110305786132812, 0.0001214444637298584, 0.00013178586959838867, 0.00014212727546691895, 0.00015246868133544922, 0.0001628100872039795, 0.00017315149307250977, 0.00018349289894104004, 0.0001938343048095703, 0.00020417571067810059, 0.00021451711654663086, 0.00022485852241516113, 0.0002351999282836914, 0.0002455413341522217, 0.00025588274002075195, 0.0002662241458892822, 0.0002765655517578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 10.0, 6.0, 13.0, 11.0, 8.0, 18.0, 27.0, 41.0, 44.0, 80.0, 110.0, 158.0, 314.0, 640.0, 5020.0, 843671.0, 194685.0, 2437.0, 482.0, 264.0, 135.0, 100.0, 68.0, 56.0, 37.0, 34.0, 20.0, 13.0, 7.0, 11.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0007524490356445312, -0.0007330924272537231, -0.000713735818862915, -0.0006943792104721069, -0.0006750226020812988, -0.0006556659936904907, -0.0006363093852996826, -0.0006169527769088745, -0.0005975961685180664, -0.0005782395601272583, -0.0005588829517364502, -0.0005395263433456421, -0.000520169734954834, -0.0005008131265640259, -0.0004814565181732178, -0.00046209990978240967, -0.00044274330139160156, -0.00042338669300079346, -0.00040403008460998535, -0.00038467347621917725, -0.00036531686782836914, -0.00034596025943756104, -0.00032660365104675293, -0.0003072470426559448, -0.0002878904342651367, -0.0002685338258743286, -0.0002491772174835205, -0.0002298206090927124, -0.0002104640007019043, -0.0001911073923110962, -0.00017175078392028809, -0.00015239417552947998, -0.00013303756713867188, -0.00011368095874786377, -9.432435035705566e-05, -7.496774196624756e-05, -5.561113357543945e-05, -3.625452518463135e-05, -1.6897916793823242e-05, 2.4586915969848633e-06, 2.181529998779297e-05, 4.1171908378601074e-05, 6.052851676940918e-05, 7.988512516021729e-05, 9.924173355102539e-05, 0.0001185983419418335, 0.0001379549503326416, 0.0001573115587234497, 0.0001766681671142578, 0.00019602477550506592, 0.00021538138389587402, 0.00023473799228668213, 0.00025409460067749023, 0.00027345120906829834, 0.00029280781745910645, 0.00031216442584991455, 0.00033152103424072266, 0.00035087764263153076, 0.00037023425102233887, 0.00038959085941314697, 0.0004089474678039551, 0.0004283040761947632, 0.0004476606845855713, 0.0004670172929763794, 0.0004863739013671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 7.0, 10.0, 11.0, 15.0, 15.0, 18.0, 20.0, 22.0, 28.0, 46.0, 46.0, 40.0, 74.0, 57.0, 68.0, 70.0, 51.0, 47.0, 47.0, 53.0, 38.0, 47.0, 28.0, 24.0, 19.0, 12.0, 14.0, 14.0, 9.0, 11.0, 6.0, 6.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005097389221191406, -0.0004955828189849854, -0.0004814267158508301, -0.0004672706127166748, -0.00045311450958251953, -0.00043895840644836426, -0.000424802303314209, -0.0004106462001800537, -0.00039649009704589844, -0.00038233399391174316, -0.0003681778907775879, -0.0003540217876434326, -0.00033986568450927734, -0.00032570958137512207, -0.0003115534782409668, -0.0002973973751068115, -0.00028324127197265625, -0.000269085168838501, -0.0002549290657043457, -0.00024077296257019043, -0.00022661685943603516, -0.00021246075630187988, -0.0001983046531677246, -0.00018414855003356934, -0.00016999244689941406, -0.0001558363437652588, -0.00014168024063110352, -0.00012752413749694824, -0.00011336803436279297, -9.92119312286377e-05, -8.505582809448242e-05, -7.089972496032715e-05, -5.6743621826171875e-05, -4.25875186920166e-05, -2.8431415557861328e-05, -1.4275312423706055e-05, -1.1920928955078125e-07, 1.4036893844604492e-05, 2.8192996978759766e-05, 4.234910011291504e-05, 5.650520324707031e-05, 7.066130638122559e-05, 8.481740951538086e-05, 9.897351264953613e-05, 0.0001131296157836914, 0.00012728571891784668, 0.00014144182205200195, 0.00015559792518615723, 0.0001697540283203125, 0.00018391013145446777, 0.00019806623458862305, 0.00021222233772277832, 0.0002263784408569336, 0.00024053454399108887, 0.00025469064712524414, 0.0002688467502593994, 0.0002830028533935547, 0.00029715895652770996, 0.00031131505966186523, 0.0003254711627960205, 0.0003396272659301758, 0.00035378336906433105, 0.00036793947219848633, 0.0003820955753326416, 0.0003962516784667969]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 3.0, 3.0, 6.0, 4.0, 10.0, 10.0, 16.0, 11.0, 21.0, 47.0, 40.0, 87.0, 162.0, 298.0, 532.0, 1044.0, 2314.0, 5849.0, 55991.0, 968278.0, 6570.0, 3718.0, 1701.0, 848.0, 404.0, 228.0, 138.0, 74.0, 45.0, 42.0, 20.0, 10.0, 10.0, 0.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.702278137207031e-06, -8.468516170978546e-06, -8.234754204750061e-06, -8.000992238521576e-06, -7.76723027229309e-06, -7.533468306064606e-06, -7.299706339836121e-06, -7.0659443736076355e-06, -6.83218240737915e-06, -6.598420441150665e-06, -6.36465847492218e-06, -6.130896508693695e-06, -5.89713454246521e-06, -5.663372576236725e-06, -5.42961061000824e-06, -5.195848643779755e-06, -4.9620866775512695e-06, -4.7283247113227844e-06, -4.494562745094299e-06, -4.260800778865814e-06, -4.027038812637329e-06, -3.793276846408844e-06, -3.559514880180359e-06, -3.3257529139518738e-06, -3.0919909477233887e-06, -2.8582289814949036e-06, -2.6244670152664185e-06, -2.3907050490379333e-06, -2.1569430828094482e-06, -1.923181116580963e-06, -1.689419150352478e-06, -1.455657184123993e-06, -1.2218952178955078e-06, -9.881332516670227e-07, -7.543712854385376e-07, -5.206093192100525e-07, -2.868473529815674e-07, -5.3085386753082275e-08, 1.8067657947540283e-07, 4.1443854570388794e-07, 6.48200511932373e-07, 8.819624781608582e-07, 1.1157244443893433e-06, 1.3494864106178284e-06, 1.5832483768463135e-06, 1.8170103430747986e-06, 2.0507723093032837e-06, 2.284534275531769e-06, 2.518296241760254e-06, 2.752058207988739e-06, 2.985820174217224e-06, 3.2195821404457092e-06, 3.4533441066741943e-06, 3.6871060729026794e-06, 3.9208680391311646e-06, 4.15463000535965e-06, 4.388391971588135e-06, 4.62215393781662e-06, 4.855915904045105e-06, 5.08967787027359e-06, 5.323439836502075e-06, 5.55720180273056e-06, 5.790963768959045e-06, 6.0247257351875305e-06, 6.258487701416016e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 853.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 9.0, 6.0, 17.0, 19.0, 38.0, 63.0, 93.0, 214.0, 287.0, 710.0, 1635.0, 4364.0, 14347.0, 995813.0, 21906.0, 5356.0, 2033.0, 826.0, 346.0, 166.0, 117.0, 72.0, 39.0, 21.0, 11.0, 8.0, 15.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.059906005859375e-06, -8.773058652877808e-06, -8.48621129989624e-06, -8.199363946914673e-06, -7.912516593933105e-06, -7.625669240951538e-06, -7.338821887969971e-06, -7.051974534988403e-06, -6.765127182006836e-06, -6.4782798290252686e-06, -6.191432476043701e-06, -5.904585123062134e-06, -5.617737770080566e-06, -5.330890417098999e-06, -5.044043064117432e-06, -4.757195711135864e-06, -4.470348358154297e-06, -4.1835010051727295e-06, -3.896653652191162e-06, -3.6098062992095947e-06, -3.3229589462280273e-06, -3.03611159324646e-06, -2.7492642402648926e-06, -2.462416887283325e-06, -2.175569534301758e-06, -1.8887221813201904e-06, -1.601874828338623e-06, -1.3150274753570557e-06, -1.0281801223754883e-06, -7.413327693939209e-07, -4.544854164123535e-07, -1.6763806343078613e-07, 1.1920928955078125e-07, 4.0605664253234863e-07, 6.92903995513916e-07, 9.797513484954834e-07, 1.2665987014770508e-06, 1.5534460544586182e-06, 1.8402934074401855e-06, 2.127140760421753e-06, 2.4139881134033203e-06, 2.7008354663848877e-06, 2.987682819366455e-06, 3.2745301723480225e-06, 3.56137752532959e-06, 3.848224878311157e-06, 4.135072231292725e-06, 4.421919584274292e-06, 4.708766937255859e-06, 4.995614290237427e-06, 5.282461643218994e-06, 5.5693089962005615e-06, 5.856156349182129e-06, 6.143003702163696e-06, 6.429851055145264e-06, 6.716698408126831e-06, 7.0035457611083984e-06, 7.290393114089966e-06, 7.577240467071533e-06, 7.8640878200531e-06, 8.150935173034668e-06, 8.437782526016235e-06, 8.724629878997803e-06, 9.01147723197937e-06, 9.298324584960938e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 5.0, 7.0, 11.0, 34.0, 117.0, 430.0, 247.0, 57.0, 22.0, 9.0, 7.0, 6.0, 9.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.351139068603516e-06, -4.231929779052734e-06, -4.112720489501953e-06, -3.993511199951172e-06, -3.874301910400391e-06, -3.7550926208496094e-06, -3.635883331298828e-06, -3.516674041748047e-06, -3.3974647521972656e-06, -3.2782554626464844e-06, -3.159046173095703e-06, -3.039836883544922e-06, -2.9206275939941406e-06, -2.8014183044433594e-06, -2.682209014892578e-06, -2.562999725341797e-06, -2.4437904357910156e-06, -2.3245811462402344e-06, -2.205371856689453e-06, -2.086162567138672e-06, -1.9669532775878906e-06, -1.8477439880371094e-06, -1.7285346984863281e-06, -1.6093254089355469e-06, -1.4901161193847656e-06, -1.3709068298339844e-06, -1.2516975402832031e-06, -1.1324882507324219e-06, -1.0132789611816406e-06, -8.940696716308594e-07, -7.748603820800781e-07, -6.556510925292969e-07, -5.364418029785156e-07, -4.172325134277344e-07, -2.980232238769531e-07, -1.7881393432617188e-07, -5.960464477539063e-08, 5.960464477539063e-08, 1.7881393432617188e-07, 2.980232238769531e-07, 4.172325134277344e-07, 5.364418029785156e-07, 6.556510925292969e-07, 7.748603820800781e-07, 8.940696716308594e-07, 1.0132789611816406e-06, 1.1324882507324219e-06, 1.2516975402832031e-06, 1.3709068298339844e-06, 1.4901161193847656e-06, 1.6093254089355469e-06, 1.7285346984863281e-06, 1.8477439880371094e-06, 1.9669532775878906e-06, 2.086162567138672e-06, 2.205371856689453e-06, 2.3245811462402344e-06, 2.4437904357910156e-06, 2.562999725341797e-06, 2.682209014892578e-06, 2.8014183044433594e-06, 2.9206275939941406e-06, 3.039836883544922e-06, 3.159046173095703e-06, 3.2782554626464844e-06]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 97.0, 886.0, 33.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042072980431839824, -0.0003545028157532215, -0.0002882758271880448, -0.00022204883862286806, -0.00015582185005769134, -8.959486149251461e-05, -2.3367872927337885e-05, 4.285911563783884e-05, 0.00010908610420301557, 0.0001753130927681923, 0.00024154008133336902, 0.00030776706989854574, 0.00037399405846372247, 0.0004402210470288992, 0.0005064480355940759, 0.0005726750241592526, 0.0006389020127244294, 0.0007051290012896061, 0.0007713559898547828, 0.0008375829784199595, 0.0009038099669851363, 0.000970036955550313, 0.0010362640023231506, 0.0011024909326806664, 0.0011687178630381823, 0.00123494490981102, 0.0013011718401685357, 0.0013673987705260515, 0.0014336258172988892, 0.0014998528640717268, 0.0015660797944292426, 0.0016323067247867584, 0.0016985340043902397, 0.0017647610511630774, 0.0018309879815205932, 0.001897214911878109, 0.0019634419586509466, 0.0020296690054237843, 0.0020958958193659782, 0.002162122866138816, 0.0022283499129116535, 0.002294576959684491, 0.002360804006457329, 0.0024270308203995228, 0.0024932578671723604, 0.002559484913945198, 0.002625711727887392, 0.0026919387746602297, 0.0027581658214330673, 0.002824392868205905, 0.0028906199149787426, 0.0029568467289209366, 0.0030230737756937742, 0.003089300822466612, 0.003155527636408806, 0.0032217546831816435, 0.003287981729954481, 0.0033542087767273188, 0.0034204358235001564, 0.0034866626374423504, 0.003552889684215188, 0.0036191167309880257, 0.0036853435449302197, 0.0037515705917030573, 0.003817797638475895]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 6.0, 5.0, 12.0, 10.0, 15.0, 23.0, 14.0, 22.0, 27.0, 23.0, 26.0, 29.0, 40.0, 36.0, 30.0, 40.0, 38.0, 40.0, 37.0, 34.0, 35.0, 40.0, 44.0, 38.0, 30.0, 38.0, 18.0, 27.0, 37.0, 28.0, 26.0, 15.0, 16.0, 11.0, 23.0, 12.0, 11.0, 5.0, 1.0, 10.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006319772801361978, -0.000612594245467335, -0.0005932112107984722, -0.0005738281179219484, -0.0005544450832530856, -0.0005350620485842228, -0.00051567901391536, -0.0004962959792464972, -0.0004769129154738039, -0.00045752988080494106, -0.0004381468170322478, -0.00041876378236338496, -0.00039938074769452214, -0.00037999768392182887, -0.00036061464925296605, -0.00034123158548027277, -0.00032184855081140995, -0.00030246551614254713, -0.00028308245236985385, -0.00026369941770099103, -0.00024431635392829776, -0.00022493331925943494, -0.00020555028459057212, -0.00018616723536979407, -0.00016678418614901602, -0.00014740113692823797, -0.00012801808770745993, -0.00010863505303859711, -8.925200381781906e-05, -6.986895459704101e-05, -5.048591265222058e-05, -3.110287070740014e-05, -1.1719821486622095e-05, 7.663224096177146e-06, 2.7046269678976387e-05, 4.642931526177563e-05, 6.581236084457487e-05, 8.519541006535292e-05, 0.00010457845201017335, 0.00012396149395499378, 0.00014334454317577183, 0.00016272759239654988, 0.00018211064161732793, 0.00020149367628619075, 0.0002208767255069688, 0.00024025977472774684, 0.00025964280939660966, 0.00027902587316930294, 0.00029840890783816576, 0.0003177919425070286, 0.00033717500627972186, 0.0003565580409485847, 0.00037594110472127795, 0.00039532413939014077, 0.0004147071740590036, 0.0004340902087278664, 0.0004534732725005597, 0.0004728563071694225, 0.0004922393709421158, 0.0005116224056109786, 0.0005310054402798414, 0.0005503884749487042, 0.000569771567825228, 0.0005891546024940908, 0.0006085376371629536]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 3.0, 9.0, 9.0, 21.0, 12.0, 26.0, 26.0, 27.0, 27.0, 36.0, 55.0, 56.0, 67.0, 98.0, 106.0, 134.0, 237.0, 1201.0, 4163987.0, 26608.0, 678.0, 188.0, 114.0, 105.0, 58.0, 66.0, 66.0, 46.0, 31.0, 34.0, 32.0, 27.0, 25.0, 17.0, 10.0, 8.0, 6.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009427070617675781, -0.0009088888764381409, -0.0008750706911087036, -0.0008412525057792664, -0.0008074343204498291, -0.0007736161351203918, -0.0007397979497909546, -0.0007059797644615173, -0.0006721615791320801, -0.0006383433938026428, -0.0006045252084732056, -0.0005707070231437683, -0.0005368888378143311, -0.0005030706524848938, -0.00046925246715545654, -0.0004354342818260193, -0.00040161609649658203, -0.0003677979111671448, -0.0003339797258377075, -0.00030016154050827026, -0.000266343355178833, -0.00023252516984939575, -0.0001987069845199585, -0.00016488879919052124, -0.00013107061386108398, -9.725242853164673e-05, -6.343424320220947e-05, -2.9616057872772217e-05, 4.202127456665039e-06, 3.8020312786102295e-05, 7.183849811553955e-05, 0.0001056566834449768, 0.00013947486877441406, 0.00017329305410385132, 0.00020711123943328857, 0.00024092942476272583, 0.0002747476100921631, 0.00030856579542160034, 0.0003423839807510376, 0.00037620216608047485, 0.0004100203514099121, 0.00044383853673934937, 0.0004776567220687866, 0.0005114749073982239, 0.0005452930927276611, 0.0005791112780570984, 0.0006129294633865356, 0.0006467476487159729, 0.0006805658340454102, 0.0007143840193748474, 0.0007482022047042847, 0.0007820203900337219, 0.0008158385753631592, 0.0008496567606925964, 0.0008834749460220337, 0.000917293131351471, 0.0009511113166809082, 0.0009849295020103455, 0.0010187476873397827, 0.00105256587266922, 0.0010863840579986572, 0.0011202022433280945, 0.0011540204286575317, 0.001187838613986969, 0.0012216567993164062]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 8.0, 10.0, 6.0, 14.0, 17.0, 13.0, 16.0, 19.0, 26.0, 31.0, 38.0, 28.0, 36.0, 41.0, 43.0, 52.0, 32.0, 42.0, 47.0, 42.0, 49.0, 32.0, 37.0, 30.0, 36.0, 25.0, 33.0, 33.0, 23.0, 19.0, 23.0, 9.0, 18.0, 6.0, 10.0, 10.0, 8.0, 4.0, 7.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0934810638427734e-05, -3.0025839805603027e-05, -2.911686897277832e-05, -2.8207898139953613e-05, -2.7298927307128906e-05, -2.63899564743042e-05, -2.5480985641479492e-05, -2.4572014808654785e-05, -2.3663043975830078e-05, -2.275407314300537e-05, -2.1845102310180664e-05, -2.0936131477355957e-05, -2.002716064453125e-05, -1.9118189811706543e-05, -1.8209218978881836e-05, -1.730024814605713e-05, -1.6391277313232422e-05, -1.5482306480407715e-05, -1.4573335647583008e-05, -1.36643648147583e-05, -1.2755393981933594e-05, -1.1846423149108887e-05, -1.093745231628418e-05, -1.0028481483459473e-05, -9.119510650634766e-06, -8.210539817810059e-06, -7.3015689849853516e-06, -6.3925981521606445e-06, -5.4836273193359375e-06, -4.5746564865112305e-06, -3.6656856536865234e-06, -2.7567148208618164e-06, -1.8477439880371094e-06, -9.387731552124023e-07, -2.9802322387695312e-08, 8.791685104370117e-07, 1.7881393432617188e-06, 2.6971101760864258e-06, 3.606081008911133e-06, 4.51505184173584e-06, 5.424022674560547e-06, 6.332993507385254e-06, 7.241964340209961e-06, 8.150935173034668e-06, 9.059906005859375e-06, 9.968876838684082e-06, 1.0877847671508789e-05, 1.1786818504333496e-05, 1.2695789337158203e-05, 1.360476016998291e-05, 1.4513731002807617e-05, 1.5422701835632324e-05, 1.633167266845703e-05, 1.7240643501281738e-05, 1.8149614334106445e-05, 1.9058585166931152e-05, 1.996755599975586e-05, 2.0876526832580566e-05, 2.1785497665405273e-05, 2.269446849822998e-05, 2.3603439331054688e-05, 2.4512410163879395e-05, 2.54213809967041e-05, 2.633035182952881e-05, 2.7239322662353516e-05]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 9.0, 18.0, 72.0, 257.0, 4189966.0, 3707.0, 154.0, 38.0, 14.0, 10.0, 4.0, 8.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011339187622070312, -0.0010931193828582764, -0.0010523200035095215, -0.0010115206241607666, -0.0009707212448120117, -0.0009299218654632568, -0.000889122486114502, -0.0008483231067657471, -0.0008075237274169922, -0.0007667243480682373, -0.0007259249687194824, -0.0006851255893707275, -0.0006443262100219727, -0.0006035268306732178, -0.0005627274513244629, -0.000521928071975708, -0.0004811286926269531, -0.00044032931327819824, -0.00039952993392944336, -0.0003587305545806885, -0.0003179311752319336, -0.0002771317958831787, -0.00023633241653442383, -0.00019553303718566895, -0.00015473365783691406, -0.00011393427848815918, -7.31348991394043e-05, -3.2335519790649414e-05, 8.463859558105469e-06, 4.926323890686035e-05, 9.006261825561523e-05, 0.00013086199760437012, 0.000171661376953125, 0.00021246075630187988, 0.00025326013565063477, 0.00029405951499938965, 0.00033485889434814453, 0.0003756582736968994, 0.0004164576530456543, 0.0004572570323944092, 0.0004980564117431641, 0.0005388557910919189, 0.0005796551704406738, 0.0006204545497894287, 0.0006612539291381836, 0.0007020533084869385, 0.0007428526878356934, 0.0007836520671844482, 0.0008244514465332031, 0.000865250825881958, 0.0009060502052307129, 0.0009468495845794678, 0.0009876489639282227, 0.0010284483432769775, 0.0010692477226257324, 0.0011100471019744873, 0.0011508464813232422, 0.001191645860671997, 0.001232445240020752, 0.0012732446193695068, 0.0013140439987182617, 0.0013548433780670166, 0.0013956427574157715, 0.0014364421367645264, 0.0014772415161132812]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 7.0, 6.0, 22.0, 27.0, 47.0, 98.0, 274.0, 1717.0, 1440.0, 204.0, 94.0, 43.0, 20.0, 14.0, 10.0, 7.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2292137145996094e-05, -2.1432526409626007e-05, -2.057291567325592e-05, -1.9713304936885834e-05, -1.8853694200515747e-05, -1.799408346414566e-05, -1.7134472727775574e-05, -1.6274861991405487e-05, -1.54152512550354e-05, -1.4555640518665314e-05, -1.3696029782295227e-05, -1.283641904592514e-05, -1.1976808309555054e-05, -1.1117197573184967e-05, -1.025758683681488e-05, -9.397976100444794e-06, -8.538365364074707e-06, -7.67875462770462e-06, -6.819143891334534e-06, -5.959533154964447e-06, -5.09992241859436e-06, -4.240311682224274e-06, -3.380700945854187e-06, -2.5210902094841003e-06, -1.6614794731140137e-06, -8.01868736743927e-07, 5.774199962615967e-08, 9.173527359962463e-07, 1.776963472366333e-06, 2.6365742087364197e-06, 3.4961849451065063e-06, 4.355795681476593e-06, 5.21540641784668e-06, 6.075017154216766e-06, 6.934627890586853e-06, 7.79423862695694e-06, 8.653849363327026e-06, 9.513460099697113e-06, 1.03730708360672e-05, 1.1232681572437286e-05, 1.2092292308807373e-05, 1.295190304517746e-05, 1.3811513781547546e-05, 1.4671124517917633e-05, 1.553073525428772e-05, 1.6390345990657806e-05, 1.7249956727027893e-05, 1.810956746339798e-05, 1.8969178199768066e-05, 1.9828788936138153e-05, 2.068839967250824e-05, 2.1548010408878326e-05, 2.2407621145248413e-05, 2.32672318816185e-05, 2.4126842617988586e-05, 2.4986453354358673e-05, 2.584606409072876e-05, 2.6705674827098846e-05, 2.7565285563468933e-05, 2.842489629983902e-05, 2.9284507036209106e-05, 3.0144117772579193e-05, 3.100372850894928e-05, 3.1863339245319366e-05, 3.272294998168945e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 8.0, 2.0, 12.0, 4.0, 13.0, 9.0, 21.0, 21.0, 25.0, 49.0, 59.0, 79.0, 85.0, 97.0, 105.0, 99.0, 78.0, 57.0, 43.0, 24.0, 23.0, 22.0, 10.0, 13.0, 10.0, 8.0, 2.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8570349463261664e-05, -4.725164035335183e-05, -4.5932931243442e-05, -4.4614222133532166e-05, -4.329550938564353e-05, -4.1976800275733694e-05, -4.065809116582386e-05, -3.933938205591403e-05, -3.802066930802539e-05, -3.670196019811556e-05, -3.5383251088205725e-05, -3.406454197829589e-05, -3.274582923040725e-05, -3.142712012049742e-05, -3.0108411010587588e-05, -2.8789701900677755e-05, -2.7470992790767923e-05, -2.615228368085809e-05, -2.4833572751958854e-05, -2.3514863642049022e-05, -2.2196152713149786e-05, -2.0877443603239954e-05, -1.955873449333012e-05, -1.824002538342029e-05, -1.6921314454521053e-05, -1.560260534461122e-05, -1.4283894415711984e-05, -1.2965185305802152e-05, -1.1646475286397617e-05, -1.0327765266993083e-05, -9.00905615708325e-06, -7.690346137678716e-06, -6.371632480295375e-06, -5.052922460890841e-06, -3.7342128962336574e-06, -2.415503331576474e-06, -1.0967933121719398e-06, 2.219167072325945e-07, 1.540625817142427e-06, 2.8593358365469612e-06, 4.1780458559514955e-06, 5.49675587535603e-06, 6.815465440013213e-06, 8.134175004670396e-06, 9.45288502407493e-06, 1.0771595043479465e-05, 1.2090304153389297e-05, 1.3409014172793832e-05, 1.4727724192198366e-05, 1.60464333021082e-05, 1.7365144231007434e-05, 1.8683853340917267e-05, 2.0002564269816503e-05, 2.1321273379726335e-05, 2.2639982489636168e-05, 2.3958691599546e-05, 2.5277402528445236e-05, 2.659611163835507e-05, 2.7914822567254305e-05, 2.9233531677164137e-05, 3.055224078707397e-05, 3.18709498969838e-05, 3.3189659006893635e-05, 3.4508371754782274e-05, 3.582708086469211e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 9.0, 9.0, 6.0, 8.0, 19.0, 14.0, 14.0, 13.0, 26.0, 25.0, 41.0, 28.0, 37.0, 44.0, 41.0, 50.0, 43.0, 36.0, 42.0, 45.0, 45.0, 39.0, 37.0, 35.0, 47.0, 38.0, 33.0, 44.0, 22.0, 17.0, 14.0, 13.0, 19.0, 12.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986637264257297e-05, -2.883641718653962e-05, -2.780646173050627e-05, -2.6776508093462326e-05, -2.5746552637428977e-05, -2.4716597181395628e-05, -2.3686643544351682e-05, -2.2656688088318333e-05, -2.1626732632284984e-05, -2.0596777176251635e-05, -1.9566821720218286e-05, -1.853686808317434e-05, -1.750691262714099e-05, -1.6476957171107642e-05, -1.5447003534063697e-05, -1.4417048078030348e-05, -1.3387092621996999e-05, -1.235713716596365e-05, -1.1327182619425002e-05, -1.0297228072886355e-05, -9.267272616853006e-06, -8.237317160819657e-06, -7.20736261428101e-06, -6.177407612995012e-06, -5.147452611709014e-06, -4.1174976104230154e-06, -3.0875426091370173e-06, -2.057587607851019e-06, -1.027632606565021e-06, 2.3223947209771723e-09, 1.0322773960069753e-06, 2.0622323972929735e-06, 3.0921837606001645e-06, 4.122138761886163e-06, 5.152093763172161e-06, 6.182048764458159e-06, 7.212003765744157e-06, 8.241959221777506e-06, 9.271913768316153e-06, 1.03018683148548e-05, 1.133182377088815e-05, 1.2361779226921499e-05, 1.3391733773460146e-05, 1.4421688319998793e-05, 1.5451643776032142e-05, 1.648159923206549e-05, 1.7511552869109437e-05, 1.8541508325142786e-05, 1.9571463781176135e-05, 2.0601419237209484e-05, 2.1631374693242833e-05, 2.266132833028678e-05, 2.3691283786320128e-05, 2.4721239242353477e-05, 2.5751192879397422e-05, 2.678114833543077e-05, 2.781110379146412e-05, 2.884105924749747e-05, 2.9871014703530818e-05, 3.090097015956417e-05, 3.1930925615597516e-05, 3.296087743365206e-05, 3.399083288968541e-05, 3.5020788345718756e-05, 3.6050743801752105e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 6.0, 7.0, 8.0, 6.0, 18.0, 21.0, 25.0, 31.0, 29.0, 50.0, 94.0, 111.0, 124.0, 215.0, 338.0, 338.0, 706.0, 1209.0, 1720.0, 4108.0, 11239.0, 36496.0, 852360.0, 114209.0, 12875.0, 5908.0, 2607.0, 1128.0, 854.0, 558.0, 293.0, 249.0, 174.0, 84.0, 82.0, 73.0, 59.0, 42.0, 29.0, 13.0, 15.0, 8.0, 16.0, 9.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.821487426757812e-06, -8.543021976947784e-06, -8.264556527137756e-06, -7.986091077327728e-06, -7.7076256275177e-06, -7.429160177707672e-06, -7.150694727897644e-06, -6.872229278087616e-06, -6.593763828277588e-06, -6.31529837846756e-06, -6.036832928657532e-06, -5.758367478847504e-06, -5.479902029037476e-06, -5.2014365792274475e-06, -4.9229711294174194e-06, -4.644505679607391e-06, -4.366040229797363e-06, -4.087574779987335e-06, -3.809109330177307e-06, -3.530643880367279e-06, -3.252178430557251e-06, -2.973712980747223e-06, -2.695247530937195e-06, -2.4167820811271667e-06, -2.1383166313171387e-06, -1.8598511815071106e-06, -1.5813857316970825e-06, -1.3029202818870544e-06, -1.0244548320770264e-06, -7.459893822669983e-07, -4.675239324569702e-07, -1.8905848264694214e-07, 8.940696716308594e-08, 3.67872416973114e-07, 6.463378667831421e-07, 9.248033165931702e-07, 1.2032687664031982e-06, 1.4817342162132263e-06, 1.7601996660232544e-06, 2.0386651158332825e-06, 2.3171305656433105e-06, 2.5955960154533386e-06, 2.8740614652633667e-06, 3.1525269150733948e-06, 3.430992364883423e-06, 3.709457814693451e-06, 3.987923264503479e-06, 4.266388714313507e-06, 4.544854164123535e-06, 4.823319613933563e-06, 5.101785063743591e-06, 5.380250513553619e-06, 5.6587159633636475e-06, 5.9371814131736755e-06, 6.215646862983704e-06, 6.494112312793732e-06, 6.77257776260376e-06, 7.051043212413788e-06, 7.329508662223816e-06, 7.607974112033844e-06, 7.886439561843872e-06, 8.1649050116539e-06, 8.443370461463928e-06, 8.721835911273956e-06, 9.000301361083984e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 7.0, 4.0, 2.0, 7.0, 10.0, 10.0, 11.0, 23.0, 21.0, 21.0, 34.0, 32.0, 40.0, 45.0, 39.0, 53.0, 41.0, 41.0, 48.0, 52.0, 57.0, 51.0, 40.0, 35.0, 44.0, 35.0, 46.0, 28.0, 22.0, 17.0, 13.0, 11.0, 15.0, 14.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771615982055664e-05, -2.68714502453804e-05, -2.6026740670204163e-05, -2.5182031095027924e-05, -2.4337321519851685e-05, -2.3492611944675446e-05, -2.2647902369499207e-05, -2.1803192794322968e-05, -2.095848321914673e-05, -2.011377364397049e-05, -1.926906406879425e-05, -1.842435449361801e-05, -1.7579644918441772e-05, -1.6734935343265533e-05, -1.5890225768089294e-05, -1.5045516192913055e-05, -1.4200806617736816e-05, -1.3356097042560577e-05, -1.2511387467384338e-05, -1.16666778922081e-05, -1.082196831703186e-05, -9.977258741855621e-06, -9.132549166679382e-06, -8.287839591503143e-06, -7.443130016326904e-06, -6.598420441150665e-06, -5.753710865974426e-06, -4.909001290798187e-06, -4.064291715621948e-06, -3.2195821404457092e-06, -2.3748725652694702e-06, -1.5301629900932312e-06, -6.854534149169922e-07, 1.5925616025924683e-07, 1.0039657354354858e-06, 1.8486753106117249e-06, 2.693384885787964e-06, 3.538094460964203e-06, 4.382804036140442e-06, 5.227513611316681e-06, 6.07222318649292e-06, 6.916932761669159e-06, 7.761642336845398e-06, 8.606351912021637e-06, 9.451061487197876e-06, 1.0295771062374115e-05, 1.1140480637550354e-05, 1.1985190212726593e-05, 1.2829899787902832e-05, 1.3674609363079071e-05, 1.451931893825531e-05, 1.536402851343155e-05, 1.6208738088607788e-05, 1.7053447663784027e-05, 1.7898157238960266e-05, 1.8742866814136505e-05, 1.9587576389312744e-05, 2.0432285964488983e-05, 2.1276995539665222e-05, 2.212170511484146e-05, 2.29664146900177e-05, 2.381112426519394e-05, 2.4655833840370178e-05, 2.5500543415546417e-05, 2.6345252990722656e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 1.0, 6.0, 7.0, 8.0, 9.0, 19.0, 25.0, 33.0, 46.0, 153.0, 178.0, 377.0, 1559.0, 5602.0, 929965.0, 102617.0, 6429.0, 717.0, 444.0, 135.0, 103.0, 42.0, 15.0, 20.0, 8.0, 9.0, 2.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.245208740234375e-06, -5.098991096019745e-06, -4.952773451805115e-06, -4.806555807590485e-06, -4.6603381633758545e-06, -4.514120519161224e-06, -4.367902874946594e-06, -4.221685230731964e-06, -4.075467586517334e-06, -3.929249942302704e-06, -3.7830322980880737e-06, -3.6368146538734436e-06, -3.4905970096588135e-06, -3.3443793654441833e-06, -3.1981617212295532e-06, -3.051944077014923e-06, -2.905726432800293e-06, -2.759508788585663e-06, -2.6132911443710327e-06, -2.4670735001564026e-06, -2.3208558559417725e-06, -2.1746382117271423e-06, -2.028420567512512e-06, -1.882202923297882e-06, -1.735985279083252e-06, -1.5897676348686218e-06, -1.4435499906539917e-06, -1.2973323464393616e-06, -1.1511147022247314e-06, -1.0048970580101013e-06, -8.586794137954712e-07, -7.124617695808411e-07, -5.662441253662109e-07, -4.200264811515808e-07, -2.738088369369507e-07, -1.2759119272232056e-07, 1.862645149230957e-08, 1.648440957069397e-07, 3.110617399215698e-07, 4.5727938413619995e-07, 6.034970283508301e-07, 7.497146725654602e-07, 8.959323167800903e-07, 1.0421499609947205e-06, 1.1883676052093506e-06, 1.3345852494239807e-06, 1.4808028936386108e-06, 1.627020537853241e-06, 1.773238182067871e-06, 1.9194558262825012e-06, 2.0656734704971313e-06, 2.2118911147117615e-06, 2.3581087589263916e-06, 2.5043264031410217e-06, 2.650544047355652e-06, 2.796761691570282e-06, 2.942979335784912e-06, 3.0891969799995422e-06, 3.2354146242141724e-06, 3.3816322684288025e-06, 3.5278499126434326e-06, 3.6740675568580627e-06, 3.820285201072693e-06, 3.966502845287323e-06, 4.112720489501953e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 7.0, 16.0, 10.0, 21.0, 40.0, 62.0, 63.0, 74.0, 89.0, 109.0, 96.0, 93.0, 82.0, 72.0, 51.0, 31.0, 34.0, 14.0, 10.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00013816356658935547, -0.0001343265175819397, -0.00013048946857452393, -0.00012665241956710815, -0.00012281537055969238, -0.00011897832155227661, -0.00011514127254486084, -0.00011130422353744507, -0.0001074671745300293, -0.00010363012552261353, -9.979307651519775e-05, -9.595602750778198e-05, -9.211897850036621e-05, -8.828192949295044e-05, -8.444488048553467e-05, -8.06078314781189e-05, -7.677078247070312e-05, -7.293373346328735e-05, -6.909668445587158e-05, -6.525963544845581e-05, -6.142258644104004e-05, -5.758553743362427e-05, -5.3748488426208496e-05, -4.9911439418792725e-05, -4.607439041137695e-05, -4.223734140396118e-05, -3.840029239654541e-05, -3.456324338912964e-05, -3.072619438171387e-05, -2.6889145374298096e-05, -2.3052096366882324e-05, -1.9215047359466553e-05, -1.537799835205078e-05, -1.154094934463501e-05, -7.703900337219238e-06, -3.866851329803467e-06, -2.9802322387695312e-08, 3.807246685028076e-06, 7.644295692443848e-06, 1.1481344699859619e-05, 1.531839370727539e-05, 1.9155442714691162e-05, 2.2992491722106934e-05, 2.6829540729522705e-05, 3.0666589736938477e-05, 3.450363874435425e-05, 3.834068775177002e-05, 4.217773675918579e-05, 4.601478576660156e-05, 4.9851834774017334e-05, 5.3688883781433105e-05, 5.752593278884888e-05, 6.136298179626465e-05, 6.520003080368042e-05, 6.903707981109619e-05, 7.287412881851196e-05, 7.671117782592773e-05, 8.05482268333435e-05, 8.438527584075928e-05, 8.822232484817505e-05, 9.205937385559082e-05, 9.589642286300659e-05, 9.973347187042236e-05, 0.00010357052087783813, 0.0001074075698852539]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 94.0, 0.0, 0.0, 0.0, 0.0, 127.0, 0.0, 0.0, 0.0, 0.0, 417.0, 0.0, 0.0, 0.0, 151.0, 0.0, 0.0, 0.0, 0.0, 89.0, 0.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 9.0, 30.0, 44.0, 150.0, 305.0, 290.0, 104.0, 47.0, 16.0, 3.0, 8.0, 3.0, 1.0, 1.0], "bins": [-0.00017781545466277748, -0.00017457333160564303, -0.0001713312231004238, -0.00016808910004328936, -0.00016484697698615491, -0.0001616048684809357, -0.00015836274542380124, -0.0001551206223666668, -0.00015187851386144757, -0.00014863639080431312, -0.0001453942822990939, -0.00014215215924195945, -0.000138910036184825, -0.00013566792767960578, -0.00013242580462247133, -0.00012918368156533688, -0.00012594155850820243, -0.00012269943545106798, -0.00011945731966989115, -0.00011621520388871431, -0.00011297308810753748, -0.00010973097232636064, -0.0001064888492692262, -0.00010324673348804936, -0.00010000461770687252, -9.676250192569569e-05, -9.352037886856124e-05, -9.02782630873844e-05, -8.703614730620757e-05, -8.379403152503073e-05, -8.055190846789628e-05, -7.730979268671945e-05, -7.4067669629585e-05, -7.082555384840816e-05, -6.758343079127371e-05, -6.434131501009688e-05, -6.109919922892004e-05, -5.78570798097644e-05, -5.461496039060876e-05, -5.137284460943192e-05, -4.813072882825509e-05, -4.4888609409099445e-05, -4.164649362792261e-05, -3.840437420876697e-05, -3.516225842759013e-05, -3.192013900843449e-05, -2.8678019589278847e-05, -2.5435901989112608e-05, -2.2193782569956966e-05, -1.8951664969790727e-05, -1.5709545550635085e-05, -1.2467427950468846e-05, -9.225310350302607e-06, -5.983192750136368e-06, -2.7410733309807256e-06, 5.010442691855133e-07, 3.743161869351752e-06, 6.985279924265342e-06, 1.0227397979178932e-05, 1.3469516488839872e-05, 1.671163408900611e-05, 1.995375168917235e-05, 2.3195871108327992e-05, 2.643798870849423e-05, 2.968010630866047e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 11.0, 3.0, 11.0, 13.0, 18.0, 12.0, 17.0, 22.0, 26.0, 39.0, 38.0, 31.0, 49.0, 47.0, 49.0, 46.0, 32.0, 44.0, 40.0, 56.0, 30.0, 42.0, 38.0, 40.0, 54.0, 46.0, 26.0, 14.0, 13.0, 14.0, 22.0, 10.0, 9.0, 10.0, 6.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4854645744198933e-05, -2.4061584554146975e-05, -2.3268523364095017e-05, -2.2475463993032463e-05, -2.1682402802980505e-05, -2.0889341612928547e-05, -2.009628042287659e-05, -1.9303221051814035e-05, -1.8510159861762077e-05, -1.771709867171012e-05, -1.692403748165816e-05, -1.6130978110595606e-05, -1.5337916920543648e-05, -1.454485573049169e-05, -1.3751794540439732e-05, -1.2958734259882476e-05, -1.2165673069830518e-05, -1.137261187977856e-05, -1.0579551599221304e-05, -9.786490409169346e-06, -8.99343012861209e-06, -8.200368938560132e-06, -7.407308203255525e-06, -6.614247467950918e-06, -5.821186732646311e-06, -5.028125997341704e-06, -4.2350652620370965e-06, -3.442004299358814e-06, -2.648943564054207e-06, -1.8558826013759244e-06, -1.0628218660713173e-06, -2.6976113076671027e-07, 5.232996045378968e-07, 1.3163603398425039e-06, 2.109421075147111e-06, 2.9024820378253935e-06, 3.6955427731300006e-06, 4.488603735808283e-06, 5.28166447111289e-06, 6.074725206417497e-06, 6.867785941722104e-06, 7.660846677026711e-06, 8.45390786707867e-06, 9.246968147635926e-06, 1.0040029337687884e-05, 1.083308961824514e-05, 1.1626150808297098e-05, 1.2419211998349056e-05, 1.3212272278906312e-05, 1.400533346895827e-05, 1.4798393749515526e-05, 1.5591454939567484e-05, 1.6384516129619442e-05, 1.7177575500681996e-05, 1.7970636690733954e-05, 1.8763697880785912e-05, 1.955675907083787e-05, 2.0349820260889828e-05, 2.1142881450941786e-05, 2.193594082200434e-05, 2.27290020120563e-05, 2.3522063202108257e-05, 2.4315124392160214e-05, 2.510818376322277e-05, 2.5901244953274727e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 9.0, 11.0, 15.0, 21.0, 27.0, 50.0, 62.0, 76.0, 140.0, 433.0, 1746.0, 12086.0, 123888.0, 798578.0, 98954.0, 10123.0, 1524.0, 353.0, 144.0, 84.0, 57.0, 35.0, 23.0, 27.0, 23.0, 11.0, 12.0, 11.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.00011485815048217773, -0.00011208746582269669, -0.00010931678116321564, -0.00010654609650373459, -0.00010377541184425354, -0.00010100472718477249, -9.823404252529144e-05, -9.54633578658104e-05, -9.269267320632935e-05, -8.99219885468483e-05, -8.715130388736725e-05, -8.43806192278862e-05, -8.160993456840515e-05, -7.88392499089241e-05, -7.606856524944305e-05, -7.3297880589962e-05, -7.052719593048096e-05, -6.775651127099991e-05, -6.498582661151886e-05, -6.221514195203781e-05, -5.944445729255676e-05, -5.6673772633075714e-05, -5.3903087973594666e-05, -5.113240331411362e-05, -4.836171865463257e-05, -4.559103399515152e-05, -4.282034933567047e-05, -4.004966467618942e-05, -3.7278980016708374e-05, -3.4508295357227325e-05, -3.173761069774628e-05, -2.8966926038265228e-05, -2.619624137878418e-05, -2.342555671930313e-05, -2.0654872059822083e-05, -1.7884187400341034e-05, -1.5113502740859985e-05, -1.2342818081378937e-05, -9.572133421897888e-06, -6.80144876241684e-06, -4.030764102935791e-06, -1.2600794434547424e-06, 1.5106052160263062e-06, 4.281289875507355e-06, 7.051974534988403e-06, 9.822659194469452e-06, 1.25933438539505e-05, 1.536402851343155e-05, 1.8134713172912598e-05, 2.0905397832393646e-05, 2.3676082491874695e-05, 2.6446767151355743e-05, 2.9217451810836792e-05, 3.198813647031784e-05, 3.475882112979889e-05, 3.752950578927994e-05, 4.0300190448760986e-05, 4.3070875108242035e-05, 4.5841559767723083e-05, 4.861224442720413e-05, 5.138292908668518e-05, 5.415361374616623e-05, 5.692429840564728e-05, 5.9694983065128326e-05, 6.246566772460938e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 10.0, 12.0, 14.0, 24.0, 31.0, 34.0, 38.0, 38.0, 55.0, 49.0, 59.0, 67.0, 64.0, 67.0, 51.0, 58.0, 46.0, 39.0, 47.0, 30.0, 24.0, 29.0, 17.0, 23.0, 12.0, 10.0, 13.0, 7.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0002276897430419922, -0.0002222210168838501, -0.000216752290725708, -0.00021128356456756592, -0.00020581483840942383, -0.00020034611225128174, -0.00019487738609313965, -0.00018940865993499756, -0.00018393993377685547, -0.00017847120761871338, -0.0001730024814605713, -0.0001675337553024292, -0.0001620650291442871, -0.00015659630298614502, -0.00015112757682800293, -0.00014565885066986084, -0.00014019012451171875, -0.00013472139835357666, -0.00012925267219543457, -0.00012378394603729248, -0.00011831521987915039, -0.0001128464937210083, -0.00010737776756286621, -0.00010190904140472412, -9.644031524658203e-05, -9.097158908843994e-05, -8.550286293029785e-05, -8.003413677215576e-05, -7.456541061401367e-05, -6.909668445587158e-05, -6.362795829772949e-05, -5.81592321395874e-05, -5.269050598144531e-05, -4.722177982330322e-05, -4.175305366516113e-05, -3.628432750701904e-05, -3.081560134887695e-05, -2.5346875190734863e-05, -1.9878149032592773e-05, -1.4409422874450684e-05, -8.940696716308594e-06, -3.471970558166504e-06, 1.996755599975586e-06, 7.465481758117676e-06, 1.2934207916259766e-05, 1.8402934074401855e-05, 2.3871660232543945e-05, 2.9340386390686035e-05, 3.4809112548828125e-05, 4.0277838706970215e-05, 4.5746564865112305e-05, 5.1215291023254395e-05, 5.6684017181396484e-05, 6.215274333953857e-05, 6.762146949768066e-05, 7.309019565582275e-05, 7.855892181396484e-05, 8.402764797210693e-05, 8.949637413024902e-05, 9.496510028839111e-05, 0.0001004338264465332, 0.00010590255260467529, 0.00011137127876281738, 0.00011684000492095947, 0.00012230873107910156]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 10.0, 6.0, 10.0, 14.0, 23.0, 22.0, 49.0, 70.0, 124.0, 277.0, 874.0, 835238.0, 210400.0, 793.0, 337.0, 93.0, 67.0, 27.0, 28.0, 32.0, 16.0, 11.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0009350776672363281, -0.0009110867977142334, -0.0008870959281921387, -0.0008631050586700439, -0.0008391141891479492, -0.0008151233196258545, -0.0007911324501037598, -0.000767141580581665, -0.0007431507110595703, -0.0007191598415374756, -0.0006951689720153809, -0.0006711781024932861, -0.0006471872329711914, -0.0006231963634490967, -0.000599205493927002, -0.0005752146244049072, -0.0005512237548828125, -0.0005272328853607178, -0.000503242015838623, -0.0004792511463165283, -0.0004552602767944336, -0.00043126940727233887, -0.00040727853775024414, -0.0003832876682281494, -0.0003592967987060547, -0.00033530592918395996, -0.00031131505966186523, -0.0002873241901397705, -0.0002633333206176758, -0.00023934245109558105, -0.00021535158157348633, -0.0001913607120513916, -0.00016736984252929688, -0.00014337897300720215, -0.00011938810348510742, -9.53972339630127e-05, -7.140636444091797e-05, -4.741549491882324e-05, -2.3424625396728516e-05, 5.662441253662109e-07, 2.4557113647460938e-05, 4.8547983169555664e-05, 7.253885269165039e-05, 9.652972221374512e-05, 0.00012052059173583984, 0.00014451146125793457, 0.0001685023307800293, 0.00019249320030212402, 0.00021648406982421875, 0.00024047493934631348, 0.0002644658088684082, 0.00028845667839050293, 0.00031244754791259766, 0.0003364384174346924, 0.0003604292869567871, 0.00038442015647888184, 0.00040841102600097656, 0.0004324018955230713, 0.000456392765045166, 0.00048038363456726074, 0.0005043745040893555, 0.0005283653736114502, 0.0005523562431335449, 0.0005763471126556396, 0.0006003379821777344]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 6.0, 7.0, 8.0, 8.0, 7.0, 20.0, 21.0, 38.0, 39.0, 45.0, 67.0, 88.0, 100.0, 107.0, 106.0, 87.0, 59.0, 52.0, 39.0, 27.0, 22.0, 18.0, 12.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00045561790466308594, -0.00044374167919158936, -0.0004318654537200928, -0.0004199892282485962, -0.0004081130027770996, -0.00039623677730560303, -0.00038436055183410645, -0.00037248432636260986, -0.0003606081008911133, -0.0003487318754196167, -0.0003368556499481201, -0.00032497942447662354, -0.00031310319900512695, -0.00030122697353363037, -0.0002893507480621338, -0.0002774745225906372, -0.0002655982971191406, -0.00025372207164764404, -0.00024184584617614746, -0.00022996962070465088, -0.0002180933952331543, -0.00020621716976165771, -0.00019434094429016113, -0.00018246471881866455, -0.00017058849334716797, -0.0001587122678756714, -0.0001468360424041748, -0.00013495981693267822, -0.00012308359146118164, -0.00011120736598968506, -9.933114051818848e-05, -8.74549150466919e-05, -7.557868957519531e-05, -6.370246410369873e-05, -5.182623863220215e-05, -3.9950013160705566e-05, -2.8073787689208984e-05, -1.6197562217712402e-05, -4.32133674621582e-06, 7.554888725280762e-06, 1.9431114196777344e-05, 3.1307339668273926e-05, 4.318356513977051e-05, 5.505979061126709e-05, 6.693601608276367e-05, 7.881224155426025e-05, 9.068846702575684e-05, 0.00010256469249725342, 0.00011444091796875, 0.00012631714344024658, 0.00013819336891174316, 0.00015006959438323975, 0.00016194581985473633, 0.0001738220453262329, 0.0001856982707977295, 0.00019757449626922607, 0.00020945072174072266, 0.00022132694721221924, 0.00023320317268371582, 0.0002450793981552124, 0.000256955623626709, 0.00026883184909820557, 0.00028070807456970215, 0.00029258430004119873, 0.0003044605255126953]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 3.0, 6.0, 26.0, 20.0, 34.0, 51.0, 70.0, 102.0, 151.0, 254.0, 512.0, 869.0, 1827.0, 12918.0, 39992.0, 934693.0, 40308.0, 9148.0, 3639.0, 1747.0, 904.0, 559.0, 254.0, 175.0, 148.0, 37.0, 26.0, 21.0, 13.0, 10.0, 8.0, 6.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.4845281839370728e-06, -1.4193356037139893e-06, -1.3541430234909058e-06, -1.2889504432678223e-06, -1.2237578630447388e-06, -1.1585652828216553e-06, -1.0933727025985718e-06, -1.0281801223754883e-06, -9.629875421524048e-07, -8.977949619293213e-07, -8.326023817062378e-07, -7.674098014831543e-07, -7.022172212600708e-07, -6.370246410369873e-07, -5.718320608139038e-07, -5.066394805908203e-07, -4.414469003677368e-07, -3.762543201446533e-07, -3.110617399215698e-07, -2.4586915969848633e-07, -1.8067657947540283e-07, -1.1548399925231934e-07, -5.029141902923584e-08, 1.4901161193847656e-08, 8.009374141693115e-08, 1.4528632164001465e-07, 2.1047890186309814e-07, 2.7567148208618164e-07, 3.4086406230926514e-07, 4.0605664253234863e-07, 4.7124922275543213e-07, 5.364418029785156e-07, 6.016343832015991e-07, 6.668269634246826e-07, 7.320195436477661e-07, 7.972121238708496e-07, 8.624047040939331e-07, 9.275972843170166e-07, 9.927898645401e-07, 1.0579824447631836e-06, 1.123175024986267e-06, 1.1883676052093506e-06, 1.253560185432434e-06, 1.3187527656555176e-06, 1.383945345878601e-06, 1.4491379261016846e-06, 1.514330506324768e-06, 1.5795230865478516e-06, 1.644715666770935e-06, 1.7099082469940186e-06, 1.775100827217102e-06, 1.8402934074401855e-06, 1.905485987663269e-06, 1.9706785678863525e-06, 2.035871148109436e-06, 2.1010637283325195e-06, 2.166256308555603e-06, 2.2314488887786865e-06, 2.29664146900177e-06, 2.3618340492248535e-06, 2.427026629447937e-06, 2.4922192096710205e-06, 2.557411789894104e-06, 2.6226043701171875e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 808.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 111.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 10.0, 9.0, 20.0, 21.0, 20.0, 54.0, 51.0, 66.0, 83.0, 101.0, 145.0, 200.0, 265.0, 423.0, 699.0, 1283.0, 2288.0, 4263.0, 9772.0, 41035.0, 926723.0, 41388.0, 9631.0, 4378.0, 2156.0, 1212.0, 731.0, 443.0, 296.0, 173.0, 139.0, 103.0, 69.0, 67.0, 49.0, 36.0, 28.0, 21.0, 21.0, 16.0, 17.0, 4.0, 4.0, 9.0, 7.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.9073486328125e-06, -1.846812665462494e-06, -1.7862766981124878e-06, -1.7257407307624817e-06, -1.6652047634124756e-06, -1.6046687960624695e-06, -1.5441328287124634e-06, -1.4835968613624573e-06, -1.4230608940124512e-06, -1.362524926662445e-06, -1.301988959312439e-06, -1.2414529919624329e-06, -1.1809170246124268e-06, -1.1203810572624207e-06, -1.0598450899124146e-06, -9.993091225624084e-07, -9.387731552124023e-07, -8.782371878623962e-07, -8.177012205123901e-07, -7.57165253162384e-07, -6.966292858123779e-07, -6.360933184623718e-07, -5.755573511123657e-07, -5.150213837623596e-07, -4.544854164123535e-07, -3.939494490623474e-07, -3.334134817123413e-07, -2.728775143623352e-07, -2.123415470123291e-07, -1.51805579662323e-07, -9.12696123123169e-08, -3.073364496231079e-08, 2.9802322387695312e-08, 9.033828973770142e-08, 1.5087425708770752e-07, 2.1141022443771362e-07, 2.7194619178771973e-07, 3.3248215913772583e-07, 3.9301812648773193e-07, 4.5355409383773804e-07, 5.140900611877441e-07, 5.746260285377502e-07, 6.351619958877563e-07, 6.956979632377625e-07, 7.562339305877686e-07, 8.167698979377747e-07, 8.773058652877808e-07, 9.378418326377869e-07, 9.98377799987793e-07, 1.058913767337799e-06, 1.1194497346878052e-06, 1.1799857020378113e-06, 1.2405216693878174e-06, 1.3010576367378235e-06, 1.3615936040878296e-06, 1.4221295714378357e-06, 1.4826655387878418e-06, 1.543201506137848e-06, 1.603737473487854e-06, 1.6642734408378601e-06, 1.7248094081878662e-06, 1.7853453755378723e-06, 1.8458813428878784e-06, 1.9064173102378845e-06, 1.9669532775878906e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 7.0, 0.0, 0.0, 9.0, 0.0, 0.0, 11.0, 0.0, 22.0, 0.0, 0.0, 46.0, 0.0, 105.0, 0.0, 0.0, 576.0, 0.0, 125.0, 0.0, 0.0, 48.0, 0.0, 26.0, 0.0, 0.0, 13.0, 0.0, 0.0, 6.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.515773177146912e-07, -7.282942533493042e-07, -7.050111889839172e-07, -6.817281246185303e-07, -6.584450602531433e-07, -6.351619958877563e-07, -6.118789315223694e-07, -5.885958671569824e-07, -5.653128027915955e-07, -5.420297384262085e-07, -5.187466740608215e-07, -4.954636096954346e-07, -4.721805453300476e-07, -4.4889748096466064e-07, -4.256144165992737e-07, -4.023313522338867e-07, -3.7904828786849976e-07, -3.557652235031128e-07, -3.3248215913772583e-07, -3.0919909477233887e-07, -2.859160304069519e-07, -2.6263296604156494e-07, -2.39349901676178e-07, -2.1606683731079102e-07, -1.9278377294540405e-07, -1.695007085800171e-07, -1.4621764421463013e-07, -1.2293457984924316e-07, -9.96515154838562e-08, -7.636845111846924e-08, -5.3085386753082275e-08, -2.9802322387695312e-08, -6.51925802230835e-09, 1.6763806343078613e-08, 4.0046870708465576e-08, 6.332993507385254e-08, 8.66129994392395e-08, 1.0989606380462646e-07, 1.3317912817001343e-07, 1.564621925354004e-07, 1.7974525690078735e-07, 2.0302832126617432e-07, 2.2631138563156128e-07, 2.4959444999694824e-07, 2.728775143623352e-07, 2.9616057872772217e-07, 3.1944364309310913e-07, 3.427267074584961e-07, 3.6600977182388306e-07, 3.8929283618927e-07, 4.12575900554657e-07, 4.3585896492004395e-07, 4.591420292854309e-07, 4.824250936508179e-07, 5.057081580162048e-07, 5.289912223815918e-07, 5.522742867469788e-07, 5.755573511123657e-07, 5.988404154777527e-07, 6.221234798431396e-07, 6.454065442085266e-07, 6.686896085739136e-07, 6.919726729393005e-07, 7.152557373046875e-07]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 25.0, 983.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005731600103899837, -0.000545083312317729, -0.0005170066142454743, -0.0004889298579655588, -0.0004608531598933041, -0.00043277646182104945, -0.00040469973464496434, -0.0003766230074688792, -0.00034854630939662457, -0.0003204696113243699, -0.0002923928841482848, -0.0002643161569721997, -0.00023623945889994502, -0.00020816274627577513, -0.00018008603365160525, -0.00015200932102743536, -0.00012393260840326548, -9.585589577909559e-05, -6.77791831549257e-05, -3.970247053075582e-05, -1.1625757906585932e-05, 1.6450954717583954e-05, 4.452766734175384e-05, 7.260437996592373e-05, 0.00010068109259009361, 0.0001287578052142635, 0.00015683451783843338, 0.00018491123046260327, 0.00021298794308677316, 0.00024106465571094304, 0.00026914136833511293, 0.00029721809551119804, 0.0003252947935834527, 0.00035337149165570736, 0.0003814482188317925, 0.0004095249460078776, 0.00043760164408013225, 0.0004656783421523869, 0.0004937550984323025, 0.0005218317965045571, 0.0005499084945768118, 0.0005779851926490664, 0.0006060618907213211, 0.0006341386470012367, 0.0006622153450734913, 0.000690292043145746, 0.0007183687994256616, 0.0007464454974979162, 0.0007745221955701709, 0.0008025988936424255, 0.0008306755917146802, 0.0008587523479945958, 0.0008868290460668504, 0.0009149057441391051, 0.0009429825004190207, 0.0009710591984912753, 0.00099913589656353, 0.0010272125946357846, 0.0010552892927080393, 0.001083365990780294, 0.0011114426888525486, 0.001139519503340125, 0.0011675962014123797, 0.0011956728994846344, 0.001223749597556889]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 8.0, 6.0, 5.0, 12.0, 10.0, 11.0, 17.0, 9.0, 14.0, 17.0, 22.0, 30.0, 24.0, 33.0, 33.0, 37.0, 38.0, 39.0, 40.0, 38.0, 49.0, 45.0, 45.0, 38.0, 36.0, 39.0, 25.0, 34.0, 23.0, 28.0, 31.0, 17.0, 15.0, 20.0, 22.0, 11.0, 16.0, 11.0, 14.0, 5.0, 7.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00030405286815948784, -0.00029360834741964936, -0.0002831638266798109, -0.0002727193059399724, -0.0002622747852001339, -0.00025183026446029544, -0.00024138575827237219, -0.0002309412375325337, -0.00022049671679269522, -0.00021005219605285674, -0.00019960767531301826, -0.000189163169125095, -0.00017871864838525653, -0.00016827412764541805, -0.00015782960690557957, -0.00014738508616574109, -0.0001369405654259026, -0.00012649604468606412, -0.00011605152394622564, -0.00010560701048234478, -9.51624897425063e-05, -8.471796900266781e-05, -7.427345553878695e-05, -6.382893479894847e-05, -5.3384414059109986e-05, -4.2939893319271505e-05, -3.249537621741183e-05, -2.2050859115552157e-05, -1.1606338375713676e-05, -1.1618176358751953e-06, 9.282695828005672e-06, 1.9727216567844152e-05, 3.0171737307682633e-05, 4.0616258047521114e-05, 5.106077514938079e-05, 6.150529225124046e-05, 7.194981299107894e-05, 8.239433373091742e-05, 9.283884719479829e-05, 0.00010328336793463677, 0.00011372788867447525, 0.00012417240941431373, 0.00013461693015415221, 0.00014506143634207547, 0.00015550595708191395, 0.00016595047782175243, 0.0001763949985615909, 0.0001868395193014294, 0.00019728404004126787, 0.00020772856078110635, 0.00021817308152094483, 0.00022861760226078331, 0.0002390621230006218, 0.0002495066437404603, 0.00025995116448029876, 0.0002703956561163068, 0.0002808402059599757, 0.0002912847266998142, 0.0003017292474396527, 0.00031217376817949116, 0.00032261828891932964, 0.0003330628096591681, 0.0003435073303990066, 0.00035395182203501463, 0.0003643963427748531]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 6.0, 4.0, 5.0, 8.0, 20.0, 17.0, 22.0, 30.0, 38.0, 49.0, 45.0, 76.0, 65.0, 89.0, 94.0, 97.0, 123.0, 120.0, 158.0, 227.0, 2451.0, 4188573.0, 693.0, 205.0, 184.0, 152.0, 121.0, 104.0, 77.0, 80.0, 54.0, 54.0, 45.0, 42.0, 29.0, 30.0, 21.0, 18.0, 14.0, 13.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003685951232910156, -0.0003578700125217438, -0.0003471449017524719, -0.0003364197909832001, -0.0003256946802139282, -0.00031496956944465637, -0.0003042444586753845, -0.00029351934790611267, -0.0002827942371368408, -0.00027206912636756897, -0.0002613440155982971, -0.00025061890482902527, -0.00023989379405975342, -0.00022916868329048157, -0.00021844357252120972, -0.00020771846175193787, -0.00019699335098266602, -0.00018626824021339417, -0.00017554312944412231, -0.00016481801867485046, -0.0001540929079055786, -0.00014336779713630676, -0.0001326426863670349, -0.00012191757559776306, -0.00011119246482849121, -0.00010046735405921936, -8.974224328994751e-05, -7.901713252067566e-05, -6.829202175140381e-05, -5.756691098213196e-05, -4.684180021286011e-05, -3.611668944358826e-05, -2.5391578674316406e-05, -1.4666467905044556e-05, -3.941357135772705e-06, 6.7837536334991455e-06, 1.7508864402770996e-05, 2.8233975172042847e-05, 3.89590859413147e-05, 4.968419671058655e-05, 6.04093074798584e-05, 7.113441824913025e-05, 8.18595290184021e-05, 9.258463978767395e-05, 0.0001033097505569458, 0.00011403486132621765, 0.0001247599720954895, 0.00013548508286476135, 0.0001462101936340332, 0.00015693530440330505, 0.0001676604151725769, 0.00017838552594184875, 0.0001891106367111206, 0.00019983574748039246, 0.0002105608582496643, 0.00022128596901893616, 0.000232011079788208, 0.00024273619055747986, 0.0002534613013267517, 0.00026418641209602356, 0.0002749115228652954, 0.00028563663363456726, 0.0002963617444038391, 0.00030708685517311096, 0.0003178119659423828]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 9.0, 15.0, 9.0, 7.0, 13.0, 23.0, 20.0, 25.0, 39.0, 29.0, 26.0, 32.0, 48.0, 47.0, 49.0, 60.0, 51.0, 30.0, 48.0, 57.0, 53.0, 44.0, 33.0, 36.0, 19.0, 32.0, 24.0, 15.0, 20.0, 19.0, 11.0, 10.0, 6.0, 8.0, 6.0, 5.0, 8.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.046627044677734e-06, -7.816590368747711e-06, -7.586553692817688e-06, -7.356517016887665e-06, -7.126480340957642e-06, -6.896443665027618e-06, -6.666406989097595e-06, -6.436370313167572e-06, -6.206333637237549e-06, -5.976296961307526e-06, -5.7462602853775024e-06, -5.516223609447479e-06, -5.286186933517456e-06, -5.056150257587433e-06, -4.82611358165741e-06, -4.5960769057273865e-06, -4.366040229797363e-06, -4.13600355386734e-06, -3.905966877937317e-06, -3.6759302020072937e-06, -3.4458935260772705e-06, -3.2158568501472473e-06, -2.985820174217224e-06, -2.755783498287201e-06, -2.5257468223571777e-06, -2.2957101464271545e-06, -2.0656734704971313e-06, -1.8356367945671082e-06, -1.605600118637085e-06, -1.3755634427070618e-06, -1.1455267667770386e-06, -9.154900908470154e-07, -6.854534149169922e-07, -4.55416738986969e-07, -2.253800630569458e-07, 4.6566128730773926e-09, 2.3469328880310059e-07, 4.647299647331238e-07, 6.94766640663147e-07, 9.248033165931702e-07, 1.1548399925231934e-06, 1.3848766684532166e-06, 1.6149133443832397e-06, 1.844950020313263e-06, 2.074986696243286e-06, 2.3050233721733093e-06, 2.5350600481033325e-06, 2.7650967240333557e-06, 2.995133399963379e-06, 3.225170075893402e-06, 3.4552067518234253e-06, 3.6852434277534485e-06, 3.915280103683472e-06, 4.145316779613495e-06, 4.375353455543518e-06, 4.605390131473541e-06, 4.8354268074035645e-06, 5.065463483333588e-06, 5.295500159263611e-06, 5.525536835193634e-06, 5.755573511123657e-06, 5.98561018705368e-06, 6.215646862983704e-06, 6.445683538913727e-06, 6.67572021484375e-06]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 12.0, 14.0, 16.0, 23.0, 54.0, 90.0, 189.0, 453.0, 1315.0, 4822.0, 28572.0, 3979279.0, 166146.0, 9790.0, 2118.0, 741.0, 291.0, 134.0, 76.0, 32.0, 30.0, 20.0, 11.0, 11.0, 12.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -3.077089786529541e-05, -2.9474496841430664e-05, -2.8178095817565918e-05, -2.6881694793701172e-05, -2.5585293769836426e-05, -2.428889274597168e-05, -2.2992491722106934e-05, -2.1696090698242188e-05, -2.039968967437744e-05, -1.9103288650512695e-05, -1.780688762664795e-05, -1.6510486602783203e-05, -1.5214085578918457e-05, -1.3917684555053711e-05, -1.2621283531188965e-05, -1.1324882507324219e-05, -1.0028481483459473e-05, -8.732080459594727e-06, -7.4356794357299805e-06, -6.139278411865234e-06, -4.842877388000488e-06, -3.546476364135742e-06, -2.250075340270996e-06, -9.5367431640625e-07, 3.427267074584961e-07, 1.6391277313232422e-06, 2.9355287551879883e-06, 4.231929779052734e-06, 5.5283308029174805e-06, 6.8247318267822266e-06, 8.121132850646973e-06, 9.417533874511719e-06, 1.0713934898376465e-05, 1.2010335922241211e-05, 1.3306736946105957e-05, 1.4603137969970703e-05, 1.589953899383545e-05, 1.7195940017700195e-05, 1.849234104156494e-05, 1.9788742065429688e-05, 2.1085143089294434e-05, 2.238154411315918e-05, 2.3677945137023926e-05, 2.4974346160888672e-05, 2.6270747184753418e-05, 2.7567148208618164e-05, 2.886354923248291e-05, 3.0159950256347656e-05, 3.14563512802124e-05, 3.275275230407715e-05, 3.4049153327941895e-05, 3.534555435180664e-05, 3.664195537567139e-05, 3.793835639953613e-05, 3.923475742340088e-05, 4.0531158447265625e-05, 4.182755947113037e-05, 4.312396049499512e-05, 4.442036151885986e-05, 4.571676254272461e-05, 4.7013163566589355e-05, 4.83095645904541e-05, 4.960596561431885e-05, 5.0902366638183594e-05]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 11.0, 15.0, 5.0, 17.0, 25.0, 49.0, 56.0, 145.0, 454.0, 965.0, 1458.0, 412.0, 200.0, 66.0, 58.0, 31.0, 23.0, 24.0, 10.0, 8.0, 4.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.543231964111328e-06, -5.330890417098999e-06, -5.11854887008667e-06, -4.906207323074341e-06, -4.693865776062012e-06, -4.481524229049683e-06, -4.2691826820373535e-06, -4.056841135025024e-06, -3.844499588012695e-06, -3.632158041000366e-06, -3.419816493988037e-06, -3.207474946975708e-06, -2.995133399963379e-06, -2.78279185295105e-06, -2.5704503059387207e-06, -2.3581087589263916e-06, -2.1457672119140625e-06, -1.9334256649017334e-06, -1.7210841178894043e-06, -1.5087425708770752e-06, -1.296401023864746e-06, -1.084059476852417e-06, -8.717179298400879e-07, -6.593763828277588e-07, -4.470348358154297e-07, -2.3469328880310059e-07, -2.2351741790771484e-08, 1.8998980522155762e-07, 4.023313522338867e-07, 6.146728992462158e-07, 8.270144462585449e-07, 1.039355993270874e-06, 1.2516975402832031e-06, 1.4640390872955322e-06, 1.6763806343078613e-06, 1.8887221813201904e-06, 2.1010637283325195e-06, 2.3134052753448486e-06, 2.5257468223571777e-06, 2.738088369369507e-06, 2.950429916381836e-06, 3.162771463394165e-06, 3.375113010406494e-06, 3.5874545574188232e-06, 3.7997961044311523e-06, 4.0121376514434814e-06, 4.2244791984558105e-06, 4.43682074546814e-06, 4.649162292480469e-06, 4.861503839492798e-06, 5.073845386505127e-06, 5.286186933517456e-06, 5.498528480529785e-06, 5.710870027542114e-06, 5.923211574554443e-06, 6.1355531215667725e-06, 6.3478946685791016e-06, 6.560236215591431e-06, 6.77257776260376e-06, 6.984919309616089e-06, 7.197260856628418e-06, 7.409602403640747e-06, 7.621943950653076e-06, 7.834285497665405e-06, 8.046627044677734e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 11.0, 15.0, 15.0, 28.0, 37.0, 49.0, 99.0, 141.0, 166.0, 144.0, 97.0, 55.0, 38.0, 32.0, 23.0, 14.0, 11.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2486548257584218e-05, -1.1811855983978603e-05, -1.1137162800878286e-05, -1.0462470527272671e-05, -9.787778253667057e-06, -9.11308507056674e-06, -8.438392796961125e-06, -7.763699613860808e-06, -7.089007340255193e-06, -6.414314611902228e-06, -5.739621883549262e-06, -5.064929609943647e-06, -4.390236881590681e-06, -3.7155441532377154e-06, -3.0408518796321005e-06, -2.3661591512791347e-06, -1.6914664229261689e-06, -1.0167738082600408e-06, -3.4208119359391276e-07, 3.326113073853776e-07, 1.0073040357383434e-06, 1.6819967640913092e-06, 2.356689037696924e-06, 3.03138176604989e-06, 3.7060744944028556e-06, 4.380767222755821e-06, 5.055459951108787e-06, 5.730152224714402e-06, 6.404844953067368e-06, 7.079537681420334e-06, 7.754229955025949e-06, 8.428922228631563e-06, 9.103616321226582e-06, 9.778308594832197e-06, 1.0453001777932514e-05, 1.1127694051538128e-05, 1.1802387234638445e-05, 1.247707950824406e-05, 1.3151771781849675e-05, 1.382646405545529e-05, 1.4501157238555606e-05, 1.5175849512161221e-05, 1.5850542695261538e-05, 1.6525234968867153e-05, 1.7199927242472768e-05, 1.7874619516078383e-05, 1.8549311789683998e-05, 1.9224005882279016e-05, 1.989869815588463e-05, 2.0573390429490246e-05, 2.124808270309586e-05, 2.192277679569088e-05, 2.2597469069296494e-05, 2.327216134290211e-05, 2.3946853616507724e-05, 2.462154589011334e-05, 2.5296238163718954e-05, 2.597093043732457e-05, 2.6645622710930184e-05, 2.73203149845358e-05, 2.7995009077130817e-05, 2.8669701350736432e-05, 2.9344393624342047e-05, 3.001908589794766e-05, 3.069377999054268e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 8.0, 4.0, 16.0, 13.0, 16.0, 16.0, 18.0, 14.0, 27.0, 27.0, 32.0, 34.0, 27.0, 28.0, 30.0, 39.0, 41.0, 44.0, 45.0, 40.0, 38.0, 39.0, 44.0, 40.0, 36.0, 24.0, 27.0, 35.0, 29.0, 23.0, 28.0, 15.0, 11.0, 12.0, 14.0, 16.0, 12.0, 4.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.288695426017512e-06, -8.024278031371068e-06, -7.759860636724625e-06, -7.4954427873308305e-06, -7.231025392684387e-06, -6.966607543290593e-06, -6.702190148644149e-06, -6.437772753997706e-06, -6.1733553593512625e-06, -5.908937964704819e-06, -5.644520115311025e-06, -5.380102720664581e-06, -5.115685326018138e-06, -4.8512674766243435e-06, -4.5868500819779e-06, -4.322432687331457e-06, -4.058014837937662e-06, -3.7935972159175435e-06, -3.5291798212711e-06, -3.264762199250981e-06, -3.0003448046045378e-06, -2.735927182584419e-06, -2.4715095605643e-06, -2.2070921659178566e-06, -1.9426745438977377e-06, -1.6782570355644566e-06, -1.4138395272311755e-06, -1.1494219052110566e-06, -8.850043968777754e-07, -6.205868885444943e-07, -3.561692665243754e-07, -9.175175819109427e-08, 1.7266575014218688e-07, 4.3708328689717746e-07, 7.01500823652168e-07, 9.65918388828868e-07, 1.2303358971621492e-06, 1.4947534054954303e-06, 1.7591710275155492e-06, 2.0235884221619926e-06, 2.2880060441821115e-06, 2.5524236662022304e-06, 2.816841060848674e-06, 3.0812586828687927e-06, 3.3456763048889115e-06, 3.610093699535355e-06, 3.874511094181798e-06, 4.138928943575593e-06, 4.403346338222036e-06, 4.6677637328684796e-06, 4.932181582262274e-06, 5.196598976908717e-06, 5.461016371555161e-06, 5.725433766201604e-06, 5.9898516155953985e-06, 6.254269010241842e-06, 6.518686859635636e-06, 6.78310425428208e-06, 7.047522103675874e-06, 7.311939498322317e-06, 7.576356892968761e-06, 7.840774742362555e-06, 8.105192137008999e-06, 8.369609531655442e-06, 8.634026926301885e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 14.0, 9.0, 15.0, 39.0, 23.0, 34.0, 119.0, 64.0, 90.0, 294.0, 276.0, 974.0, 928.0, 1604.0, 9562.0, 17332.0, 87899.0, 897497.0, 17671.0, 6411.0, 4666.0, 964.0, 1005.0, 283.0, 197.0, 233.0, 65.0, 51.0, 79.0, 28.0, 23.0, 29.0, 15.0, 13.0, 14.0, 3.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.682209014892578e-06, -2.6011839509010315e-06, -2.520158886909485e-06, -2.4391338229179382e-06, -2.3581087589263916e-06, -2.277083694934845e-06, -2.1960586309432983e-06, -2.1150335669517517e-06, -2.034008502960205e-06, -1.9529834389686584e-06, -1.8719583749771118e-06, -1.7909333109855652e-06, -1.7099082469940186e-06, -1.628883183002472e-06, -1.5478581190109253e-06, -1.4668330550193787e-06, -1.385807991027832e-06, -1.3047829270362854e-06, -1.2237578630447388e-06, -1.1427327990531921e-06, -1.0617077350616455e-06, -9.806826710700989e-07, -8.996576070785522e-07, -8.186325430870056e-07, -7.37607479095459e-07, -6.565824151039124e-07, -5.755573511123657e-07, -4.945322871208191e-07, -4.1350722312927246e-07, -3.3248215913772583e-07, -2.514570951461792e-07, -1.7043203115463257e-07, -8.940696716308594e-08, -8.381903171539307e-09, 7.264316082000732e-08, 1.5366822481155396e-07, 2.3469328880310059e-07, 3.157183527946472e-07, 3.9674341678619385e-07, 4.777684807777405e-07, 5.587935447692871e-07, 6.398186087608337e-07, 7.208436727523804e-07, 8.01868736743927e-07, 8.828938007354736e-07, 9.639188647270203e-07, 1.044943928718567e-06, 1.1259689927101135e-06, 1.2069940567016602e-06, 1.2880191206932068e-06, 1.3690441846847534e-06, 1.4500692486763e-06, 1.5310943126678467e-06, 1.6121193766593933e-06, 1.69314444065094e-06, 1.7741695046424866e-06, 1.8551945686340332e-06, 1.93621963262558e-06, 2.0172446966171265e-06, 2.098269760608673e-06, 2.1792948246002197e-06, 2.2603198885917664e-06, 2.341344952583313e-06, 2.4223700165748596e-06, 2.5033950805664062e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 9.0, 13.0, 13.0, 12.0, 18.0, 21.0, 21.0, 28.0, 35.0, 36.0, 40.0, 44.0, 44.0, 45.0, 42.0, 62.0, 54.0, 50.0, 71.0, 30.0, 37.0, 32.0, 33.0, 50.0, 25.0, 20.0, 27.0, 10.0, 16.0, 9.0, 18.0, 6.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.342306733131409e-06, -6.128102540969849e-06, -5.9138983488082886e-06, -5.6996941566467285e-06, -5.4854899644851685e-06, -5.271285772323608e-06, -5.057081580162048e-06, -4.842877388000488e-06, -4.628673195838928e-06, -4.414469003677368e-06, -4.200264811515808e-06, -3.986060619354248e-06, -3.771856427192688e-06, -3.557652235031128e-06, -3.343448042869568e-06, -3.129243850708008e-06, -2.9150396585464478e-06, -2.7008354663848877e-06, -2.4866312742233276e-06, -2.2724270820617676e-06, -2.0582228899002075e-06, -1.8440186977386475e-06, -1.6298145055770874e-06, -1.4156103134155273e-06, -1.2014061212539673e-06, -9.872019290924072e-07, -7.729977369308472e-07, -5.587935447692871e-07, -3.4458935260772705e-07, -1.30385160446167e-07, 8.381903171539307e-08, 2.980232238769531e-07, 5.122274160385132e-07, 7.264316082000732e-07, 9.406358003616333e-07, 1.1548399925231934e-06, 1.3690441846847534e-06, 1.5832483768463135e-06, 1.7974525690078735e-06, 2.0116567611694336e-06, 2.2258609533309937e-06, 2.4400651454925537e-06, 2.6542693376541138e-06, 2.868473529815674e-06, 3.082677721977234e-06, 3.296881914138794e-06, 3.511086106300354e-06, 3.725290298461914e-06, 3.939494490623474e-06, 4.153698682785034e-06, 4.367902874946594e-06, 4.582107067108154e-06, 4.796311259269714e-06, 5.010515451431274e-06, 5.2247196435928345e-06, 5.4389238357543945e-06, 5.653128027915955e-06, 5.867332220077515e-06, 6.081536412239075e-06, 6.295740604400635e-06, 6.509944796562195e-06, 6.724148988723755e-06, 6.938353180885315e-06, 7.152557373046875e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 5.0, 0.0, 0.0, 18.0, 0.0, 0.0, 35.0, 0.0, 0.0, 89.0, 0.0, 0.0, 194.0, 0.0, 505.0, 0.0, 0.0, 9321.0, 0.0, 0.0, 1028126.0, 0.0, 0.0, 9411.0, 0.0, 499.0, 0.0, 0.0, 199.0, 0.0, 0.0, 94.0, 0.0, 0.0, 41.0, 0.0, 0.0, 19.0, 0.0, 7.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.938353180885315e-07, -6.724148988723755e-07, -6.509944796562195e-07, -6.295740604400635e-07, -6.081536412239075e-07, -5.867332220077515e-07, -5.653128027915955e-07, -5.438923835754395e-07, -5.224719643592834e-07, -5.010515451431274e-07, -4.796311259269714e-07, -4.5821070671081543e-07, -4.367902874946594e-07, -4.153698682785034e-07, -3.939494490623474e-07, -3.725290298461914e-07, -3.511086106300354e-07, -3.296881914138794e-07, -3.082677721977234e-07, -2.868473529815674e-07, -2.654269337654114e-07, -2.4400651454925537e-07, -2.2258609533309937e-07, -2.0116567611694336e-07, -1.7974525690078735e-07, -1.5832483768463135e-07, -1.3690441846847534e-07, -1.1548399925231934e-07, -9.406358003616333e-08, -7.264316082000732e-08, -5.122274160385132e-08, -2.9802322387695312e-08, -8.381903171539307e-09, 1.30385160446167e-08, 3.4458935260772705e-08, 5.587935447692871e-08, 7.729977369308472e-08, 9.872019290924072e-08, 1.2014061212539673e-07, 1.4156103134155273e-07, 1.6298145055770874e-07, 1.8440186977386475e-07, 2.0582228899002075e-07, 2.2724270820617676e-07, 2.4866312742233276e-07, 2.7008354663848877e-07, 2.915039658546448e-07, 3.129243850708008e-07, 3.343448042869568e-07, 3.557652235031128e-07, 3.771856427192688e-07, 3.986060619354248e-07, 4.200264811515808e-07, 4.414469003677368e-07, 4.628673195838928e-07, 4.842877388000488e-07, 5.057081580162048e-07, 5.271285772323608e-07, 5.485489964485168e-07, 5.699694156646729e-07, 5.913898348808289e-07, 6.128102540969849e-07, 6.342306733131409e-07, 6.556510925292969e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 5.0, 12.0, 17.0, 19.0, 29.0, 25.0, 33.0, 27.0, 42.0, 47.0, 37.0, 45.0, 47.0, 67.0, 59.0, 55.0, 40.0, 53.0, 55.0, 28.0, 52.0, 33.0, 24.0, 23.0, 21.0, 19.0, 13.0, 15.0, 9.0, 10.0, 8.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.751817762851715e-05, -1.6976147890090942e-05, -1.6434118151664734e-05, -1.5892088413238525e-05, -1.5350058674812317e-05, -1.4808028936386108e-05, -1.42659991979599e-05, -1.3723969459533691e-05, -1.3181939721107483e-05, -1.2639909982681274e-05, -1.2097880244255066e-05, -1.1555850505828857e-05, -1.1013820767402649e-05, -1.047179102897644e-05, -9.929761290550232e-06, -9.387731552124023e-06, -8.845701813697815e-06, -8.303672075271606e-06, -7.761642336845398e-06, -7.2196125984191895e-06, -6.677582859992981e-06, -6.1355531215667725e-06, -5.593523383140564e-06, -5.0514936447143555e-06, -4.509463906288147e-06, -3.9674341678619385e-06, -3.42540442943573e-06, -2.8833746910095215e-06, -2.341344952583313e-06, -1.7993152141571045e-06, -1.257285475730896e-06, -7.152557373046875e-07, -1.73225998878479e-07, 3.688037395477295e-07, 9.10833477973938e-07, 1.4528632164001465e-06, 1.994892954826355e-06, 2.5369226932525635e-06, 3.078952431678772e-06, 3.6209821701049805e-06, 4.163011908531189e-06, 4.7050416469573975e-06, 5.247071385383606e-06, 5.7891011238098145e-06, 6.331130862236023e-06, 6.8731606006622314e-06, 7.41519033908844e-06, 7.957220077514648e-06, 8.499249815940857e-06, 9.041279554367065e-06, 9.583309292793274e-06, 1.0125339031219482e-05, 1.0667368769645691e-05, 1.12093985080719e-05, 1.1751428246498108e-05, 1.2293457984924316e-05, 1.2835487723350525e-05, 1.3377517461776733e-05, 1.3919547200202942e-05, 1.446157693862915e-05, 1.5003606677055359e-05, 1.5545636415481567e-05, 1.6087666153907776e-05, 1.6629695892333984e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 124.0, 0.0, 0.0, 0.0, 0.0, 625.0, 0.0, 0.0, 0.0, 0.0, 121.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 15.0, 29.0, 46.0, 121.0, 313.0, 289.0, 109.0, 45.0, 26.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4162338629830629e-05, -1.3277227481012233e-05, -1.2392116332193837e-05, -1.150700518337544e-05, -1.0621894034557045e-05, -9.736782885738648e-06, -8.851671736920252e-06, -7.966560588101856e-06, -7.0814489845361095e-06, -6.1963378357177135e-06, -5.3112266868993174e-06, -4.4261150833335705e-06, -3.54100416188885e-06, -2.6558927856967784e-06, -1.7707816368783824e-06, -8.856704880599864e-07, -5.593392415903509e-10, 8.845518664202245e-07, 1.7696630720820394e-06, 2.654774334587273e-06, 3.5398854834056692e-06, 4.424996859597741e-06, 5.310108008416137e-06, 6.195219157234533e-06, 7.080330306052929e-06, 7.965441909618676e-06, 8.850553058437072e-06, 9.735664207255468e-06, 1.0620775356073864e-05, 1.150588650489226e-05, 1.2390997653710656e-05, 1.3276108802529052e-05, 1.4161219951347448e-05, 1.5046331100165844e-05, 1.593144224898424e-05, 1.6816553397802636e-05, 1.7701664546621032e-05, 1.8586775695439428e-05, 1.9471886844257824e-05, 2.035699799307622e-05, 2.1242109141894616e-05, 2.2127220290713012e-05, 2.3012331439531408e-05, 2.3897442588349804e-05, 2.47825537371682e-05, 2.5667664885986596e-05, 2.6552776034804992e-05, 2.743788718362339e-05, 2.8323000151431188e-05, 2.9208111300249584e-05, 3.009322244906798e-05, 3.097833541687578e-05, 3.186344474670477e-05, 3.274855771451257e-05, 3.3633667044341564e-05, 3.4518780012149364e-05, 3.5403889341978356e-05, 3.6289002309786156e-05, 3.717411163961515e-05, 3.805922460742295e-05, 3.894433393725194e-05, 3.982944690505974e-05, 4.071455623488873e-05, 4.159966920269653e-05, 4.2484778532525524e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 2.0, 11.0, 13.0, 16.0, 13.0, 16.0, 14.0, 21.0, 21.0, 26.0, 34.0, 36.0, 33.0, 30.0, 38.0, 43.0, 39.0, 57.0, 42.0, 37.0, 49.0, 46.0, 34.0, 29.0, 40.0, 24.0, 38.0, 38.0, 29.0, 20.0, 22.0, 8.0, 9.0, 15.0, 13.0, 11.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8184119805227965e-06, -4.643654847313883e-06, -4.468897259357618e-06, -4.2941401261487044e-06, -4.119382992939791e-06, -3.944625859730877e-06, -3.7698682717746124e-06, -3.5951111385656986e-06, -3.420354005356785e-06, -3.2455966447741957e-06, -3.070839511565282e-06, -2.896082150982693e-06, -2.721325017773779e-06, -2.54656765719119e-06, -2.3718102966086008e-06, -2.197053163399687e-06, -2.022295802817098e-06, -1.8475385559213464e-06, -1.672781309025595e-06, -1.4980239484430058e-06, -1.323266815234092e-06, -1.1485094546515029e-06, -9.737522077557514e-07, -7.9899496086e-07, -6.242377139642485e-07, -4.494804670684971e-07, -2.747231917510362e-07, -9.996591643357533e-08, 7.479133046217612e-08, 2.4954857735792757e-07, 4.243058810970979e-07, 5.990631279928493e-07, 7.738203748886008e-07, 9.485776217843522e-07, 1.1233348686801037e-06, 1.2980922292626929e-06, 1.4728493624716066e-06, 1.6476067230541958e-06, 1.8223639699499472e-06, 1.9971212168456987e-06, 2.1718783500546124e-06, 2.3466357106372016e-06, 2.5213928438461153e-06, 2.6961502044287045e-06, 2.870907337637618e-06, 3.0456646982202074e-06, 3.2204220588027965e-06, 3.3951791920117103e-06, 3.5699365525942994e-06, 3.7446939131768886e-06, 3.919451046385802e-06, 4.094208179594716e-06, 4.268965767550981e-06, 4.443722900759894e-06, 4.618480033968808e-06, 4.793237167177722e-06, 4.9679947551339865e-06, 5.1427518883429e-06, 5.317509476299165e-06, 5.4922666095080785e-06, 5.667023742716992e-06, 5.841780875925906e-06, 6.016538463882171e-06, 6.191295597091084e-06, 6.366052730299998e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 12.0, 14.0, 21.0, 37.0, 40.0, 51.0, 121.0, 111.0, 202.0, 298.0, 456.0, 790.0, 1113.0, 2204.0, 3131.0, 5623.0, 12484.0, 20219.0, 52972.0, 120656.0, 490605.0, 222076.0, 55726.0, 29892.0, 11980.0, 8076.0, 3671.0, 2102.0, 1539.0, 797.0, 551.0, 310.0, 227.0, 159.0, 80.0, 65.0, 40.0, 18.0, 27.0, 22.0, 10.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0192394256591797e-05, -9.870156645774841e-06, -9.547919034957886e-06, -9.22568142414093e-06, -8.903443813323975e-06, -8.581206202507019e-06, -8.258968591690063e-06, -7.936730980873108e-06, -7.614493370056152e-06, -7.292255759239197e-06, -6.970018148422241e-06, -6.647780537605286e-06, -6.32554292678833e-06, -6.0033053159713745e-06, -5.681067705154419e-06, -5.358830094337463e-06, -5.036592483520508e-06, -4.714354872703552e-06, -4.392117261886597e-06, -4.069879651069641e-06, -3.7476420402526855e-06, -3.42540442943573e-06, -3.1031668186187744e-06, -2.780929207801819e-06, -2.4586915969848633e-06, -2.1364539861679077e-06, -1.8142163753509521e-06, -1.4919787645339966e-06, -1.169741153717041e-06, -8.475035429000854e-07, -5.252659320831299e-07, -2.0302832126617432e-07, 1.1920928955078125e-07, 4.414469003677368e-07, 7.636845111846924e-07, 1.085922122001648e-06, 1.4081597328186035e-06, 1.730397343635559e-06, 2.0526349544525146e-06, 2.3748725652694702e-06, 2.6971101760864258e-06, 3.0193477869033813e-06, 3.341585397720337e-06, 3.6638230085372925e-06, 3.986060619354248e-06, 4.308298230171204e-06, 4.630535840988159e-06, 4.952773451805115e-06, 5.27501106262207e-06, 5.597248673439026e-06, 5.9194862842559814e-06, 6.241723895072937e-06, 6.563961505889893e-06, 6.886199116706848e-06, 7.208436727523804e-06, 7.530674338340759e-06, 7.852911949157715e-06, 8.17514955997467e-06, 8.497387170791626e-06, 8.819624781608582e-06, 9.141862392425537e-06, 9.464100003242493e-06, 9.786337614059448e-06, 1.0108575224876404e-05, 1.043081283569336e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 6.0, 7.0, 10.0, 13.0, 18.0, 24.0, 27.0, 29.0, 36.0, 35.0, 46.0, 47.0, 49.0, 55.0, 56.0, 57.0, 60.0, 54.0, 52.0, 41.0, 37.0, 35.0, 28.0, 34.0, 30.0, 24.0, 16.0, 12.0, 11.0, 10.0, 8.0, 4.0, 5.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4616718292236328e-05, -2.3937784135341644e-05, -2.325884997844696e-05, -2.2579915821552277e-05, -2.1900981664657593e-05, -2.122204750776291e-05, -2.0543113350868225e-05, -1.986417919397354e-05, -1.9185245037078857e-05, -1.8506310880184174e-05, -1.782737672328949e-05, -1.7148442566394806e-05, -1.6469508409500122e-05, -1.5790574252605438e-05, -1.5111640095710754e-05, -1.443270593881607e-05, -1.3753771781921387e-05, -1.3074837625026703e-05, -1.2395903468132019e-05, -1.1716969311237335e-05, -1.1038035154342651e-05, -1.0359100997447968e-05, -9.680166840553284e-06, -9.0012326836586e-06, -8.322298526763916e-06, -7.643364369869232e-06, -6.964430212974548e-06, -6.2854960560798645e-06, -5.606561899185181e-06, -4.927627742290497e-06, -4.248693585395813e-06, -3.569759428501129e-06, -2.8908252716064453e-06, -2.2118911147117615e-06, -1.5329569578170776e-06, -8.540228009223938e-07, -1.7508864402770996e-07, 5.038455128669739e-07, 1.1827796697616577e-06, 1.8617138266563416e-06, 2.5406479835510254e-06, 3.2195821404457092e-06, 3.898516297340393e-06, 4.577450454235077e-06, 5.256384611129761e-06, 5.935318768024445e-06, 6.614252924919128e-06, 7.293187081813812e-06, 7.972121238708496e-06, 8.65105539560318e-06, 9.329989552497864e-06, 1.0008923709392548e-05, 1.0687857866287231e-05, 1.1366792023181915e-05, 1.2045726180076599e-05, 1.2724660336971283e-05, 1.3403594493865967e-05, 1.408252865076065e-05, 1.4761462807655334e-05, 1.544039696455002e-05, 1.6119331121444702e-05, 1.6798265278339386e-05, 1.747719943523407e-05, 1.8156133592128754e-05, 1.8835067749023438e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 15.0, 20.0, 27.0, 26.0, 50.0, 73.0, 102.0, 211.0, 488.0, 1784.0, 30800.0, 999165.0, 13538.0, 1357.0, 410.0, 167.0, 109.0, 65.0, 34.0, 32.0, 21.0, 13.0, 11.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.958578109741211e-05, -8.698180317878723e-05, -8.437782526016235e-05, -8.177384734153748e-05, -7.91698694229126e-05, -7.656589150428772e-05, -7.396191358566284e-05, -7.135793566703796e-05, -6.875395774841309e-05, -6.614997982978821e-05, -6.354600191116333e-05, -6.094202399253845e-05, -5.8338046073913574e-05, -5.5734068155288696e-05, -5.313009023666382e-05, -5.052611231803894e-05, -4.792213439941406e-05, -4.5318156480789185e-05, -4.271417856216431e-05, -4.011020064353943e-05, -3.750622272491455e-05, -3.490224480628967e-05, -3.2298266887664795e-05, -2.9694288969039917e-05, -2.709031105041504e-05, -2.448633313179016e-05, -2.1882355213165283e-05, -1.9278377294540405e-05, -1.6674399375915527e-05, -1.407042145729065e-05, -1.1466443538665771e-05, -8.862465620040894e-06, -6.258487701416016e-06, -3.6545097827911377e-06, -1.0505318641662598e-06, 1.5534460544586182e-06, 4.157423973083496e-06, 6.761401891708374e-06, 9.365379810333252e-06, 1.196935772895813e-05, 1.4573335647583008e-05, 1.7177313566207886e-05, 1.9781291484832764e-05, 2.238526940345764e-05, 2.498924732208252e-05, 2.7593225240707397e-05, 3.0197203159332275e-05, 3.280118107795715e-05, 3.540515899658203e-05, 3.800913691520691e-05, 4.061311483383179e-05, 4.3217092752456665e-05, 4.582107067108154e-05, 4.842504858970642e-05, 5.10290265083313e-05, 5.363300442695618e-05, 5.6236982345581055e-05, 5.884096026420593e-05, 6.144493818283081e-05, 6.404891610145569e-05, 6.665289402008057e-05, 6.925687193870544e-05, 7.186084985733032e-05, 7.44648277759552e-05, 7.706880569458008e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 11.0, 6.0, 12.0, 14.0, 18.0, 21.0, 30.0, 32.0, 54.0, 46.0, 51.0, 60.0, 60.0, 76.0, 77.0, 75.0, 53.0, 44.0, 49.0, 42.0, 40.0, 31.0, 19.0, 16.0, 13.0, 8.0, 6.0, 7.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.035234451293945e-05, -3.921985626220703e-05, -3.808736801147461e-05, -3.695487976074219e-05, -3.5822391510009766e-05, -3.4689903259277344e-05, -3.355741500854492e-05, -3.24249267578125e-05, -3.129243850708008e-05, -3.0159950256347656e-05, -2.9027462005615234e-05, -2.7894973754882812e-05, -2.676248550415039e-05, -2.562999725341797e-05, -2.4497509002685547e-05, -2.3365020751953125e-05, -2.2232532501220703e-05, -2.110004425048828e-05, -1.996755599975586e-05, -1.8835067749023438e-05, -1.7702579498291016e-05, -1.6570091247558594e-05, -1.5437602996826172e-05, -1.430511474609375e-05, -1.3172626495361328e-05, -1.2040138244628906e-05, -1.0907649993896484e-05, -9.775161743164062e-06, -8.64267349243164e-06, -7.510185241699219e-06, -6.377696990966797e-06, -5.245208740234375e-06, -4.112720489501953e-06, -2.9802322387695312e-06, -1.8477439880371094e-06, -7.152557373046875e-07, 4.172325134277344e-07, 1.5497207641601562e-06, 2.682209014892578e-06, 3.814697265625e-06, 4.947185516357422e-06, 6.079673767089844e-06, 7.212162017822266e-06, 8.344650268554688e-06, 9.47713851928711e-06, 1.0609626770019531e-05, 1.1742115020751953e-05, 1.2874603271484375e-05, 1.4007091522216797e-05, 1.5139579772949219e-05, 1.627206802368164e-05, 1.7404556274414062e-05, 1.8537044525146484e-05, 1.9669532775878906e-05, 2.0802021026611328e-05, 2.193450927734375e-05, 2.3066997528076172e-05, 2.4199485778808594e-05, 2.5331974029541016e-05, 2.6464462280273438e-05, 2.759695053100586e-05, 2.872943878173828e-05, 2.9861927032470703e-05, 3.0994415283203125e-05, 3.212690353393555e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 7.0, 0.0, 20.0, 0.0, 48.0, 0.0, 0.0, 415.0, 0.0, 9387.0, 0.0, 1028830.0, 0.0, 9335.0, 0.0, 431.0, 0.0, 47.0, 0.0, 22.0, 0.0, 11.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.853392839431763e-07, -9.57399606704712e-07, -9.294599294662476e-07, -9.015202522277832e-07, -8.735805749893188e-07, -8.456408977508545e-07, -8.177012205123901e-07, -7.897615432739258e-07, -7.618218660354614e-07, -7.338821887969971e-07, -7.059425115585327e-07, -6.780028343200684e-07, -6.50063157081604e-07, -6.221234798431396e-07, -5.941838026046753e-07, -5.662441253662109e-07, -5.383044481277466e-07, -5.103647708892822e-07, -4.824250936508179e-07, -4.544854164123535e-07, -4.2654573917388916e-07, -3.986060619354248e-07, -3.7066638469696045e-07, -3.427267074584961e-07, -3.1478703022003174e-07, -2.868473529815674e-07, -2.5890767574310303e-07, -2.3096799850463867e-07, -2.0302832126617432e-07, -1.7508864402770996e-07, -1.471489667892456e-07, -1.1920928955078125e-07, -9.12696123123169e-08, -6.332993507385254e-08, -3.5390257835388184e-08, -7.450580596923828e-09, 2.0489096641540527e-08, 4.842877388000488e-08, 7.636845111846924e-08, 1.043081283569336e-07, 1.3224780559539795e-07, 1.601874828338623e-07, 1.8812716007232666e-07, 2.1606683731079102e-07, 2.4400651454925537e-07, 2.7194619178771973e-07, 2.998858690261841e-07, 3.2782554626464844e-07, 3.557652235031128e-07, 3.8370490074157715e-07, 4.116445779800415e-07, 4.3958425521850586e-07, 4.675239324569702e-07, 4.954636096954346e-07, 5.234032869338989e-07, 5.513429641723633e-07, 5.792826414108276e-07, 6.07222318649292e-07, 6.351619958877563e-07, 6.631016731262207e-07, 6.910413503646851e-07, 7.189810276031494e-07, 7.469207048416138e-07, 7.748603820800781e-07]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [40.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 946.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.960464477539063e-08, -5.681067705154419e-08, -5.4016709327697754e-08, -5.122274160385132e-08, -4.842877388000488e-08, -4.563480615615845e-08, -4.284083843231201e-08, -4.0046870708465576e-08, -3.725290298461914e-08, -3.4458935260772705e-08, -3.166496753692627e-08, -2.8870999813079834e-08, -2.60770320892334e-08, -2.3283064365386963e-08, -2.0489096641540527e-08, -1.7695128917694092e-08, -1.4901161193847656e-08, -1.210719347000122e-08, -9.313225746154785e-09, -6.51925802230835e-09, -3.725290298461914e-09, -9.313225746154785e-10, 1.862645149230957e-09, 4.6566128730773926e-09, 7.450580596923828e-09, 1.0244548320770264e-08, 1.30385160446167e-08, 1.5832483768463135e-08, 1.862645149230957e-08, 2.1420419216156006e-08, 2.421438694000244e-08, 2.7008354663848877e-08, 2.9802322387695312e-08, 3.259629011154175e-08, 3.5390257835388184e-08, 3.818422555923462e-08, 4.0978193283081055e-08, 4.377216100692749e-08, 4.6566128730773926e-08, 4.936009645462036e-08, 5.21540641784668e-08, 5.494803190231323e-08, 5.774199962615967e-08, 6.05359673500061e-08, 6.332993507385254e-08, 6.612390279769897e-08, 6.891787052154541e-08, 7.171183824539185e-08, 7.450580596923828e-08, 7.729977369308472e-08, 8.009374141693115e-08, 8.288770914077759e-08, 8.568167686462402e-08, 8.847564458847046e-08, 9.12696123123169e-08, 9.406358003616333e-08, 9.685754776000977e-08, 9.96515154838562e-08, 1.0244548320770264e-07, 1.0523945093154907e-07, 1.0803341865539551e-07, 1.1082738637924194e-07, 1.1362135410308838e-07, 1.1641532182693481e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 7.0, 0.0, 4.0, 18.0, 0.0, 69.0, 227.0, 0.0, 1174.0, 14444.0, 1016671.0, 0.0, 14435.0, 1165.0, 0.0, 233.0, 69.0, 14.0, 0.0, 7.0, 2.0, 0.0, 3.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2097880244255066e-06, -1.16787850856781e-06, -1.1259689927101135e-06, -1.084059476852417e-06, -1.0421499609947205e-06, -1.000240445137024e-06, -9.583309292793274e-07, -9.164214134216309e-07, -8.745118975639343e-07, -8.326023817062378e-07, -7.906928658485413e-07, -7.487833499908447e-07, -7.068738341331482e-07, -6.649643182754517e-07, -6.230548024177551e-07, -5.811452865600586e-07, -5.392357707023621e-07, -4.973262548446655e-07, -4.55416738986969e-07, -4.1350722312927246e-07, -3.7159770727157593e-07, -3.296881914138794e-07, -2.8777867555618286e-07, -2.4586915969848633e-07, -2.039596438407898e-07, -1.6205012798309326e-07, -1.2014061212539673e-07, -7.82310962677002e-08, -3.632158041000366e-08, 5.587935447692871e-09, 4.7497451305389404e-08, 8.940696716308594e-08, 1.3131648302078247e-07, 1.73225998878479e-07, 2.1513551473617554e-07, 2.5704503059387207e-07, 2.989545464515686e-07, 3.4086406230926514e-07, 3.8277357816696167e-07, 4.246830940246582e-07, 4.6659260988235474e-07, 5.085021257400513e-07, 5.504116415977478e-07, 5.923211574554443e-07, 6.342306733131409e-07, 6.761401891708374e-07, 7.180497050285339e-07, 7.599592208862305e-07, 8.01868736743927e-07, 8.437782526016235e-07, 8.856877684593201e-07, 9.275972843170166e-07, 9.695068001747131e-07, 1.0114163160324097e-06, 1.0533258318901062e-06, 1.0952353477478027e-06, 1.1371448636054993e-06, 1.1790543794631958e-06, 1.2209638953208923e-06, 1.2628734111785889e-06, 1.3047829270362854e-06, 1.346692442893982e-06, 1.3886019587516785e-06, 1.430511474609375e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 801.0, 0.0, 0.0, 0.0, 0.0, 72.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.0512531995773315e-07, -3.9301812648773193e-07, -3.809109330177307e-07, -3.688037395477295e-07, -3.5669654607772827e-07, -3.4458935260772705e-07, -3.3248215913772583e-07, -3.203749656677246e-07, -3.082677721977234e-07, -2.9616057872772217e-07, -2.8405338525772095e-07, -2.7194619178771973e-07, -2.598389983177185e-07, -2.477318048477173e-07, -2.3562461137771606e-07, -2.2351741790771484e-07, -2.1141022443771362e-07, -1.993030309677124e-07, -1.8719583749771118e-07, -1.7508864402770996e-07, -1.6298145055770874e-07, -1.5087425708770752e-07, -1.387670636177063e-07, -1.2665987014770508e-07, -1.1455267667770386e-07, -1.0244548320770264e-07, -9.033828973770142e-08, -7.82310962677002e-08, -6.612390279769897e-08, -5.4016709327697754e-08, -4.190951585769653e-08, -2.9802322387695312e-08, -1.7695128917694092e-08, -5.587935447692871e-09, 6.51925802230835e-09, 1.862645149230957e-08, 3.073364496231079e-08, 4.284083843231201e-08, 5.494803190231323e-08, 6.705522537231445e-08, 7.916241884231567e-08, 9.12696123123169e-08, 1.0337680578231812e-07, 1.1548399925231934e-07, 1.2759119272232056e-07, 1.3969838619232178e-07, 1.51805579662323e-07, 1.6391277313232422e-07, 1.7601996660232544e-07, 1.8812716007232666e-07, 2.0023435354232788e-07, 2.123415470123291e-07, 2.2444874048233032e-07, 2.3655593395233154e-07, 2.4866312742233276e-07, 2.60770320892334e-07, 2.728775143623352e-07, 2.849847078323364e-07, 2.9709190130233765e-07, 3.0919909477233887e-07, 3.213062882423401e-07, 3.334134817123413e-07, 3.4552067518234253e-07, 3.5762786865234375e-07]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 20.0, 130.0, 638.0, 182.0, 34.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020560156553983688, -0.00020161608699709177, -0.00019763060845434666, -0.00019364512991160154, -0.00018965965136885643, -0.0001856741582741961, -0.00018168867973145097, -0.00017770320118870586, -0.00017371772264596075, -0.00016973224410321563, -0.00016574676556047052, -0.0001617612870177254, -0.00015777579392306507, -0.00015379031538031995, -0.00014980483683757484, -0.00014581935829482973, -0.0001418338797520846, -0.0001378484012093395, -0.00013386292266659439, -0.00012987744412384927, -0.00012589196558110416, -0.00012190647976240143, -0.0001179209939436987, -0.00011393551540095359, -0.00010995003685820848, -0.00010596455831546336, -0.00010197907977271825, -9.799359395401552e-05, -9.400811541127041e-05, -9.00226368685253e-05, -8.603715104982257e-05, -8.205167250707746e-05, -7.806620851624757e-05, -7.408072997350246e-05, -7.009525143075734e-05, -6.610976561205462e-05, -6.21242870693095e-05, -5.813880852656439e-05, -5.415332634584047e-05, -5.016784416511655e-05, -4.618236198439263e-05, -4.219687980366871e-05, -3.8211401260923594e-05, -3.422592271817848e-05, -3.024044053745456e-05, -2.6254960175720043e-05, -2.2269479813985527e-05, -1.828399945225101e-05, -1.4298519090516493e-05, -1.0313038728781976e-05, -6.327558367047459e-06, -2.342078005312942e-06, 1.643402356421575e-06, 5.628882718156092e-06, 9.614363079890609e-06, 1.3599843441625126e-05, 1.7585323803359643e-05, 2.157080416509416e-05, 2.5556284526828676e-05, 2.9541764888563193e-05, 3.352724525029771e-05, 3.751272743102163e-05, 4.1498205973766744e-05, 4.548368451651186e-05, 4.946916669723578e-05]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 9.0, 7.0, 9.0, 8.0, 19.0, 18.0, 11.0, 21.0, 19.0, 19.0, 25.0, 32.0, 37.0, 41.0, 45.0, 41.0, 49.0, 42.0, 50.0, 50.0, 50.0, 42.0, 46.0, 34.0, 32.0, 38.0, 30.0, 19.0, 27.0, 22.0, 22.0, 22.0, 21.0, 7.0, 9.0, 5.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.583987174555659e-05, -4.447176252142526e-05, -4.310365329729393e-05, -4.17355440731626e-05, -4.036743484903127e-05, -3.8999329262878746e-05, -3.763121640076861e-05, -3.6263110814616084e-05, -3.489500159048475e-05, -3.352689236635342e-05, -3.215878314222209e-05, -3.079067391809076e-05, -2.9422566512948833e-05, -2.8054457288817503e-05, -2.6686348064686172e-05, -2.5318240659544244e-05, -2.395012961642351e-05, -2.258202039229218e-05, -2.121391116816085e-05, -1.984580376301892e-05, -1.847769453888759e-05, -1.710958531475626e-05, -1.574147609062493e-05, -1.43733677759883e-05, -1.3005258551856969e-05, -1.1637149327725638e-05, -1.0269041013089009e-05, -8.900931788957678e-06, -7.532823019573698e-06, -6.164714250189718e-06, -4.796605026058387e-06, -3.428496711421758e-06, -2.060387487290427e-06, -6.922786042196094e-07, 6.758302788512083e-07, 2.0439392756088637e-06, 3.4120480449928436e-06, 4.780156814376824e-06, 6.1482660385081545e-06, 7.5163743531447835e-06, 8.884483577276114e-06, 1.0252592801407445e-05, 1.1620701116044074e-05, 1.2988810340175405e-05, 1.4356919564306736e-05, 1.5725028788438067e-05, 1.7093138012569398e-05, 1.8461245417711325e-05, 1.9829354641842656e-05, 2.1197463865973987e-05, 2.2565573090105318e-05, 2.3933680495247245e-05, 2.5301789719378576e-05, 2.6669898943509907e-05, 2.8038008167641237e-05, 2.9406117391772568e-05, 3.07742266159039e-05, 3.214233584003523e-05, 3.351044506416656e-05, 3.487855428829789e-05, 3.624666351242922e-05, 3.761477273656055e-05, 3.898287832271308e-05, 4.035098754684441e-05, 4.171909677097574e-05]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 10.0, 1.0, 3.0, 2.0, 4.0, 8.0, 26.0, 11.0, 11.0, 32.0, 27.0, 125.0, 69.0, 79.0, 115.0, 199.0, 518.0, 490.0, 994.0, 2200.0, 6316.0, 1237207.0, 2934809.0, 6206.0, 2188.0, 962.0, 449.0, 518.0, 178.0, 107.0, 99.0, 66.0, 136.0, 31.0, 25.0, 11.0, 9.0, 11.0, 29.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4928321838378906e-05, -3.3836811780929565e-05, -3.2745301723480225e-05, -3.1653791666030884e-05, -3.056228160858154e-05, -2.9470771551132202e-05, -2.837926149368286e-05, -2.728775143623352e-05, -2.619624137878418e-05, -2.510473132133484e-05, -2.4013221263885498e-05, -2.2921711206436157e-05, -2.1830201148986816e-05, -2.0738691091537476e-05, -1.9647181034088135e-05, -1.8555670976638794e-05, -1.7464160919189453e-05, -1.6372650861740112e-05, -1.528114080429077e-05, -1.418963074684143e-05, -1.309812068939209e-05, -1.2006610631942749e-05, -1.0915100574493408e-05, -9.823590517044067e-06, -8.732080459594727e-06, -7.640570402145386e-06, -6.549060344696045e-06, -5.457550287246704e-06, -4.366040229797363e-06, -3.2745301723480225e-06, -2.1830201148986816e-06, -1.0915100574493408e-06, 0.0, 1.0915100574493408e-06, 2.1830201148986816e-06, 3.2745301723480225e-06, 4.366040229797363e-06, 5.457550287246704e-06, 6.549060344696045e-06, 7.640570402145386e-06, 8.732080459594727e-06, 9.823590517044067e-06, 1.0915100574493408e-05, 1.2006610631942749e-05, 1.309812068939209e-05, 1.418963074684143e-05, 1.528114080429077e-05, 1.6372650861740112e-05, 1.7464160919189453e-05, 1.8555670976638794e-05, 1.9647181034088135e-05, 2.0738691091537476e-05, 2.1830201148986816e-05, 2.2921711206436157e-05, 2.4013221263885498e-05, 2.510473132133484e-05, 2.619624137878418e-05, 2.728775143623352e-05, 2.837926149368286e-05, 2.9470771551132202e-05, 3.056228160858154e-05, 3.1653791666030884e-05, 3.2745301723480225e-05, 3.3836811780929565e-05, 3.4928321838378906e-05]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 12.0, 11.0, 15.0, 11.0, 17.0, 26.0, 28.0, 32.0, 30.0, 30.0, 43.0, 45.0, 50.0, 37.0, 47.0, 50.0, 51.0, 67.0, 54.0, 50.0, 49.0, 34.0, 17.0, 34.0, 26.0, 21.0, 25.0, 17.0, 10.0, 12.0, 8.0, 10.0, 10.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-6.67572021484375e-06, -6.5034255385398865e-06, -6.331130862236023e-06, -6.1588361859321594e-06, -5.986541509628296e-06, -5.814246833324432e-06, -5.641952157020569e-06, -5.469657480716705e-06, -5.297362804412842e-06, -5.125068128108978e-06, -4.952773451805115e-06, -4.780478775501251e-06, -4.608184099197388e-06, -4.435889422893524e-06, -4.263594746589661e-06, -4.091300070285797e-06, -3.919005393981934e-06, -3.74671071767807e-06, -3.5744160413742065e-06, -3.402121365070343e-06, -3.2298266887664795e-06, -3.057532012462616e-06, -2.8852373361587524e-06, -2.712942659854889e-06, -2.5406479835510254e-06, -2.368353307247162e-06, -2.1960586309432983e-06, -2.023763954639435e-06, -1.8514692783355713e-06, -1.6791746020317078e-06, -1.5068799257278442e-06, -1.3345852494239807e-06, -1.1622905731201172e-06, -9.899958968162537e-07, -8.177012205123901e-07, -6.454065442085266e-07, -4.731118679046631e-07, -3.0081719160079956e-07, -1.2852251529693604e-07, 4.377216100692749e-08, 2.1606683731079102e-07, 3.8836151361465454e-07, 5.606561899185181e-07, 7.329508662223816e-07, 9.052455425262451e-07, 1.0775402188301086e-06, 1.2498348951339722e-06, 1.4221295714378357e-06, 1.5944242477416992e-06, 1.7667189240455627e-06, 1.9390136003494263e-06, 2.11130827665329e-06, 2.2836029529571533e-06, 2.455897629261017e-06, 2.6281923055648804e-06, 2.800486981868744e-06, 2.9727816581726074e-06, 3.145076334476471e-06, 3.3173710107803345e-06, 3.489665687084198e-06, 3.6619603633880615e-06, 3.834255039691925e-06, 4.0065497159957886e-06, 4.178844392299652e-06, 4.351139068603516e-06]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 11.0, 21.0, 242.0, 1597.0, 4190300.0, 1822.0, 229.0, 40.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.85860824584961e-05, -9.326264262199402e-05, -8.793920278549194e-05, -8.261576294898987e-05, -7.729232311248779e-05, -7.196888327598572e-05, -6.664544343948364e-05, -6.132200360298157e-05, -5.599856376647949e-05, -5.067512392997742e-05, -4.535168409347534e-05, -4.0028244256973267e-05, -3.470480442047119e-05, -2.9381364583969116e-05, -2.405792474746704e-05, -1.8734484910964966e-05, -1.341104507446289e-05, -8.087605237960815e-06, -2.7641654014587402e-06, 2.559274435043335e-06, 7.88271427154541e-06, 1.3206154108047485e-05, 1.852959394454956e-05, 2.3853033781051636e-05, 2.917647361755371e-05, 3.4499913454055786e-05, 3.982335329055786e-05, 4.5146793127059937e-05, 5.047023296356201e-05, 5.579367280006409e-05, 6.111711263656616e-05, 6.644055247306824e-05, 7.176399230957031e-05, 7.708743214607239e-05, 8.241087198257446e-05, 8.773431181907654e-05, 9.305775165557861e-05, 9.838119149208069e-05, 0.00010370463132858276, 0.00010902807116508484, 0.00011435151100158691, 0.00011967495083808899, 0.00012499839067459106, 0.00013032183051109314, 0.00013564527034759521, 0.0001409687101840973, 0.00014629215002059937, 0.00015161558985710144, 0.00015693902969360352, 0.0001622624695301056, 0.00016758590936660767, 0.00017290934920310974, 0.00017823278903961182, 0.0001835562288761139, 0.00018887966871261597, 0.00019420310854911804, 0.00019952654838562012, 0.0002048499882221222, 0.00021017342805862427, 0.00021549686789512634, 0.00022082030773162842, 0.0002261437475681305, 0.00023146718740463257, 0.00023679062724113464, 0.00024211406707763672]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 0.0, 10.0, 16.0, 25.0, 45.0, 308.0, 2635.0, 855.0, 115.0, 31.0, 16.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.377696990966797e-06, -6.083399057388306e-06, -5.7891011238098145e-06, -5.494803190231323e-06, -5.200505256652832e-06, -4.906207323074341e-06, -4.61190938949585e-06, -4.317611455917358e-06, -4.023313522338867e-06, -3.729015588760376e-06, -3.4347176551818848e-06, -3.1404197216033936e-06, -2.8461217880249023e-06, -2.551823854446411e-06, -2.25752592086792e-06, -1.9632279872894287e-06, -1.6689300537109375e-06, -1.3746321201324463e-06, -1.080334186553955e-06, -7.860362529754639e-07, -4.917383193969727e-07, -1.9744038581848145e-07, 9.685754776000977e-08, 3.91155481338501e-07, 6.854534149169922e-07, 9.797513484954834e-07, 1.2740492820739746e-06, 1.5683472156524658e-06, 1.862645149230957e-06, 2.1569430828094482e-06, 2.4512410163879395e-06, 2.7455389499664307e-06, 3.039836883544922e-06, 3.334134817123413e-06, 3.6284327507019043e-06, 3.9227306842803955e-06, 4.217028617858887e-06, 4.511326551437378e-06, 4.805624485015869e-06, 5.09992241859436e-06, 5.3942203521728516e-06, 5.688518285751343e-06, 5.982816219329834e-06, 6.277114152908325e-06, 6.571412086486816e-06, 6.865710020065308e-06, 7.160007953643799e-06, 7.45430588722229e-06, 7.748603820800781e-06, 8.042901754379272e-06, 8.337199687957764e-06, 8.631497621536255e-06, 8.925795555114746e-06, 9.220093488693237e-06, 9.514391422271729e-06, 9.80868935585022e-06, 1.0102987289428711e-05, 1.0397285223007202e-05, 1.0691583156585693e-05, 1.0985881090164185e-05, 1.1280179023742676e-05, 1.1574476957321167e-05, 1.1868774890899658e-05, 1.216307282447815e-05, 1.245737075805664e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 11.0, 11.0, 31.0, 37.0, 80.0, 119.0, 200.0, 229.0, 116.0, 80.0, 40.0, 19.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.262283699878026e-06, -7.6266087489784695e-06, -6.990933343331562e-06, -6.355258392432006e-06, -5.719582986785099e-06, -5.083908035885543e-06, -4.448233084985986e-06, -3.812557679339079e-06, -3.176882728439523e-06, -2.541207550166291e-06, -1.9055324855798972e-06, -1.2698574209935032e-06, -6.341822427202715e-07, 1.4929355529602617e-09, 6.371678864525165e-07, 1.2728432920994237e-06, 1.90851824299898e-06, 2.5441934212722117e-06, 3.1798685995454434e-06, 3.815543550445e-06, 4.451218956091907e-06, 5.086893906991463e-06, 5.7225688578910194e-06, 6.358244263537927e-06, 6.993919214437483e-06, 7.62959462008439e-06, 8.265269570983946e-06, 8.900944521883503e-06, 9.536619472783059e-06, 1.0172294423682615e-05, 1.0807969374582171e-05, 1.144364523497643e-05, 1.2079321095370688e-05, 1.2714996046270244e-05, 1.33506709971698e-05, 1.3986345948069356e-05, 1.4622021808463614e-05, 1.525769675936317e-05, 1.589337261975743e-05, 1.6529047570656985e-05, 1.716472252155654e-05, 1.7800397472456098e-05, 1.8436072423355654e-05, 1.907174737425521e-05, 1.9707422325154766e-05, 2.0343097276054323e-05, 2.097877222695388e-05, 2.161444899684284e-05, 2.225012212875299e-05, 2.2885797079652548e-05, 2.3521472030552104e-05, 2.415714698145166e-05, 2.4792821932351217e-05, 2.5428496883250773e-05, 2.606417183415033e-05, 2.669984860403929e-05, 2.7335523554938845e-05, 2.79711985058384e-05, 2.8606873456737958e-05, 2.9242548407637514e-05, 2.987822335853707e-05, 3.051390012842603e-05, 3.1149575079325587e-05, 3.178525003022514e-05, 3.24209249811247e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 14.0, 19.0, 27.0, 20.0, 41.0, 52.0, 51.0, 52.0, 75.0, 52.0, 53.0, 68.0, 50.0, 67.0, 56.0, 56.0, 54.0, 43.0, 37.0, 31.0, 16.0, 20.0, 9.0, 8.0, 10.0, 8.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.904036465333775e-06, -7.630450454598758e-06, -7.356865353358444e-06, -7.083279797370778e-06, -6.809694241383113e-06, -6.536108230648097e-06, -6.262522674660431e-06, -5.988937118672766e-06, -5.7153515626851e-06, -5.441766006697435e-06, -5.1681804507097695e-06, -4.894594894722104e-06, -4.621008883987088e-06, -4.347423782746773e-06, -4.073837772011757e-06, -3.8002522160240915e-06, -3.526666660036426e-06, -3.2530811040487606e-06, -2.979495548061095e-06, -2.7059097646997543e-06, -2.432324208712089e-06, -2.1587386527244234e-06, -1.8851529830499203e-06, -1.6115673133754171e-06, -1.3379817573877517e-06, -1.0643962014000863e-06, -7.908105317255831e-07, -5.172249188944988e-07, -2.4363930606341455e-07, 2.994624992425088e-08, 3.0353191959875403e-07, 5.771175892732572e-07, 8.507022357662208e-07, 1.1242877917538863e-06, 1.3978734614283894e-06, 1.6714591311028926e-06, 1.945044687090558e-06, 2.2186302430782234e-06, 2.4922160264395643e-06, 2.7658015824272297e-06, 3.039387138414895e-06, 3.3129726944025606e-06, 3.586558250390226e-06, 3.8601438063778915e-06, 4.133729817112908e-06, 4.407314918353222e-06, 4.680900929088239e-06, 4.954486485075904e-06, 5.2280720410635695e-06, 5.501657597051235e-06, 5.7752431530389e-06, 6.048828709026566e-06, 6.322414265014231e-06, 6.5960002757492475e-06, 6.869585831736913e-06, 7.143171387724578e-06, 7.416756943712244e-06, 7.69034249969991e-06, 7.963928510434926e-06, 8.23751361167524e-06, 8.511099622410256e-06, 8.784684723650571e-06, 9.058270734385587e-06, 9.331855835625902e-06, 9.605441846360918e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 19.0, 43.0, 66.0, 125.0, 350.0, 673.0, 2068.0, 54174.0, 987680.0, 1981.0, 744.0, 289.0, 197.0, 63.0, 32.0, 16.0, 10.0, 7.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-06, -7.554888725280762e-06, -7.361173629760742e-06, -7.167458534240723e-06, -6.973743438720703e-06, -6.780028343200684e-06, -6.586313247680664e-06, -6.3925981521606445e-06, -6.198883056640625e-06, -6.0051679611206055e-06, -5.811452865600586e-06, -5.617737770080566e-06, -5.424022674560547e-06, -5.230307579040527e-06, -5.036592483520508e-06, -4.842877388000488e-06, -4.649162292480469e-06, -4.455447196960449e-06, -4.26173210144043e-06, -4.06801700592041e-06, -3.874301910400391e-06, -3.680586814880371e-06, -3.4868717193603516e-06, -3.293156623840332e-06, -3.0994415283203125e-06, -2.905726432800293e-06, -2.7120113372802734e-06, -2.518296241760254e-06, -2.3245811462402344e-06, -2.130866050720215e-06, -1.9371509552001953e-06, -1.7434358596801758e-06, -1.5497207641601562e-06, -1.3560056686401367e-06, -1.1622905731201172e-06, -9.685754776000977e-07, -7.748603820800781e-07, -5.811452865600586e-07, -3.8743019104003906e-07, -1.9371509552001953e-07, 0.0, 1.9371509552001953e-07, 3.8743019104003906e-07, 5.811452865600586e-07, 7.748603820800781e-07, 9.685754776000977e-07, 1.1622905731201172e-06, 1.3560056686401367e-06, 1.5497207641601562e-06, 1.7434358596801758e-06, 1.9371509552001953e-06, 2.130866050720215e-06, 2.3245811462402344e-06, 2.518296241760254e-06, 2.7120113372802734e-06, 2.905726432800293e-06, 3.0994415283203125e-06, 3.293156623840332e-06, 3.4868717193603516e-06, 3.680586814880371e-06, 3.874301910400391e-06, 4.06801700592041e-06, 4.26173210144043e-06, 4.455447196960449e-06, 4.649162292480469e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 15.0, 8.0, 20.0, 32.0, 62.0, 48.0, 84.0, 74.0, 99.0, 97.0, 83.0, 83.0, 78.0, 70.0, 53.0, 35.0, 18.0, 18.0, 13.0, 10.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4836273193359375e-06, -5.218200385570526e-06, -4.952773451805115e-06, -4.687346518039703e-06, -4.421919584274292e-06, -4.156492650508881e-06, -3.891065716743469e-06, -3.625638782978058e-06, -3.3602118492126465e-06, -3.094784915447235e-06, -2.8293579816818237e-06, -2.5639310479164124e-06, -2.298504114151001e-06, -2.0330771803855896e-06, -1.7676502466201782e-06, -1.5022233128547668e-06, -1.2367963790893555e-06, -9.71369445323944e-07, -7.059425115585327e-07, -4.4051557779312134e-07, -1.7508864402770996e-07, 9.033828973770142e-08, 3.557652235031128e-07, 6.211921572685242e-07, 8.866190910339355e-07, 1.152046024799347e-06, 1.4174729585647583e-06, 1.6828998923301697e-06, 1.948326826095581e-06, 2.2137537598609924e-06, 2.479180693626404e-06, 2.744607627391815e-06, 3.0100345611572266e-06, 3.275461494922638e-06, 3.5408884286880493e-06, 3.8063153624534607e-06, 4.071742296218872e-06, 4.3371692299842834e-06, 4.602596163749695e-06, 4.868023097515106e-06, 5.133450031280518e-06, 5.398876965045929e-06, 5.66430389881134e-06, 5.929730832576752e-06, 6.195157766342163e-06, 6.4605847001075745e-06, 6.726011633872986e-06, 6.991438567638397e-06, 7.256865501403809e-06, 7.52229243516922e-06, 7.787719368934631e-06, 8.053146302700043e-06, 8.318573236465454e-06, 8.584000170230865e-06, 8.849427103996277e-06, 9.114854037761688e-06, 9.3802809715271e-06, 9.645707905292511e-06, 9.911134839057922e-06, 1.0176561772823334e-05, 1.0441988706588745e-05, 1.0707415640354156e-05, 1.0972842574119568e-05, 1.123826950788498e-05, 1.150369644165039e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 131.0, 0.0, 0.0, 0.0, 351.0, 0.0, 0.0, 4971.0, 0.0, 0.0, 0.0, 1037511.0, 0.0, 0.0, 5006.0, 0.0, 0.0, 0.0, 337.0, 0.0, 0.0, 126.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.388872861862183e-07, -6.221234798431396e-07, -6.05359673500061e-07, -5.885958671569824e-07, -5.718320608139038e-07, -5.550682544708252e-07, -5.383044481277466e-07, -5.21540641784668e-07, -5.047768354415894e-07, -4.880130290985107e-07, -4.7124922275543213e-07, -4.544854164123535e-07, -4.377216100692749e-07, -4.209578037261963e-07, -4.041939973831177e-07, -3.8743019104003906e-07, -3.7066638469696045e-07, -3.5390257835388184e-07, -3.371387720108032e-07, -3.203749656677246e-07, -3.03611159324646e-07, -2.868473529815674e-07, -2.7008354663848877e-07, -2.5331974029541016e-07, -2.3655593395233154e-07, -2.1979212760925293e-07, -2.0302832126617432e-07, -1.862645149230957e-07, -1.695007085800171e-07, -1.5273690223693848e-07, -1.3597309589385986e-07, -1.1920928955078125e-07, -1.0244548320770264e-07, -8.568167686462402e-08, -6.891787052154541e-08, -5.21540641784668e-08, -3.5390257835388184e-08, -1.862645149230957e-08, -1.862645149230957e-09, 1.4901161193847656e-08, 3.166496753692627e-08, 4.842877388000488e-08, 6.51925802230835e-08, 8.195638656616211e-08, 9.872019290924072e-08, 1.1548399925231934e-07, 1.3224780559539795e-07, 1.4901161193847656e-07, 1.6577541828155518e-07, 1.825392246246338e-07, 1.993030309677124e-07, 2.1606683731079102e-07, 2.3283064365386963e-07, 2.4959444999694824e-07, 2.6635825634002686e-07, 2.8312206268310547e-07, 2.998858690261841e-07, 3.166496753692627e-07, 3.334134817123413e-07, 3.501772880554199e-07, 3.6694109439849854e-07, 3.8370490074157715e-07, 4.0046870708465576e-07, 4.172325134277344e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 8.0, 8.0, 10.0, 16.0, 15.0, 24.0, 21.0, 20.0, 29.0, 38.0, 36.0, 47.0, 46.0, 49.0, 48.0, 65.0, 46.0, 63.0, 74.0, 47.0, 50.0, 38.0, 36.0, 32.0, 31.0, 14.0, 15.0, 15.0, 10.0, 13.0, 8.0, 6.0, 9.0, 1.0, 7.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6748905181884766e-05, -1.6318634152412415e-05, -1.5888363122940063e-05, -1.5458092093467712e-05, -1.5027821063995361e-05, -1.459755003452301e-05, -1.416727900505066e-05, -1.3737007975578308e-05, -1.3306736946105957e-05, -1.2876465916633606e-05, -1.2446194887161255e-05, -1.2015923857688904e-05, -1.1585652828216553e-05, -1.1155381798744202e-05, -1.072511076927185e-05, -1.02948397397995e-05, -9.864568710327148e-06, -9.434297680854797e-06, -9.004026651382446e-06, -8.573755621910095e-06, -8.143484592437744e-06, -7.713213562965393e-06, -7.282942533493042e-06, -6.852671504020691e-06, -6.42240047454834e-06, -5.992129445075989e-06, -5.561858415603638e-06, -5.131587386131287e-06, -4.7013163566589355e-06, -4.2710453271865845e-06, -3.840774297714233e-06, -3.4105032682418823e-06, -2.9802322387695312e-06, -2.54996120929718e-06, -2.119690179824829e-06, -1.689419150352478e-06, -1.259148120880127e-06, -8.288770914077759e-07, -3.986060619354248e-07, 3.166496753692627e-08, 4.6193599700927734e-07, 8.922070264816284e-07, 1.3224780559539795e-06, 1.7527490854263306e-06, 2.1830201148986816e-06, 2.6132911443710327e-06, 3.043562173843384e-06, 3.473833203315735e-06, 3.904104232788086e-06, 4.334375262260437e-06, 4.764646291732788e-06, 5.194917321205139e-06, 5.62518835067749e-06, 6.055459380149841e-06, 6.485730409622192e-06, 6.9160014390945435e-06, 7.3462724685668945e-06, 7.776543498039246e-06, 8.206814527511597e-06, 8.637085556983948e-06, 9.067356586456299e-06, 9.49762761592865e-06, 9.927898645401001e-06, 1.0358169674873352e-05, 1.0788440704345703e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 0.0, 0.0, 785.0, 0.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [10.0, 11.0, 58.0, 251.0, 551.0, 115.0, 15.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.121250524098286e-06, -3.928803835151484e-06, -2.736357146204682e-06, -1.54391045725788e-06, -3.5146376831107773e-07, 8.409829206357244e-07, 2.0334296095825266e-06, 3.2258762985293288e-06, 4.418322987476131e-06, 5.610769676422933e-06, 6.803216365369735e-06, 7.995662599569187e-06, 9.18811019801069e-06, 1.0380555977462791e-05, 1.1573003575904295e-05, 1.2765449355356395e-05, 1.39578969537979e-05, 1.5150343642744701e-05, 1.6342790331691504e-05, 1.7535236111143604e-05, 1.8727683709585108e-05, 1.9920131308026612e-05, 2.1112577087478712e-05, 2.2305022866930813e-05, 2.3497470465372317e-05, 2.468991806381382e-05, 2.588236384326592e-05, 2.707480962271802e-05, 2.8267257221159525e-05, 2.945970481960103e-05, 3.065215059905313e-05, 3.184459637850523e-05, 3.303704579593614e-05, 3.422949157538824e-05, 3.542193735484034e-05, 3.6614386772271246e-05, 3.7806832551723346e-05, 3.8999278331175447e-05, 4.0191727748606354e-05, 4.1384173528058454e-05, 4.2576619307510555e-05, 4.3769065086962655e-05, 4.4961510866414756e-05, 4.615396028384566e-05, 4.7346406063297763e-05, 4.8538851842749864e-05, 4.973130126018077e-05, 5.092374703963287e-05, 5.211619281908497e-05, 5.330863859853707e-05, 5.450108437798917e-05, 5.569353379542008e-05, 5.688597957487218e-05, 5.807842535432428e-05, 5.927087477175519e-05, 6.046332055120729e-05, 6.165576633065939e-05, 6.28482157480903e-05, 6.404065788956359e-05, 6.52331073069945e-05, 6.642554944846779e-05, 6.76179988658987e-05, 6.88104482833296e-05, 7.00028904248029e-05, 7.119533984223381e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 14.0, 28.0, 38.0, 49.0, 67.0, 73.0, 85.0, 80.0, 84.0, 77.0, 86.0, 82.0, 66.0, 48.0, 40.0, 23.0, 21.0, 13.0, 6.0, 11.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19500508744386e-06, -4.954760242981138e-06, -4.714515853265766e-06, -4.4742710088030435e-06, -4.234026164340321e-06, -3.9937813198775984e-06, -3.7535367027885513e-06, -3.5132920856995042e-06, -3.2730472412367817e-06, -3.032802396774059e-06, -2.792557779685012e-06, -2.552313162595965e-06, -2.3120683181332424e-06, -2.07182347367052e-06, -1.8315788565814728e-06, -1.591334125805588e-06, -1.3510893950297032e-06, -1.1108446642538183e-06, -8.705999334779335e-07, -6.303552027020487e-07, -3.901104719261639e-07, -1.4986574115027906e-07, 9.037898962560575e-08, 3.3062372040149057e-07, 5.708684511773754e-07, 8.111131819532602e-07, 1.051357912729145e-06, 1.2916026435050298e-06, 1.5318473742809147e-06, 1.7720921050567995e-06, 2.0123368358326843e-06, 2.2525814529217314e-06, 2.492825842637103e-06, 2.7330706870998256e-06, 2.9733153041888727e-06, 3.2135599212779198e-06, 3.4538047657406423e-06, 3.694049610203365e-06, 3.9342939999187365e-06, 4.174538844381459e-06, 4.414783688844182e-06, 4.655028533306904e-06, 4.895273377769627e-06, 5.135517767484998e-06, 5.375762611947721e-06, 5.616007456410443e-06, 5.856251846125815e-06, 6.096496690588538e-06, 6.33674153505126e-06, 6.576986379513983e-06, 6.817231223976705e-06, 7.057475613692077e-06, 7.297720458154799e-06, 7.537965302617522e-06, 7.778209692332894e-06, 8.018454536795616e-06, 8.258699381258339e-06, 8.498944225721061e-06, 8.739189070183784e-06, 8.979433914646506e-06, 9.219678759109229e-06, 9.45992269407725e-06, 9.700167538539972e-06, 9.940412383002695e-06, 1.0180657227465417e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 0.0, 8.0, 5.0, 2.0, 12.0, 16.0, 27.0, 33.0, 37.0, 45.0, 88.0, 154.0, 299.0, 488.0, 903.0, 2315.0, 6421.0, 17750.0, 109745.0, 771189.0, 104755.0, 23349.0, 5928.0, 2681.0, 1069.0, 470.0, 299.0, 163.0, 84.0, 67.0, 48.0, 21.0, 17.0, 23.0, 8.0, 10.0, 10.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.4066696166992188e-05, -1.3670884072780609e-05, -1.327507197856903e-05, -1.2879259884357452e-05, -1.2483447790145874e-05, -1.2087635695934296e-05, -1.1691823601722717e-05, -1.1296011507511139e-05, -1.090019941329956e-05, -1.0504387319087982e-05, -1.0108575224876404e-05, -9.712763130664825e-06, -9.316951036453247e-06, -8.921138942241669e-06, -8.52532684803009e-06, -8.129514753818512e-06, -7.733702659606934e-06, -7.337890565395355e-06, -6.942078471183777e-06, -6.5462663769721985e-06, -6.15045428276062e-06, -5.754642188549042e-06, -5.358830094337463e-06, -4.963018000125885e-06, -4.567205905914307e-06, -4.171393811702728e-06, -3.77558171749115e-06, -3.3797696232795715e-06, -2.983957529067993e-06, -2.588145434856415e-06, -2.1923333406448364e-06, -1.796521246433258e-06, -1.4007091522216797e-06, -1.0048970580101013e-06, -6.09084963798523e-07, -2.1327286958694458e-07, 1.825392246246338e-07, 5.783513188362122e-07, 9.741634130477905e-07, 1.369975507259369e-06, 1.7657876014709473e-06, 2.1615996956825256e-06, 2.557411789894104e-06, 2.9532238841056824e-06, 3.3490359783172607e-06, 3.744848072528839e-06, 4.1406601667404175e-06, 4.536472260951996e-06, 4.932284355163574e-06, 5.328096449375153e-06, 5.723908543586731e-06, 6.119720637798309e-06, 6.515532732009888e-06, 6.911344826221466e-06, 7.3071569204330444e-06, 7.702969014644623e-06, 8.098781108856201e-06, 8.49459320306778e-06, 8.890405297279358e-06, 9.286217391490936e-06, 9.682029485702515e-06, 1.0077841579914093e-05, 1.0473653674125671e-05, 1.086946576833725e-05, 1.1265277862548828e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 20.0, 23.0, 18.0, 24.0, 41.0, 40.0, 34.0, 42.0, 59.0, 72.0, 64.0, 57.0, 62.0, 64.0, 51.0, 33.0, 49.0, 26.0, 38.0, 33.0, 16.0, 22.0, 21.0, 18.0, 6.0, 9.0, 8.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.543231964111328e-06, -5.311332643032074e-06, -5.07943332195282e-06, -4.847534000873566e-06, -4.6156346797943115e-06, -4.383735358715057e-06, -4.151836037635803e-06, -3.919936716556549e-06, -3.688037395477295e-06, -3.4561380743980408e-06, -3.2242387533187866e-06, -2.9923394322395325e-06, -2.7604401111602783e-06, -2.528540790081024e-06, -2.29664146900177e-06, -2.064742147922516e-06, -1.8328428268432617e-06, -1.6009435057640076e-06, -1.3690441846847534e-06, -1.1371448636054993e-06, -9.052455425262451e-07, -6.73346221446991e-07, -4.414469003677368e-07, -2.0954757928848267e-07, 2.2351741790771484e-08, 2.5425106287002563e-07, 4.861503839492798e-07, 7.180497050285339e-07, 9.499490261077881e-07, 1.1818483471870422e-06, 1.4137476682662964e-06, 1.6456469893455505e-06, 1.8775463104248047e-06, 2.109445631504059e-06, 2.341344952583313e-06, 2.573244273662567e-06, 2.8051435947418213e-06, 3.0370429158210754e-06, 3.2689422369003296e-06, 3.5008415579795837e-06, 3.732740879058838e-06, 3.964640200138092e-06, 4.196539521217346e-06, 4.4284388422966e-06, 4.6603381633758545e-06, 4.892237484455109e-06, 5.124136805534363e-06, 5.356036126613617e-06, 5.587935447692871e-06, 5.819834768772125e-06, 6.051734089851379e-06, 6.2836334109306335e-06, 6.515532732009888e-06, 6.747432053089142e-06, 6.979331374168396e-06, 7.21123069524765e-06, 7.443130016326904e-06, 7.675029337406158e-06, 7.906928658485413e-06, 8.138827979564667e-06, 8.370727300643921e-06, 8.602626621723175e-06, 8.83452594280243e-06, 9.066425263881683e-06, 9.298324584960938e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 2.0, 11.0, 8.0, 13.0, 35.0, 38.0, 80.0, 156.0, 195.0, 450.0, 944.0, 1967.0, 9476.0, 129111.0, 853443.0, 44422.0, 5265.0, 1359.0, 748.0, 318.0, 212.0, 124.0, 53.0, 39.0, 21.0, 15.0, 13.0, 9.0, 6.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3589859008789062e-05, -1.3073906302452087e-05, -1.2557953596115112e-05, -1.2042000889778137e-05, -1.1526048183441162e-05, -1.1010095477104187e-05, -1.0494142770767212e-05, -9.978190064430237e-06, -9.462237358093262e-06, -8.946284651756287e-06, -8.430331945419312e-06, -7.914379239082336e-06, -7.398426532745361e-06, -6.882473826408386e-06, -6.366521120071411e-06, -5.850568413734436e-06, -5.334615707397461e-06, -4.818663001060486e-06, -4.302710294723511e-06, -3.7867575883865356e-06, -3.2708048820495605e-06, -2.7548521757125854e-06, -2.2388994693756104e-06, -1.7229467630386353e-06, -1.2069940567016602e-06, -6.910413503646851e-07, -1.7508864402770996e-07, 3.4086406230926514e-07, 8.568167686462402e-07, 1.3727694749832153e-06, 1.8887221813201904e-06, 2.4046748876571655e-06, 2.9206275939941406e-06, 3.4365803003311157e-06, 3.952533006668091e-06, 4.468485713005066e-06, 4.984438419342041e-06, 5.500391125679016e-06, 6.016343832015991e-06, 6.532296538352966e-06, 7.048249244689941e-06, 7.5642019510269165e-06, 8.080154657363892e-06, 8.596107363700867e-06, 9.112060070037842e-06, 9.628012776374817e-06, 1.0143965482711792e-05, 1.0659918189048767e-05, 1.1175870895385742e-05, 1.1691823601722717e-05, 1.2207776308059692e-05, 1.2723729014396667e-05, 1.3239681720733643e-05, 1.3755634427070618e-05, 1.4271587133407593e-05, 1.4787539839744568e-05, 1.5303492546081543e-05, 1.5819445252418518e-05, 1.6335397958755493e-05, 1.6851350665092468e-05, 1.7367303371429443e-05, 1.788325607776642e-05, 1.8399208784103394e-05, 1.891516149044037e-05, 1.9431114196777344e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 8.0, 16.0, 15.0, 20.0, 24.0, 29.0, 30.0, 35.0, 60.0, 49.0, 50.0, 54.0, 69.0, 73.0, 70.0, 61.0, 58.0, 51.0, 40.0, 30.0, 28.0, 19.0, 25.0, 17.0, 9.0, 7.0, 9.0, 10.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-06, -8.05780291557312e-06, -7.770955562591553e-06, -7.484108209609985e-06, -7.197260856628418e-06, -6.910413503646851e-06, -6.623566150665283e-06, -6.336718797683716e-06, -6.0498714447021484e-06, -5.763024091720581e-06, -5.476176738739014e-06, -5.189329385757446e-06, -4.902482032775879e-06, -4.6156346797943115e-06, -4.328787326812744e-06, -4.041939973831177e-06, -3.7550926208496094e-06, -3.468245267868042e-06, -3.1813979148864746e-06, -2.8945505619049072e-06, -2.60770320892334e-06, -2.3208558559417725e-06, -2.034008502960205e-06, -1.7471611499786377e-06, -1.4603137969970703e-06, -1.173466444015503e-06, -8.866190910339355e-07, -5.997717380523682e-07, -3.129243850708008e-07, -2.60770320892334e-08, 2.60770320892334e-07, 5.476176738739014e-07, 8.344650268554688e-07, 1.1213123798370361e-06, 1.4081597328186035e-06, 1.695007085800171e-06, 1.9818544387817383e-06, 2.2687017917633057e-06, 2.555549144744873e-06, 2.8423964977264404e-06, 3.129243850708008e-06, 3.416091203689575e-06, 3.7029385566711426e-06, 3.98978590965271e-06, 4.276633262634277e-06, 4.563480615615845e-06, 4.850327968597412e-06, 5.1371753215789795e-06, 5.424022674560547e-06, 5.710870027542114e-06, 5.997717380523682e-06, 6.284564733505249e-06, 6.571412086486816e-06, 6.858259439468384e-06, 7.145106792449951e-06, 7.4319541454315186e-06, 7.718801498413086e-06, 8.005648851394653e-06, 8.29249620437622e-06, 8.579343557357788e-06, 8.866190910339355e-06, 9.153038263320923e-06, 9.43988561630249e-06, 9.726732969284058e-06, 1.0013580322265625e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 200.0, 0.0, 0.0, 1883.0, 0.0, 0.0, 0.0, 29661.0, 0.0, 0.0, 0.0, 984997.0, 0.0, 0.0, 29519.0, 0.0, 0.0, 0.0, 1909.0, 0.0, 0.0, 200.0, 0.0, 0.0, 0.0, 72.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-07, -5.19677996635437e-07, -5.029141902923584e-07, -4.861503839492798e-07, -4.6938657760620117e-07, -4.5262277126312256e-07, -4.3585896492004395e-07, -4.1909515857696533e-07, -4.023313522338867e-07, -3.855675458908081e-07, -3.688037395477295e-07, -3.520399332046509e-07, -3.3527612686157227e-07, -3.1851232051849365e-07, -3.0174851417541504e-07, -2.849847078323364e-07, -2.682209014892578e-07, -2.514570951461792e-07, -2.3469328880310059e-07, -2.1792948246002197e-07, -2.0116567611694336e-07, -1.8440186977386475e-07, -1.6763806343078613e-07, -1.5087425708770752e-07, -1.341104507446289e-07, -1.1734664440155029e-07, -1.0058283805847168e-07, -8.381903171539307e-08, -6.705522537231445e-08, -5.029141902923584e-08, -3.3527612686157227e-08, -1.6763806343078613e-08, 0.0, 1.6763806343078613e-08, 3.3527612686157227e-08, 5.029141902923584e-08, 6.705522537231445e-08, 8.381903171539307e-08, 1.0058283805847168e-07, 1.1734664440155029e-07, 1.341104507446289e-07, 1.5087425708770752e-07, 1.6763806343078613e-07, 1.8440186977386475e-07, 2.0116567611694336e-07, 2.1792948246002197e-07, 2.3469328880310059e-07, 2.514570951461792e-07, 2.682209014892578e-07, 2.849847078323364e-07, 3.0174851417541504e-07, 3.1851232051849365e-07, 3.3527612686157227e-07, 3.520399332046509e-07, 3.688037395477295e-07, 3.855675458908081e-07, 4.023313522338867e-07, 4.1909515857696533e-07, 4.3585896492004395e-07, 4.5262277126312256e-07, 4.6938657760620117e-07, 4.861503839492798e-07, 5.029141902923584e-07, 5.19677996635437e-07, 5.364418029785156e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 889.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 0.0, 9.0, 0.0, 15.0, 0.0, 0.0, 17.0, 0.0, 29.0, 0.0, 58.0, 0.0, 0.0, 105.0, 0.0, 320.0, 0.0, 0.0, 1140.0, 0.0, 5721.0, 0.0, 48809.0, 0.0, 0.0, 935941.0, 0.0, 48926.0, 0.0, 5833.0, 0.0, 0.0, 1056.0, 0.0, 307.0, 0.0, 0.0, 148.0, 0.0, 64.0, 0.0, 29.0, 0.0, 0.0, 12.0, 0.0, 8.0, 0.0, 10.0, 0.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 17.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 709.0, 0.0, 0.0, 99.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -3.995373845100403e-07, -3.818422555923462e-07, -3.641471266746521e-07, -3.46451997756958e-07, -3.287568688392639e-07, -3.110617399215698e-07, -2.9336661100387573e-07, -2.7567148208618164e-07, -2.5797635316848755e-07, -2.4028122425079346e-07, -2.2258609533309937e-07, -2.0489096641540527e-07, -1.8719583749771118e-07, -1.695007085800171e-07, -1.51805579662323e-07, -1.341104507446289e-07, -1.1641532182693481e-07, -9.872019290924072e-08, -8.102506399154663e-08, -6.332993507385254e-08, -4.563480615615845e-08, -2.7939677238464355e-08, -1.0244548320770264e-08, 7.450580596923828e-09, 2.514570951461792e-08, 4.284083843231201e-08, 6.05359673500061e-08, 7.82310962677002e-08, 9.592622518539429e-08, 1.1362135410308838e-07, 1.3131648302078247e-07, 1.4901161193847656e-07, 1.6670674085617065e-07, 1.8440186977386475e-07, 2.0209699869155884e-07, 2.1979212760925293e-07, 2.3748725652694702e-07, 2.551823854446411e-07, 2.728775143623352e-07, 2.905726432800293e-07, 3.082677721977234e-07, 3.259629011154175e-07, 3.4365803003311157e-07, 3.6135315895080566e-07, 3.7904828786849976e-07, 3.9674341678619385e-07, 4.1443854570388794e-07, 4.3213367462158203e-07, 4.498288035392761e-07, 4.675239324569702e-07, 4.852190613746643e-07, 5.029141902923584e-07, 5.206093192100525e-07, 5.383044481277466e-07, 5.559995770454407e-07, 5.736947059631348e-07, 5.913898348808289e-07, 6.09084963798523e-07, 6.26780092716217e-07, 6.444752216339111e-07, 6.621703505516052e-07, 6.798654794692993e-07, 6.975606083869934e-07, 7.152557373046875e-07]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 18.0, 45.0, 299.0, 526.0, 87.0, 20.0, 7.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.909733226872049e-05, -5.714019789593294e-05, -5.518306352314539e-05, -5.322592915035784e-05, -5.126879477757029e-05, -4.931166040478274e-05, -4.7354522394016385e-05, -4.539739165920764e-05, -4.3440253648441285e-05, -4.1483119275653735e-05, -3.9525984902866185e-05, -3.7568850530078635e-05, -3.5611716157291085e-05, -3.3654581784503534e-05, -3.1697447411715984e-05, -2.974031121993903e-05, -2.7783178666140884e-05, -2.5826044293353334e-05, -2.3868909920565784e-05, -2.1911775547778234e-05, -1.9954641174990684e-05, -1.7997506802203134e-05, -1.604037061042618e-05, -1.408323623763863e-05, -1.212610186485108e-05, -1.016896749206353e-05, -8.21183311927598e-06, -6.254697836993728e-06, -4.297563464206178e-06, -2.3404290914186276e-06, -3.832938091363758e-07, 1.5738405636511743e-06, 3.5309712984599173e-06, 5.488105671247467e-06, 7.445240498782368e-06, 9.40237532631727e-06, 1.135950969910482e-05, 1.331664407189237e-05, 1.527377935417462e-05, 1.723091372696217e-05, 1.918804809974972e-05, 2.114518247253727e-05, 2.3102316845324822e-05, 2.5059453037101775e-05, 2.7016587409889325e-05, 2.8973721782676876e-05, 3.0930856155464426e-05, 3.2887990528251976e-05, 3.4845124901039526e-05, 3.6802259273827076e-05, 3.8759393646614626e-05, 4.0716528019402176e-05, 4.2673662392189726e-05, 4.4630796764977276e-05, 4.6587934775743634e-05, 4.8545065510552377e-05, 5.0502203521318734e-05, 5.2459337894106284e-05, 5.4416472266893834e-05, 5.6373606639681384e-05, 5.8330741012468934e-05, 6.0287875385256484e-05, 6.224500975804403e-05, 6.420214776881039e-05, 6.615927850361913e-05]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 10.0, 6.0, 10.0, 8.0, 13.0, 12.0, 9.0, 23.0, 21.0, 15.0, 15.0, 31.0, 22.0, 29.0, 39.0, 37.0, 33.0, 39.0, 36.0, 45.0, 30.0, 44.0, 37.0, 42.0, 26.0, 42.0, 36.0, 31.0, 27.0, 38.0, 21.0, 20.0, 19.0, 19.0, 20.0, 11.0, 7.0, 15.0, 6.0, 10.0, 9.0, 8.0, 7.0, 8.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-9.717604370962363e-06, -9.422691618965473e-06, -9.127777957473882e-06, -8.832865205476992e-06, -8.537952453480102e-06, -8.243039701483212e-06, -7.948126949486323e-06, -7.653213287994731e-06, -7.3583005359978415e-06, -7.063387784000952e-06, -6.768474577256711e-06, -6.473561370512471e-06, -6.178648618515581e-06, -5.883735866518691e-06, -5.588822659774451e-06, -5.29390945303021e-06, -4.99899670103332e-06, -4.7040839490364306e-06, -4.40917074229219e-06, -4.114257535547949e-06, -3.81934478355106e-06, -3.5244318041804945e-06, -3.2295188248099294e-06, -2.934605845439364e-06, -2.639692866068799e-06, -2.344779886698234e-06, -2.0498669073276687e-06, -1.7549539279571036e-06, -1.4600409485865384e-06, -1.1651279692159733e-06, -8.702149898454081e-07, -5.75302010474843e-07, -2.803890311042778e-07, 1.4523948266287334e-08, 3.094369276368525e-07, 6.043499070074176e-07, 8.992628863779828e-07, 1.194175865748548e-06, 1.489088845119113e-06, 1.7840018244896783e-06, 2.0789148038602434e-06, 2.3738277832308086e-06, 2.6687407626013737e-06, 2.963653741971939e-06, 3.258566721342504e-06, 3.553479700713069e-06, 3.848392680083634e-06, 4.143305886827875e-06, 4.438218638824765e-06, 4.733131390821654e-06, 5.028044597565895e-06, 5.3229578043101355e-06, 5.617870556307025e-06, 5.912783308303915e-06, 6.2076965150481556e-06, 6.502609721792396e-06, 6.797522473789286e-06, 7.092435225786176e-06, 7.387348432530416e-06, 7.682261639274657e-06, 7.977174391271546e-06, 8.272087143268436e-06, 8.566999895265326e-06, 8.861913556756917e-06, 9.156826308753807e-06]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 4.0, 8.0, 7.0, 5.0, 5.0, 13.0, 17.0, 16.0, 24.0, 30.0, 41.0, 34.0, 68.0, 66.0, 84.0, 97.0, 116.0, 153.0, 200.0, 279.0, 657.0, 1047011.0, 463.0, 234.0, 174.0, 165.0, 129.0, 104.0, 81.0, 57.0, 53.0, 30.0, 34.0, 27.0, 13.0, 21.0, 12.0, 14.0, 7.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.7621650840737857e-05, -1.7041518731275573e-05, -1.6461384802823886e-05, -1.5881252693361603e-05, -1.530112058389932e-05, -1.4720988474437036e-05, -1.414085545548005e-05, -1.3560722436523065e-05, -1.2980590327060781e-05, -1.2400458217598498e-05, -1.1820325198641513e-05, -1.1240192179684527e-05, -1.0660060070222244e-05, -1.007992796075996e-05, -9.499794941802975e-06, -8.91966192284599e-06, -8.339529813383706e-06, -7.759397703921422e-06, -7.179264684964437e-06, -6.599132120754803e-06, -6.018999556545168e-06, -5.438866992335534e-06, -4.858734428125899e-06, -4.278601863916265e-06, -3.6984692997066304e-06, -3.118336735496996e-06, -2.5382041712873615e-06, -1.958071607077727e-06, -1.3779390428680927e-06, -7.978064786584582e-07, -2.1767391444882378e-07, 3.6245864976081066e-07, 9.425912139704451e-07, 1.5227237781800795e-06, 2.102856342389714e-06, 2.6829889065993484e-06, 3.263121470808983e-06, 3.843254035018617e-06, 4.423386599228252e-06, 5.003519163437886e-06, 5.583651727647521e-06, 6.163784291857155e-06, 6.7439168560667895e-06, 7.324049420276424e-06, 7.904181984486058e-06, 8.484314093948342e-06, 9.064447112905327e-06, 9.644580131862313e-06, 1.0224712241324596e-05, 1.080484435078688e-05, 1.1384977369743865e-05, 1.196511038870085e-05, 1.2545242498163134e-05, 1.3125374607625417e-05, 1.3705507626582403e-05, 1.4285640645539388e-05, 1.4865772755001672e-05, 1.5445904864463955e-05, 1.6026038792915642e-05, 1.6606170902377926e-05, 1.718630301184021e-05, 1.7766435121302493e-05, 1.8346567230764776e-05, 1.8926701159216464e-05, 1.9506833268678747e-05]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 25.0, 45.0, 233.0, 7237.0, 51462480.0, 1030.0, 194.0, 45.0, 24.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-122.0, -119.56494140625, -117.1298828125, -114.69482421875, -112.259765625, -109.82470703125, -107.3896484375, -104.95458984375, -102.51953125, -100.08447265625, -97.6494140625, -95.21435546875, -92.779296875, -90.34423828125, -87.9091796875, -85.47412109375, -83.0390625, -80.60400390625, -78.1689453125, -75.73388671875, -73.298828125, -70.86376953125, -68.4287109375, -65.99365234375, -63.55859375, -61.12353515625, -58.6884765625, -56.25341796875, -53.818359375, -51.38330078125, -48.9482421875, -46.51318359375, -44.078125, -41.64306640625, -39.2080078125, -36.77294921875, -34.337890625, -31.90283203125, -29.4677734375, -27.03271484375, -24.59765625, -22.16259765625, -19.7275390625, -17.29248046875, -14.857421875, -12.42236328125, -9.9873046875, -7.55224609375, -5.1171875, -2.68212890625, -0.2470703125, 2.18798828125, 4.623046875, 7.05810546875, 9.4931640625, 11.92822265625, 14.36328125, 16.79833984375, 19.2333984375, 21.66845703125, 24.103515625, 26.53857421875, 28.9736328125, 31.40869140625, 33.84375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 5.0, 13.0, 15.0, 20.0, 20.0, 28.0, 26.0, 49.0, 65.0, 91.0, 108.0, 140.0, 223.0, 292.0, 415.0, 611.0, 1068.0, 2380.0, 80631.0, 6197942.0, 3363.0, 1346.0, 764.0, 504.0, 337.0, 253.0, 176.0, 147.0, 92.0, 72.0, 45.0, 43.0, 31.0, 24.0, 18.0, 12.0, 14.0, 10.0, 9.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.047332763671875, -0.04581117630004883, -0.044289588928222656, -0.042768001556396484, -0.04124641418457031, -0.03972482681274414, -0.03820323944091797, -0.0366816520690918, -0.035160064697265625, -0.03363847732543945, -0.03211688995361328, -0.03059530258178711, -0.029073715209960938, -0.027552127838134766, -0.026030540466308594, -0.024508953094482422, -0.02298736572265625, -0.021465778350830078, -0.019944190979003906, -0.018422603607177734, -0.016901016235351562, -0.01537942886352539, -0.013857841491699219, -0.012336254119873047, -0.010814666748046875, -0.009293079376220703, -0.007771492004394531, -0.006249904632568359, -0.0047283172607421875, -0.0032067298889160156, -0.0016851425170898438, -0.00016355514526367188, 0.0013580322265625, 0.002879619598388672, 0.004401206970214844, 0.005922794342041016, 0.0074443817138671875, 0.00896596908569336, 0.010487556457519531, 0.012009143829345703, 0.013530731201171875, 0.015052318572998047, 0.01657390594482422, 0.01809549331665039, 0.019617080688476562, 0.021138668060302734, 0.022660255432128906, 0.024181842803955078, 0.02570343017578125, 0.027225017547607422, 0.028746604919433594, 0.030268192291259766, 0.03178977966308594, 0.03331136703491211, 0.03483295440673828, 0.03635454177856445, 0.037876129150390625, 0.0393977165222168, 0.04091930389404297, 0.04244089126586914, 0.04396247863769531, 0.045484066009521484, 0.047005653381347656, 0.04852724075317383, 0.050048828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 9.0, 8.0, 11.0, 8.0, 11.0, 16.0, 22.0, 23.0, 21.0, 29.0, 32.0, 39.0, 46.0, 46.0, 48.0, 47.0, 53.0, 55.0, 1076.0, 48.0, 32.0, 41.0, 42.0, 39.0, 36.0, 32.0, 24.0, 31.0, 16.0, 9.0, 16.0, 10.0, 9.0, 4.0, 9.0, 6.0, 6.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.954345703125, -6.68994140625, -6.425537109375, -6.1611328125, -5.896728515625, -5.63232421875, -5.367919921875, -5.103515625, -4.839111328125, -4.57470703125, -4.310302734375, -4.0458984375, -3.781494140625, -3.51708984375, -3.252685546875, -2.98828125, -2.723876953125, -2.45947265625, -2.195068359375, -1.9306640625, -1.666259765625, -1.40185546875, -1.137451171875, -0.873046875, -0.608642578125, -0.34423828125, -0.079833984375, 0.1845703125, 0.448974609375, 0.71337890625, 0.977783203125, 1.2421875, 1.506591796875, 1.77099609375, 2.035400390625, 2.2998046875, 2.564208984375, 2.82861328125, 3.093017578125, 3.357421875, 3.621826171875, 3.88623046875, 4.150634765625, 4.4150390625, 4.679443359375, 4.94384765625, 5.208251953125, 5.47265625, 5.737060546875, 6.00146484375, 6.265869140625, 6.5302734375, 6.794677734375, 7.05908203125, 7.323486328125, 7.587890625, 7.852294921875, 8.11669921875, 8.381103515625, 8.6455078125, 8.909912109375, 9.17431640625, 9.438720703125, 9.703125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 9.0, 10.0, 9.0, 11.0, 19.0, 28.0, 38.0, 45.0, 94.0, 141.0, 304.0, 620.0, 2217.0, 6250531.0, 34712.0, 1526.0, 507.0, 229.0, 119.0, 82.0, 55.0, 34.0, 28.0, 14.0, 8.0, 10.0, 5.0, 6.0, 6.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1107177734375, -0.10701370239257812, -0.10330963134765625, -0.09960556030273438, -0.0959014892578125, -0.09219741821289062, -0.08849334716796875, -0.08478927612304688, -0.081085205078125, -0.07738113403320312, -0.07367706298828125, -0.06997299194335938, -0.0662689208984375, -0.06256484985351562, -0.05886077880859375, -0.055156707763671875, -0.05145263671875, -0.047748565673828125, -0.04404449462890625, -0.040340423583984375, -0.0366363525390625, -0.032932281494140625, -0.02922821044921875, -0.025524139404296875, -0.021820068359375, -0.018115997314453125, -0.01441192626953125, -0.010707855224609375, -0.0070037841796875, -0.003299713134765625, 0.00040435791015625, 0.004108428955078125, 0.0078125, 0.011516571044921875, 0.01522064208984375, 0.018924713134765625, 0.0226287841796875, 0.026332855224609375, 0.03003692626953125, 0.033740997314453125, 0.037445068359375, 0.041149139404296875, 0.04485321044921875, 0.048557281494140625, 0.0522613525390625, 0.055965423583984375, 0.05966949462890625, 0.06337356567382812, 0.06707763671875, 0.07078170776367188, 0.07448577880859375, 0.07818984985351562, 0.0818939208984375, 0.08559799194335938, 0.08930206298828125, 0.09300613403320312, 0.096710205078125, 0.10041427612304688, 0.10411834716796875, 0.10782241821289062, 0.1115264892578125, 0.11523056030273438, 0.11893463134765625, 0.12263870239257812, 0.1263427734375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 31.0, 1754.0, 215.0, 7.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05267333984375, -0.051412343978881836, -0.05015134811401367, -0.04889035224914551, -0.047629356384277344, -0.04636836051940918, -0.045107364654541016, -0.04384636878967285, -0.04258537292480469, -0.04132437705993652, -0.04006338119506836, -0.038802385330200195, -0.03754138946533203, -0.03628039360046387, -0.0350193977355957, -0.03375840187072754, -0.032497406005859375, -0.03123641014099121, -0.029975414276123047, -0.028714418411254883, -0.02745342254638672, -0.026192426681518555, -0.02493143081665039, -0.023670434951782227, -0.022409439086914062, -0.0211484432220459, -0.019887447357177734, -0.01862645149230957, -0.017365455627441406, -0.016104459762573242, -0.014843463897705078, -0.013582468032836914, -0.01232147216796875, -0.011060476303100586, -0.009799480438232422, -0.008538484573364258, -0.007277488708496094, -0.00601649284362793, -0.004755496978759766, -0.0034945011138916016, -0.0022335052490234375, -0.0009725093841552734, 0.0002884864807128906, 0.0015494823455810547, 0.0028104782104492188, 0.004071474075317383, 0.005332469940185547, 0.006593465805053711, 0.007854461669921875, 0.009115457534790039, 0.010376453399658203, 0.011637449264526367, 0.012898445129394531, 0.014159440994262695, 0.01542043685913086, 0.016681432723999023, 0.017942428588867188, 0.01920342445373535, 0.020464420318603516, 0.02172541618347168, 0.022986412048339844, 0.024247407913208008, 0.025508403778076172, 0.026769399642944336, 0.0280303955078125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 9.0, 17.0, 19.0, 29.0, 41.0, 63.0, 99.0, 103.0, 196.0, 353.0, 589.0, 999.0, 1848.0, 3580.0, 8158.0, 22301.0, 96306.0, 5103252.0, 955721.0, 66450.0, 17511.0, 6739.0, 3148.0, 1571.0, 932.0, 529.0, 303.0, 198.0, 111.0, 87.0, 42.0, 34.0, 37.0, 19.0, 11.0, 3.0, 7.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.005123138427734375, -0.004967391490936279, -0.004811644554138184, -0.004655897617340088, -0.004500150680541992, -0.0043444037437438965, -0.004188656806945801, -0.004032909870147705, -0.0038771629333496094, -0.0037214159965515137, -0.003565669059753418, -0.0034099221229553223, -0.0032541751861572266, -0.003098428249359131, -0.002942681312561035, -0.0027869343757629395, -0.0026311874389648438, -0.002475440502166748, -0.0023196935653686523, -0.0021639466285705566, -0.002008199691772461, -0.0018524527549743652, -0.0016967058181762695, -0.0015409588813781738, -0.0013852119445800781, -0.0012294650077819824, -0.0010737180709838867, -0.000917971134185791, -0.0007622241973876953, -0.0006064772605895996, -0.0004507303237915039, -0.0002949833869934082, -0.0001392364501953125, 1.6510486602783203e-05, 0.0001722574234008789, 0.0003280043601989746, 0.0004837512969970703, 0.000639498233795166, 0.0007952451705932617, 0.0009509921073913574, 0.0011067390441894531, 0.0012624859809875488, 0.0014182329177856445, 0.0015739798545837402, 0.001729726791381836, 0.0018854737281799316, 0.0020412206649780273, 0.002196967601776123, 0.0023527145385742188, 0.0025084614753723145, 0.00266420841217041, 0.002819955348968506, 0.0029757022857666016, 0.0031314492225646973, 0.003287196159362793, 0.0034429430961608887, 0.0035986900329589844, 0.00375443696975708, 0.003910183906555176, 0.0040659308433532715, 0.004221677780151367, 0.004377424716949463, 0.004533171653747559, 0.004688918590545654, 0.00484466552734375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 3.0, 6.0, 7.0, 9.0, 14.0, 26.0, 18.0, 43.0, 65.0, 97.0, 187.0, 769.0, 312.0, 147.0, 113.0, 66.0, 43.0, 21.0, 19.0, 16.0, 2.0, 2.0, 8.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00858306884765625, -0.008327007293701172, -0.008070945739746094, -0.007814884185791016, -0.0075588226318359375, -0.007302761077880859, -0.007046699523925781, -0.006790637969970703, -0.006534576416015625, -0.006278514862060547, -0.006022453308105469, -0.005766391754150391, -0.0055103302001953125, -0.005254268646240234, -0.004998207092285156, -0.004742145538330078, -0.004486083984375, -0.004230022430419922, -0.003973960876464844, -0.0037178993225097656, -0.0034618377685546875, -0.0032057762145996094, -0.0029497146606445312, -0.002693653106689453, -0.002437591552734375, -0.002181529998779297, -0.0019254684448242188, -0.0016694068908691406, -0.0014133453369140625, -0.0011572837829589844, -0.0009012222290039062, -0.0006451606750488281, -0.00038909912109375, -0.00013303756713867188, 0.00012302398681640625, 0.0003790855407714844, 0.0006351470947265625, 0.0008912086486816406, 0.0011472702026367188, 0.0014033317565917969, 0.001659393310546875, 0.0019154548645019531, 0.0021715164184570312, 0.0024275779724121094, 0.0026836395263671875, 0.0029397010803222656, 0.0031957626342773438, 0.003451824188232422, 0.0037078857421875, 0.003963947296142578, 0.004220008850097656, 0.004476070404052734, 0.0047321319580078125, 0.004988193511962891, 0.005244255065917969, 0.005500316619873047, 0.005756378173828125, 0.006012439727783203, 0.006268501281738281, 0.006524562835693359, 0.0067806243896484375, 0.007036685943603516, 0.007292747497558594, 0.007548809051513672, 0.00780487060546875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 20.0, 438.0, 276.0, 124.0, 67.0, 32.0, 27.0, 6.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09881081432104111, -0.09678125381469727, -0.09475168585777283, -0.09272212535142899, -0.09069256484508514, -0.0886630043387413, -0.08663344383239746, -0.08460387587547302, -0.08257431536912918, -0.08054475486278534, -0.0785151869058609, -0.07648562639951706, -0.07445606589317322, -0.07242650538682938, -0.07039694488048553, -0.0683673769235611, -0.06633781641721725, -0.06430825591087341, -0.06227869167923927, -0.06024912744760513, -0.05821956694126129, -0.05619000643491745, -0.05416044220328331, -0.05213087797164917, -0.05010131746530533, -0.04807175695896149, -0.04604219272732735, -0.04401262849569321, -0.041983067989349365, -0.039953507483005524, -0.037923943251371384, -0.035894379019737244, -0.0338648185133934, -0.03183525800704956, -0.02980569377541542, -0.02777613140642643, -0.02574656903743744, -0.023717006668448448, -0.021687444299459457, -0.019657881930470467, -0.017628321424126625, -0.015598759055137634, -0.013569196686148643, -0.011539634317159653, -0.009510071948170662, -0.007480509579181671, -0.00545094721019268, -0.0034213848412036896, -0.0013918224722146988, 0.000637739896774292, 0.0026673022657632828, 0.0046968646347522736, 0.006726427003741264, 0.008755989372730255, 0.010785551741719246, 0.012815114110708237, 0.014844676479697227, 0.016874238848686218, 0.01890380121767521, 0.0209333635866642, 0.02296292595565319, 0.02499248832464218, 0.027022050693631172, 0.029051613062620163, 0.031081175431609154]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 9.0, 19.0, 11.0, 16.0, 18.0, 29.0, 22.0, 21.0, 34.0, 34.0, 28.0, 23.0, 40.0, 44.0, 35.0, 53.0, 40.0, 34.0, 46.0, 26.0, 38.0, 37.0, 44.0, 30.0, 33.0, 30.0, 17.0, 20.0, 23.0, 26.0, 19.0, 17.0, 11.0, 5.0, 9.0, 4.0, 6.0, 11.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014644205570220947, -0.014194274321198463, -0.01374434307217598, -0.013294411823153496, -0.012844480574131012, -0.012394549325108528, -0.011944618076086044, -0.01149468682706356, -0.011044755578041077, -0.010594824329018593, -0.010144893079996109, -0.009694961830973625, -0.009245030581951141, -0.008795099332928658, -0.008345168083906174, -0.00789523683488369, -0.007445305585861206, -0.006995374336838722, -0.006545443087816238, -0.006095511838793755, -0.005645580589771271, -0.005195649340748787, -0.004745718091726303, -0.004295786842703819, -0.0038458555936813354, -0.0033959243446588516, -0.002945993095636368, -0.002496061846613884, -0.0020461305975914, -0.0015961993485689163, -0.0011462680995464325, -0.0006963368505239487, -0.00024640560150146484, 0.00020352564752101898, 0.0006534568965435028, 0.0011033881455659866, 0.0015533193945884705, 0.0020032506436109543, 0.002453181892633438, 0.002903113141655922, 0.0033530443906784058, 0.0038029756397008896, 0.004252906888723373, 0.004702838137745857, 0.005152769386768341, 0.005602700635790825, 0.006052631884813309, 0.0065025631338357925, 0.006952494382858276, 0.00740242563188076, 0.007852356880903244, 0.008302288129925728, 0.008752219378948212, 0.009202150627970695, 0.00965208187699318, 0.010102013126015663, 0.010551944375038147, 0.01100187562406063, 0.011451806873083115, 0.011901738122105598, 0.012351669371128082, 0.012801600620150566, 0.01325153186917305, 0.013701463118195534, 0.014151394367218018]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 16.0, 15.0, 32.0, 75.0, 113.0, 270.0, 578.0, 1235.0, 2622.0, 6667.0, 21208.0, 88121.0, 3928760.0, 107876.0, 22585.0, 7630.0, 3004.0, 1344.0, 738.0, 429.0, 311.0, 178.0, 138.0, 109.0, 58.0, 42.0, 34.0, 29.0, 14.0, 11.0, 5.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00024199485778808594, -0.0002317279577255249, -0.00022146105766296387, -0.00021119415760040283, -0.0002009272575378418, -0.00019066035747528076, -0.00018039345741271973, -0.0001701265573501587, -0.00015985965728759766, -0.00014959275722503662, -0.00013932585716247559, -0.00012905895709991455, -0.00011879205703735352, -0.00010852515697479248, -9.825825691223145e-05, -8.799135684967041e-05, -7.772445678710938e-05, -6.745755672454834e-05, -5.7190656661987305e-05, -4.692375659942627e-05, -3.6656856536865234e-05, -2.63899564743042e-05, -1.6123056411743164e-05, -5.856156349182129e-06, 4.410743713378906e-06, 1.4677643775939941e-05, 2.4944543838500977e-05, 3.521144390106201e-05, 4.547834396362305e-05, 5.574524402618408e-05, 6.601214408874512e-05, 7.627904415130615e-05, 8.654594421386719e-05, 9.681284427642822e-05, 0.00010707974433898926, 0.00011734664440155029, 0.00012761354446411133, 0.00013788044452667236, 0.0001481473445892334, 0.00015841424465179443, 0.00016868114471435547, 0.0001789480447769165, 0.00018921494483947754, 0.00019948184490203857, 0.0002097487449645996, 0.00022001564502716064, 0.00023028254508972168, 0.00024054944515228271, 0.00025081634521484375, 0.0002610832452774048, 0.0002713501453399658, 0.00028161704540252686, 0.0002918839454650879, 0.0003021508455276489, 0.00031241774559020996, 0.000322684645652771, 0.00033295154571533203, 0.00034321844577789307, 0.0003534853458404541, 0.00036375224590301514, 0.00037401914596557617, 0.0003842860460281372, 0.00039455294609069824, 0.0004048198461532593, 0.0004150867462158203]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 8.0, 9.0, 14.0, 21.0, 30.0, 30.0, 49.0, 67.0, 81.0, 130.0, 137.0, 130.0, 84.0, 59.0, 43.0, 26.0, 21.0, 14.0, 10.0, 8.0, 11.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2495554983615875e-05, -1.1937692761421204e-05, -1.1379830539226532e-05, -1.082196831703186e-05, -1.0264106094837189e-05, -9.706243872642517e-06, -9.148381650447845e-06, -8.590519428253174e-06, -8.032657206058502e-06, -7.4747949838638306e-06, -6.916932761669159e-06, -6.359070539474487e-06, -5.801208317279816e-06, -5.243346095085144e-06, -4.685483872890472e-06, -4.127621650695801e-06, -3.569759428501129e-06, -3.0118972063064575e-06, -2.454034984111786e-06, -1.8961727619171143e-06, -1.3383105397224426e-06, -7.80448317527771e-07, -2.2258609533309937e-07, 3.3527612686157227e-07, 8.931383490562439e-07, 1.4510005712509155e-06, 2.008862793445587e-06, 2.566725015640259e-06, 3.1245872378349304e-06, 3.682449460029602e-06, 4.240311682224274e-06, 4.798173904418945e-06, 5.356036126613617e-06, 5.9138983488082886e-06, 6.47176057100296e-06, 7.029622793197632e-06, 7.5874850153923035e-06, 8.145347237586975e-06, 8.703209459781647e-06, 9.261071681976318e-06, 9.81893390417099e-06, 1.0376796126365662e-05, 1.0934658348560333e-05, 1.1492520570755005e-05, 1.2050382792949677e-05, 1.2608245015144348e-05, 1.316610723733902e-05, 1.3723969459533691e-05, 1.4281831681728363e-05, 1.4839693903923035e-05, 1.5397556126117706e-05, 1.5955418348312378e-05, 1.651328057050705e-05, 1.707114279270172e-05, 1.7629005014896393e-05, 1.8186867237091064e-05, 1.8744729459285736e-05, 1.9302591681480408e-05, 1.986045390367508e-05, 2.041831612586975e-05, 2.0976178348064423e-05, 2.1534040570259094e-05, 2.2091902792453766e-05, 2.2649765014648438e-05]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 7.0, 8.0, 25.0, 27.0, 47.0, 99.0, 175.0, 527.0, 1430.0, 5334.0, 23879.0, 198091.0, 3873905.0, 74218.0, 12133.0, 2811.0, 745.0, 295.0, 133.0, 94.0, 50.0, 49.0, 45.0, 25.0, 28.0, 29.0, 24.0, 10.0, 12.0, 6.0, 9.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.83936882019043e-05, -8.29668715596199e-05, -7.754005491733551e-05, -7.211323827505112e-05, -6.668642163276672e-05, -6.125960499048233e-05, -5.583278834819794e-05, -5.0405971705913544e-05, -4.497915506362915e-05, -3.955233842134476e-05, -3.4125521779060364e-05, -2.869870513677597e-05, -2.3271888494491577e-05, -1.7845071852207184e-05, -1.241825520992279e-05, -6.991438567638397e-06, -1.564621925354004e-06, 3.862194716930389e-06, 9.289011359214783e-06, 1.4715828001499176e-05, 2.014264464378357e-05, 2.5569461286067963e-05, 3.0996277928352356e-05, 3.642309457063675e-05, 4.184991121292114e-05, 4.7276727855205536e-05, 5.270354449748993e-05, 5.813036113977432e-05, 6.355717778205872e-05, 6.898399442434311e-05, 7.44108110666275e-05, 7.98376277089119e-05, 8.526444435119629e-05, 9.069126099348068e-05, 9.611807763576508e-05, 0.00010154489427804947, 0.00010697171092033386, 0.00011239852756261826, 0.00011782534420490265, 0.00012325216084718704, 0.00012867897748947144, 0.00013410579413175583, 0.00013953261077404022, 0.00014495942741632462, 0.000150386244058609, 0.0001558130607008934, 0.0001612398773431778, 0.0001666666939854622, 0.00017209351062774658, 0.00017752032727003098, 0.00018294714391231537, 0.00018837396055459976, 0.00019380077719688416, 0.00019922759383916855, 0.00020465441048145294, 0.00021008122712373734, 0.00021550804376602173, 0.00022093486040830612, 0.00022636167705059052, 0.0002317884936928749, 0.0002372153103351593, 0.0002426421269774437, 0.0002480689436197281, 0.0002534957602620125, 0.0002589225769042969]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 6.0, 8.0, 13.0, 10.0, 26.0, 26.0, 21.0, 32.0, 30.0, 46.0, 45.0, 38.0, 55.0, 58.0, 56.0, 81.0, 109.0, 329.0, 2057.0, 590.0, 138.0, 79.0, 74.0, 38.0, 27.0, 20.0, 22.0, 9.0, 6.0, 10.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.598234176635742e-05, -6.457231938838959e-05, -6.316229701042175e-05, -6.175227463245392e-05, -6.0342252254486084e-05, -5.893222987651825e-05, -5.7522207498550415e-05, -5.611218512058258e-05, -5.4702162742614746e-05, -5.329214036464691e-05, -5.188211798667908e-05, -5.047209560871124e-05, -4.906207323074341e-05, -4.7652050852775574e-05, -4.624202847480774e-05, -4.4832006096839905e-05, -4.342198371887207e-05, -4.2011961340904236e-05, -4.06019389629364e-05, -3.919191658496857e-05, -3.778189420700073e-05, -3.63718718290329e-05, -3.4961849451065063e-05, -3.355182707309723e-05, -3.2141804695129395e-05, -3.073178231716156e-05, -2.9321759939193726e-05, -2.791173756122589e-05, -2.6501715183258057e-05, -2.5091692805290222e-05, -2.3681670427322388e-05, -2.2271648049354553e-05, -2.086162567138672e-05, -1.9451603293418884e-05, -1.804158091545105e-05, -1.6631558537483215e-05, -1.5221536159515381e-05, -1.3811513781547546e-05, -1.2401491403579712e-05, -1.0991469025611877e-05, -9.581446647644043e-06, -8.171424269676208e-06, -6.761401891708374e-06, -5.3513795137405396e-06, -3.941357135772705e-06, -2.5313347578048706e-06, -1.1213123798370361e-06, 2.8870999813079834e-07, 1.6987323760986328e-06, 3.1087547540664673e-06, 4.518777132034302e-06, 5.928799510002136e-06, 7.338821887969971e-06, 8.748844265937805e-06, 1.015886664390564e-05, 1.1568889021873474e-05, 1.2978911399841309e-05, 1.4388933777809143e-05, 1.5798956155776978e-05, 1.7208978533744812e-05, 1.8619000911712646e-05, 2.002902328968048e-05, 2.1439045667648315e-05, 2.284906804561615e-05, 2.4259090423583984e-05]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 37.0, 295.0, 622.0, 54.0, 5.0], "bins": [-0.012877784669399261, -0.012667235918343067, -0.012456687167286873, -0.012246138416230679, -0.012035589665174484, -0.01182504091411829, -0.011614492163062096, -0.011403942480683327, -0.011193393729627132, -0.010982844978570938, -0.010772296227514744, -0.01056174747645855, -0.010351198725402355, -0.010140649974346161, -0.009930100291967392, -0.009719552472233772, -0.009509003721177578, -0.009298454970121384, -0.00908790621906519, -0.008877357468008995, -0.0086668087169528, -0.008456259965896606, -0.008245710283517838, -0.008035162463784218, -0.007824612781405449, -0.007614064030349255, -0.00740351527929306, -0.007192966528236866, -0.006982417311519384, -0.00677186856046319, -0.006561319809406996, -0.0063507710583508015, -0.006140222307294607, -0.005929673556238413, -0.0057191248051822186, -0.005508575588464737, -0.005298026837408543, -0.005087478086352348, -0.004876929335296154, -0.00466638058423996, -0.004455831833183765, -0.004245283082127571, -0.004034734331071377, -0.003824185347184539, -0.0036136365961283445, -0.0034030876122415066, -0.0031925388611853123, -0.002981990110129118, -0.0027714408934116364, -0.002560892142355442, -0.002350343158468604, -0.0021397944074124098, -0.0019292456563562155, -0.0017186967888846993, -0.0015081479214131832, -0.001297599170356989, -0.0010870504193007946, -0.0008765016100369394, -0.0006659528007730842, -0.00045540393330156803, -0.0002448551240377128, -3.4306314773857594e-05, 0.00017624255269765854, 0.00038679130375385284, 0.000597340171225369]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 10.0, 6.0, 18.0, 29.0, 38.0, 39.0, 51.0, 50.0, 62.0, 51.0, 68.0, 66.0, 67.0, 69.0, 58.0, 60.0, 49.0, 48.0, 42.0, 38.0, 26.0, 18.0, 10.0, 8.0, 8.0, 0.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001138925552368164, -0.0011098375543951988, -0.0010807495564222336, -0.0010516615584492683, -0.001022573560476303, -0.0009934855625033379, -0.0009643975645303726, -0.0009353095665574074, -0.0009062215685844421, -0.0008771335706114769, -0.0008480455726385117, -0.0008189575746655464, -0.0007898695766925812, -0.0007607815787196159, -0.0007316935807466507, -0.0007026055827736855, -0.0006735175848007202, -0.000644429586827755, -0.0006153415888547897, -0.0005862535908818245, -0.0005571655929088593, -0.000528077594935894, -0.0004989895969629288, -0.00046990159898996353, -0.0004408136010169983, -0.00041172560304403305, -0.0003826376050710678, -0.00035354960709810257, -0.00032446160912513733, -0.0002953736111521721, -0.00026628561317920685, -0.0002371976152062416, -0.00020810961723327637, -0.00017902161926031113, -0.00014993362128734589, -0.00012084562331438065, -9.17576253414154e-05, -6.266962736845016e-05, -3.3581629395484924e-05, -4.493631422519684e-06, 2.4594366550445557e-05, 5.36823645234108e-05, 8.277036249637604e-05, 0.00011185836046934128, 0.00014094635844230652, 0.00017003435641527176, 0.000199122354388237, 0.00022821035236120224, 0.0002572983503341675, 0.0002863863483071327, 0.00031547434628009796, 0.0003445623442530632, 0.00037365034222602844, 0.0004027383401989937, 0.0004318263381719589, 0.00046091433614492416, 0.0004900023341178894, 0.0005190903320908546, 0.0005481783300638199, 0.0005772663280367851, 0.0006063543260097504, 0.0006354423239827156, 0.0006645303219556808, 0.0006936183199286461, 0.0007227063179016113]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 12.0, 14.0, 9.0, 19.0, 16.0, 20.0, 59.0, 82.0, 138.0, 207.0, 324.0, 580.0, 1166.0, 2408.0, 6487.0, 23937.0, 217109.0, 740107.0, 39996.0, 9100.0, 3292.0, 1516.0, 770.0, 412.0, 250.0, 176.0, 98.0, 72.0, 46.0, 34.0, 23.0, 13.0, 13.0, 12.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004649162292480469, -0.00045304372906684875, -0.00044117122888565063, -0.0004292987287044525, -0.0004174262285232544, -0.0004055537283420563, -0.00039368122816085815, -0.00038180872797966003, -0.0003699362277984619, -0.0003580637276172638, -0.0003461912274360657, -0.00033431872725486755, -0.00032244622707366943, -0.0003105737268924713, -0.0002987012267112732, -0.0002868287265300751, -0.00027495622634887695, -0.00026308372616767883, -0.0002512112259864807, -0.0002393387258052826, -0.00022746622562408447, -0.00021559372544288635, -0.00020372122526168823, -0.0001918487250804901, -0.000179976224899292, -0.00016810372471809387, -0.00015623122453689575, -0.00014435872435569763, -0.0001324862241744995, -0.00012061372399330139, -0.00010874122381210327, -9.686872363090515e-05, -8.499622344970703e-05, -7.312372326850891e-05, -6.125122308731079e-05, -4.937872290611267e-05, -3.750622272491455e-05, -2.563372254371643e-05, -1.376122236251831e-05, -1.8887221813201904e-06, 9.98377799987793e-06, 2.185627818107605e-05, 3.372877836227417e-05, 4.560127854347229e-05, 5.747377872467041e-05, 6.934627890586853e-05, 8.121877908706665e-05, 9.309127926826477e-05, 0.00010496377944946289, 0.00011683627963066101, 0.00012870877981185913, 0.00014058127999305725, 0.00015245378017425537, 0.0001643262803554535, 0.0001761987805366516, 0.00018807128071784973, 0.00019994378089904785, 0.00021181628108024597, 0.0002236887812614441, 0.0002355612814426422, 0.00024743378162384033, 0.00025930628180503845, 0.00027117878198623657, 0.0002830512821674347, 0.0002949237823486328]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 7.0, 10.0, 16.0, 14.0, 18.0, 24.0, 39.0, 38.0, 76.0, 91.0, 99.0, 113.0, 131.0, 86.0, 75.0, 31.0, 39.0, 17.0, 16.0, 9.0, 10.0, 12.0, 9.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0609626770019531e-05, -1.0116957128047943e-05, -9.624287486076355e-06, -9.131617844104767e-06, -8.638948202133179e-06, -8.14627856016159e-06, -7.653608918190002e-06, -7.160939276218414e-06, -6.668269634246826e-06, -6.175599992275238e-06, -5.68293035030365e-06, -5.190260708332062e-06, -4.697591066360474e-06, -4.2049214243888855e-06, -3.7122517824172974e-06, -3.2195821404457092e-06, -2.726912498474121e-06, -2.234242856502533e-06, -1.7415732145309448e-06, -1.2489035725593567e-06, -7.562339305877686e-07, -2.635642886161804e-07, 2.2910535335540771e-07, 7.217749953269958e-07, 1.214444637298584e-06, 1.7071142792701721e-06, 2.1997839212417603e-06, 2.6924535632133484e-06, 3.1851232051849365e-06, 3.6777928471565247e-06, 4.170462489128113e-06, 4.663132131099701e-06, 5.155801773071289e-06, 5.648471415042877e-06, 6.141141057014465e-06, 6.6338106989860535e-06, 7.126480340957642e-06, 7.61914998292923e-06, 8.111819624900818e-06, 8.604489266872406e-06, 9.097158908843994e-06, 9.589828550815582e-06, 1.008249819278717e-05, 1.0575167834758759e-05, 1.1067837476730347e-05, 1.1560507118701935e-05, 1.2053176760673523e-05, 1.2545846402645111e-05, 1.30385160446167e-05, 1.3531185686588287e-05, 1.4023855328559875e-05, 1.4516524970531464e-05, 1.5009194612503052e-05, 1.550186425447464e-05, 1.5994533896446228e-05, 1.6487203538417816e-05, 1.6979873180389404e-05, 1.7472542822360992e-05, 1.796521246433258e-05, 1.845788210630417e-05, 1.8950551748275757e-05, 1.9443221390247345e-05, 1.9935891032218933e-05, 2.042856067419052e-05, 2.092123031616211e-05]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 12.0, 14.0, 12.0, 15.0, 37.0, 49.0, 65.0, 86.0, 119.0, 203.0, 298.0, 396.0, 642.0, 1029.0, 1740.0, 2964.0, 5177.0, 9187.0, 17679.0, 39275.0, 103831.0, 523896.0, 218035.0, 65685.0, 27705.0, 13201.0, 7078.0, 3925.0, 2347.0, 1378.0, 867.0, 514.0, 340.0, 240.0, 162.0, 96.0, 79.0, 63.0, 29.0, 22.0, 17.0, 13.0, 11.0, 10.0, 8.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.316205978393555e-05, -9.013526141643524e-05, -8.710846304893494e-05, -8.408166468143463e-05, -8.105486631393433e-05, -7.802806794643402e-05, -7.500126957893372e-05, -7.197447121143341e-05, -6.89476728439331e-05, -6.59208744764328e-05, -6.28940761089325e-05, -5.986727774143219e-05, -5.6840479373931885e-05, -5.381368100643158e-05, -5.0786882638931274e-05, -4.776008427143097e-05, -4.4733285903930664e-05, -4.170648753643036e-05, -3.8679689168930054e-05, -3.565289080142975e-05, -3.262609243392944e-05, -2.9599294066429138e-05, -2.6572495698928833e-05, -2.3545697331428528e-05, -2.0518898963928223e-05, -1.7492100596427917e-05, -1.4465302228927612e-05, -1.1438503861427307e-05, -8.411705493927002e-06, -5.384907126426697e-06, -2.3581087589263916e-06, 6.686896085739136e-07, 3.6954879760742188e-06, 6.722286343574524e-06, 9.749084711074829e-06, 1.2775883078575134e-05, 1.580268144607544e-05, 1.8829479813575745e-05, 2.185627818107605e-05, 2.4883076548576355e-05, 2.790987491607666e-05, 3.0936673283576965e-05, 3.396347165107727e-05, 3.6990270018577576e-05, 4.001706838607788e-05, 4.3043866753578186e-05, 4.607066512107849e-05, 4.9097463488578796e-05, 5.21242618560791e-05, 5.515106022357941e-05, 5.817785859107971e-05, 6.120465695858002e-05, 6.423145532608032e-05, 6.725825369358063e-05, 7.028505206108093e-05, 7.331185042858124e-05, 7.633864879608154e-05, 7.936544716358185e-05, 8.239224553108215e-05, 8.541904389858246e-05, 8.844584226608276e-05, 9.147264063358307e-05, 9.449943900108337e-05, 9.752623736858368e-05, 0.00010055303573608398]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 8.0, 7.0, 5.0, 15.0, 15.0, 23.0, 18.0, 26.0, 26.0, 30.0, 25.0, 48.0, 36.0, 41.0, 61.0, 60.0, 83.0, 43.0, 58.0, 58.0, 46.0, 39.0, 40.0, 32.0, 24.0, 23.0, 20.0, 16.0, 13.0, 12.0, 9.0, 12.0, 6.0, 3.0, 4.0, 0.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6133995056152344e-05, -4.434678703546524e-05, -4.255957901477814e-05, -4.0772370994091034e-05, -3.898516297340393e-05, -3.719795495271683e-05, -3.5410746932029724e-05, -3.362353891134262e-05, -3.183633089065552e-05, -3.0049122869968414e-05, -2.826191484928131e-05, -2.6474706828594208e-05, -2.4687498807907104e-05, -2.290029078722e-05, -2.1113082766532898e-05, -1.9325874745845795e-05, -1.753866672515869e-05, -1.5751458704471588e-05, -1.3964250683784485e-05, -1.2177042663097382e-05, -1.0389834642410278e-05, -8.602626621723175e-06, -6.815418601036072e-06, -5.0282105803489685e-06, -3.2410025596618652e-06, -1.453794538974762e-06, 3.334134817123413e-07, 2.1206215023994446e-06, 3.907829523086548e-06, 5.695037543773651e-06, 7.482245564460754e-06, 9.269453585147858e-06, 1.1056661605834961e-05, 1.2843869626522064e-05, 1.4631077647209167e-05, 1.641828566789627e-05, 1.8205493688583374e-05, 1.9992701709270477e-05, 2.177990972995758e-05, 2.3567117750644684e-05, 2.5354325771331787e-05, 2.714153379201889e-05, 2.8928741812705994e-05, 3.07159498333931e-05, 3.25031578540802e-05, 3.4290365874767303e-05, 3.607757389545441e-05, 3.786478191614151e-05, 3.965198993682861e-05, 4.1439197957515717e-05, 4.322640597820282e-05, 4.501361399888992e-05, 4.6800822019577026e-05, 4.858803004026413e-05, 5.037523806095123e-05, 5.2162446081638336e-05, 5.394965410232544e-05, 5.573686212301254e-05, 5.7524070143699646e-05, 5.931127816438675e-05, 6.109848618507385e-05, 6.288569420576096e-05, 6.467290222644806e-05, 6.646011024713516e-05, 6.824731826782227e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 6.0, 10.0, 14.0, 25.0, 34.0, 36.0, 72.0, 97.0, 175.0, 231.0, 508.0, 967.0, 1990.0, 4257.0, 10529.0, 1004324.0, 14991.0, 5331.0, 2385.0, 1153.0, 667.0, 288.0, 186.0, 84.0, 55.0, 37.0, 26.0, 13.0, 18.0, 9.0, 7.0, 2.0, 5.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011816024780273438, -0.001145392656326294, -0.0011091828346252441, -0.0010729730129241943, -0.0010367631912231445, -0.0010005533695220947, -0.0009643435478210449, -0.0009281337261199951, -0.0008919239044189453, -0.0008557140827178955, -0.0008195042610168457, -0.0007832944393157959, -0.0007470846176147461, -0.0007108747959136963, -0.0006746649742126465, -0.0006384551525115967, -0.0006022453308105469, -0.0005660355091094971, -0.0005298256874084473, -0.0004936158657073975, -0.00045740604400634766, -0.00042119622230529785, -0.00038498640060424805, -0.00034877657890319824, -0.00031256675720214844, -0.00027635693550109863, -0.00024014711380004883, -0.00020393729209899902, -0.00016772747039794922, -0.00013151764869689941, -9.530782699584961e-05, -5.9098005294799805e-05, -2.288818359375e-05, 1.3321638107299805e-05, 4.953145980834961e-05, 8.574128150939941e-05, 0.00012195110321044922, 0.00015816092491149902, 0.00019437074661254883, 0.00023058056831359863, 0.00026679039001464844, 0.00030300021171569824, 0.00033921003341674805, 0.00037541985511779785, 0.00041162967681884766, 0.00044783949851989746, 0.00048404932022094727, 0.0005202591419219971, 0.0005564689636230469, 0.0005926787853240967, 0.0006288886070251465, 0.0006650984287261963, 0.0007013082504272461, 0.0007375180721282959, 0.0007737278938293457, 0.0008099377155303955, 0.0008461475372314453, 0.0008823573589324951, 0.0009185671806335449, 0.0009547770023345947, 0.0009909868240356445, 0.0010271966457366943, 0.0010634064674377441, 0.001099616289138794, 0.0011358261108398438]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 9.0, 7.0, 9.0, 11.0, 14.0, 10.0, 11.0, 33.0, 79.0, 101.0, 175.0, 168.0, 142.0, 66.0, 40.0, 16.0, 8.0, 9.0, 15.0, 7.0, 7.0, 9.0, 4.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.357929229736328e-06, -9.074807167053223e-06, -8.791685104370117e-06, -8.508563041687012e-06, -8.225440979003906e-06, -7.9423189163208e-06, -7.659196853637695e-06, -7.37607479095459e-06, -7.092952728271484e-06, -6.809830665588379e-06, -6.5267086029052734e-06, -6.243586540222168e-06, -5.9604644775390625e-06, -5.677342414855957e-06, -5.3942203521728516e-06, -5.111098289489746e-06, -4.827976226806641e-06, -4.544854164123535e-06, -4.26173210144043e-06, -3.978610038757324e-06, -3.6954879760742188e-06, -3.4123659133911133e-06, -3.129243850708008e-06, -2.8461217880249023e-06, -2.562999725341797e-06, -2.2798776626586914e-06, -1.996755599975586e-06, -1.7136335372924805e-06, -1.430511474609375e-06, -1.1473894119262695e-06, -8.642673492431641e-07, -5.811452865600586e-07, -2.980232238769531e-07, -1.4901161193847656e-08, 2.682209014892578e-07, 5.513429641723633e-07, 8.344650268554688e-07, 1.1175870895385742e-06, 1.4007091522216797e-06, 1.6838312149047852e-06, 1.9669532775878906e-06, 2.250075340270996e-06, 2.5331974029541016e-06, 2.816319465637207e-06, 3.0994415283203125e-06, 3.382563591003418e-06, 3.6656856536865234e-06, 3.948807716369629e-06, 4.231929779052734e-06, 4.51505184173584e-06, 4.798173904418945e-06, 5.081295967102051e-06, 5.364418029785156e-06, 5.647540092468262e-06, 5.930662155151367e-06, 6.213784217834473e-06, 6.496906280517578e-06, 6.780028343200684e-06, 7.063150405883789e-06, 7.3462724685668945e-06, 7.62939453125e-06, 7.912516593933105e-06, 8.195638656616211e-06, 8.478760719299316e-06, 8.761882781982422e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 16.0, 12.0, 20.0, 20.0, 30.0, 34.0, 53.0, 80.0, 99.0, 163.0, 188.0, 237.0, 380.0, 569.0, 757.0, 1265.0, 1925.0, 3391.0, 8252.0, 95008.0, 911695.0, 13507.0, 4190.0, 2263.0, 1356.0, 943.0, 635.0, 386.0, 277.0, 217.0, 129.0, 110.0, 90.0, 79.0, 41.0, 37.0, 17.0, 24.0, 12.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.226799011230469e-05, -8.910335600376129e-05, -8.59387218952179e-05, -8.27740877866745e-05, -7.96094536781311e-05, -7.644481956958771e-05, -7.328018546104431e-05, -7.011555135250092e-05, -6.695091724395752e-05, -6.378628313541412e-05, -6.062164902687073e-05, -5.745701491832733e-05, -5.4292380809783936e-05, -5.112774670124054e-05, -4.7963112592697144e-05, -4.479847848415375e-05, -4.163384437561035e-05, -3.8469210267066956e-05, -3.530457615852356e-05, -3.2139942049980164e-05, -2.8975307941436768e-05, -2.581067383289337e-05, -2.2646039724349976e-05, -1.948140561580658e-05, -1.6316771507263184e-05, -1.3152137398719788e-05, -9.987503290176392e-06, -6.822869181632996e-06, -3.6582350730895996e-06, -4.936009645462036e-07, 2.6710331439971924e-06, 5.835667252540588e-06, 9.000301361083984e-06, 1.216493546962738e-05, 1.5329569578170776e-05, 1.8494203686714172e-05, 2.165883779525757e-05, 2.4823471903800964e-05, 2.798810601234436e-05, 3.1152740120887756e-05, 3.431737422943115e-05, 3.748200833797455e-05, 4.0646642446517944e-05, 4.381127655506134e-05, 4.6975910663604736e-05, 5.014054477214813e-05, 5.330517888069153e-05, 5.6469812989234924e-05, 5.963444709777832e-05, 6.279908120632172e-05, 6.596371531486511e-05, 6.912834942340851e-05, 7.22929835319519e-05, 7.54576176404953e-05, 7.86222517490387e-05, 8.178688585758209e-05, 8.495151996612549e-05, 8.811615407466888e-05, 9.128078818321228e-05, 9.444542229175568e-05, 9.761005640029907e-05, 0.00010077469050884247, 0.00010393932461738586, 0.00010710395872592926, 0.00011026859283447266]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 5.0, 19.0, 67.0, 200.0, 581.0, 71.0, 23.0, 7.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.783008575439453e-05, -6.550364196300507e-05, -6.31771981716156e-05, -6.0850754380226135e-05, -5.852431058883667e-05, -5.6197866797447205e-05, -5.387142300605774e-05, -5.1544979214668274e-05, -4.921853542327881e-05, -4.689209163188934e-05, -4.456564784049988e-05, -4.223920404911041e-05, -3.991276025772095e-05, -3.758631646633148e-05, -3.5259872674942017e-05, -3.293342888355255e-05, -3.0606985092163086e-05, -2.828054130077362e-05, -2.5954097509384155e-05, -2.362765371799469e-05, -2.1301209926605225e-05, -1.897476613521576e-05, -1.6648322343826294e-05, -1.4321878552436829e-05, -1.1995434761047363e-05, -9.668990969657898e-06, -7.342547178268433e-06, -5.016103386878967e-06, -2.689659595489502e-06, -3.632158041000366e-07, 1.9632279872894287e-06, 4.289671778678894e-06, 6.616115570068359e-06, 8.942559361457825e-06, 1.126900315284729e-05, 1.3595446944236755e-05, 1.592189073562622e-05, 1.8248334527015686e-05, 2.057477831840515e-05, 2.2901222109794617e-05, 2.5227665901184082e-05, 2.7554109692573547e-05, 2.9880553483963013e-05, 3.220699727535248e-05, 3.453344106674194e-05, 3.685988485813141e-05, 3.9186328649520874e-05, 4.151277244091034e-05, 4.3839216232299805e-05, 4.616566002368927e-05, 4.8492103815078735e-05, 5.08185476064682e-05, 5.3144991397857666e-05, 5.547143518924713e-05, 5.77978789806366e-05, 6.012432277202606e-05, 6.245076656341553e-05, 6.477721035480499e-05, 6.710365414619446e-05, 6.943009793758392e-05, 7.175654172897339e-05, 7.408298552036285e-05, 7.640942931175232e-05, 7.873587310314178e-05, 8.106231689453125e-05]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 20.0, 24.0, 31.0, 46.0, 50.0, 71.0, 127.0, 156.0, 186.0, 101.0, 63.0, 31.0, 21.0, 14.0, 9.0, 7.0, 6.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025740095879882574, -0.0024893530644476414, -0.002404696773737669, -0.002320040250197053, -0.002235383726656437, -0.002150727203115821, -0.002066070679575205, -0.0019814143888652325, -0.0018967578653246164, -0.0018121013417840004, -0.0017274449346587062, -0.001642788527533412, -0.001558132003992796, -0.00147347548045218, -0.0013888190733268857, -0.0013041626662015915, -0.0012195061426609755, -0.0011348496191203594, -0.0010501932119950652, -0.0009655367466621101, -0.000880880281329155, -0.0007962238159961998, -0.0007115673506632447, -0.0006269108853302896, -0.0005422544199973345, -0.00045759795466437936, -0.00037294148933142424, -0.0002882850239984691, -0.000203628558665514, -0.00011897209333255887, -3.431562799960375e-05, 5.0340837333351374e-05, 0.00013499753549695015, 0.00021965400082990527, 0.0003043104661628604, 0.0003889669314958155, 0.00047362339682877064, 0.0005582798621617258, 0.0006429363274946809, 0.000727592792827636, 0.0008122492581605911, 0.0008969057234935462, 0.0009815621888265014, 0.0010662185959517956, 0.0011508751194924116, 0.0012355316430330276, 0.0013201880501583219, 0.001404844457283616, 0.001489500980824232, 0.0015741575043648481, 0.0016588139114901423, 0.0017434703186154366, 0.0018281268421560526, 0.0019127833656966686, 0.001997439656406641, 0.002082096179947257, 0.002166752703487873, 0.002251409227028489, 0.002336065750569105, 0.0024207220412790775, 0.0025053785648196936, 0.0025900350883603096, 0.002674691379070282, 0.002759347902610898, 0.002844004426151514]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 7.0, 12.0, 12.0, 18.0, 23.0, 21.0, 23.0, 24.0, 24.0, 23.0, 30.0, 22.0, 29.0, 29.0, 24.0, 35.0, 32.0, 28.0, 17.0, 24.0, 30.0, 24.0, 24.0, 31.0, 27.0, 43.0, 25.0, 28.0, 23.0, 34.0, 25.0, 36.0, 20.0, 19.0, 21.0, 18.0, 19.0, 22.0, 16.0, 12.0, 15.0, 10.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.000493168830871582, -0.0004785340279340744, -0.00046389922499656677, -0.00044926442205905914, -0.0004346296191215515, -0.0004199948161840439, -0.00040536001324653625, -0.0003907252103090286, -0.000376090407371521, -0.00036145560443401337, -0.00034682080149650574, -0.0003321859985589981, -0.0003175511956214905, -0.00030291639268398285, -0.0002882815897464752, -0.0002736467868089676, -0.00025901198387145996, -0.00024437718093395233, -0.0002297423779964447, -0.00021510757505893707, -0.00020047277212142944, -0.00018583796918392181, -0.00017120316624641418, -0.00015656836330890656, -0.00014193356037139893, -0.0001272987574338913, -0.00011266395449638367, -9.802915155887604e-05, -8.339434862136841e-05, -6.875954568386078e-05, -5.412474274635315e-05, -3.948993980884552e-05, -2.485513687133789e-05, -1.0220333933830261e-05, 4.414469003677368e-06, 1.9049271941184998e-05, 3.368407487869263e-05, 4.8318877816200256e-05, 6.295368075370789e-05, 7.758848369121552e-05, 9.222328662872314e-05, 0.00010685808956623077, 0.0001214928925037384, 0.00013612769544124603, 0.00015076249837875366, 0.0001653973013162613, 0.00018003210425376892, 0.00019466690719127655, 0.00020930171012878418, 0.0002239365130662918, 0.00023857131600379944, 0.00025320611894130707, 0.0002678409218788147, 0.0002824757248163223, 0.00029711052775382996, 0.0003117453306913376, 0.0003263801336288452, 0.00034101493656635284, 0.0003556497395038605, 0.0003702845424413681, 0.00038491934537887573, 0.00039955414831638336, 0.000414188951253891, 0.0004288237541913986, 0.00044345855712890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 11.0, 17.0, 19.0, 46.0, 96.0, 325.0, 1180.0, 8011.0, 255423.0, 3913558.0, 12531.0, 1913.0, 601.0, 275.0, 110.0, 65.0, 37.0, 18.0, 13.0, 9.0, 4.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007367134094238281, -0.0007033571600914001, -0.0006700009107589722, -0.0006366446614265442, -0.0006032884120941162, -0.0005699321627616882, -0.0005365759134292603, -0.0005032196640968323, -0.0004698634147644043, -0.0004365071654319763, -0.00040315091609954834, -0.00036979466676712036, -0.0003364384174346924, -0.0003030821681022644, -0.0002697259187698364, -0.00023636966943740845, -0.00020301342010498047, -0.0001696571707725525, -0.0001363009214401245, -0.00010294467210769653, -6.958842277526855e-05, -3.6232173442840576e-05, -2.8759241104125977e-06, 3.048032522201538e-05, 6.383657455444336e-05, 9.719282388687134e-05, 0.00013054907321929932, 0.0001639053225517273, 0.00019726157188415527, 0.00023061782121658325, 0.00026397407054901123, 0.0002973303198814392, 0.0003306865692138672, 0.00036404281854629517, 0.00039739906787872314, 0.0004307553172111511, 0.0004641115665435791, 0.0004974678158760071, 0.0005308240652084351, 0.000564180314540863, 0.000597536563873291, 0.000630892813205719, 0.000664249062538147, 0.000697605311870575, 0.0007309615612030029, 0.0007643178105354309, 0.0007976740598678589, 0.0008310303092002869, 0.0008643865585327148, 0.0008977428078651428, 0.0009310990571975708, 0.0009644553065299988, 0.0009978115558624268, 0.0010311678051948547, 0.0010645240545272827, 0.0010978803038597107, 0.0011312365531921387, 0.0011645928025245667, 0.0011979490518569946, 0.0012313053011894226, 0.0012646615505218506, 0.0012980177998542786, 0.0013313740491867065, 0.0013647302985191345, 0.0013980865478515625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 5.0, 11.0, 16.0, 23.0, 35.0, 66.0, 83.0, 120.0, 165.0, 163.0, 112.0, 56.0, 47.0, 43.0, 16.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8596649169921875e-05, -1.7746351659297943e-05, -1.689605414867401e-05, -1.604575663805008e-05, -1.5195459127426147e-05, -1.4345161616802216e-05, -1.3494864106178284e-05, -1.2644566595554352e-05, -1.179426908493042e-05, -1.0943971574306488e-05, -1.0093674063682556e-05, -9.243376553058624e-06, -8.393079042434692e-06, -7.5427815318107605e-06, -6.692484021186829e-06, -5.842186510562897e-06, -4.991888999938965e-06, -4.141591489315033e-06, -3.291293978691101e-06, -2.440996468067169e-06, -1.5906989574432373e-06, -7.404014468193054e-07, 1.0989606380462646e-07, 9.601935744285583e-07, 1.8104910850524902e-06, 2.660788595676422e-06, 3.511086106300354e-06, 4.361383616924286e-06, 5.211681127548218e-06, 6.06197863817215e-06, 6.9122761487960815e-06, 7.762573659420013e-06, 8.612871170043945e-06, 9.463168680667877e-06, 1.0313466191291809e-05, 1.1163763701915741e-05, 1.2014061212539673e-05, 1.2864358723163605e-05, 1.3714656233787537e-05, 1.4564953744411469e-05, 1.54152512550354e-05, 1.6265548765659332e-05, 1.7115846276283264e-05, 1.7966143786907196e-05, 1.8816441297531128e-05, 1.966673880815506e-05, 2.0517036318778992e-05, 2.1367333829402924e-05, 2.2217631340026855e-05, 2.3067928850650787e-05, 2.391822636127472e-05, 2.476852387189865e-05, 2.5618821382522583e-05, 2.6469118893146515e-05, 2.7319416403770447e-05, 2.816971391439438e-05, 2.902001142501831e-05, 2.9870308935642242e-05, 3.0720606446266174e-05, 3.1570903956890106e-05, 3.242120146751404e-05, 3.327149897813797e-05, 3.41217964887619e-05, 3.4972093999385834e-05, 3.5822391510009766e-05]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 4.0, 5.0, 12.0, 21.0, 24.0, 32.0, 77.0, 144.0, 262.0, 531.0, 963.0, 2154.0, 4291.0, 9908.0, 25244.0, 81560.0, 1179580.0, 2757720.0, 86927.0, 26060.0, 10055.0, 4393.0, 2121.0, 1011.0, 540.0, 296.0, 139.0, 62.0, 36.0, 26.0, 29.0, 6.0, 6.0, 7.0, 7.0, 2.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00023829936981201172, -0.000231083482503891, -0.00022386759519577026, -0.00021665170788764954, -0.0002094358205795288, -0.00020221993327140808, -0.00019500404596328735, -0.00018778815865516663, -0.0001805722713470459, -0.00017335638403892517, -0.00016614049673080444, -0.00015892460942268372, -0.000151708722114563, -0.00014449283480644226, -0.00013727694749832153, -0.0001300610601902008, -0.00012284517288208008, -0.00011562928557395935, -0.00010841339826583862, -0.0001011975109577179, -9.398162364959717e-05, -8.676573634147644e-05, -7.954984903335571e-05, -7.233396172523499e-05, -6.511807441711426e-05, -5.790218710899353e-05, -5.06862998008728e-05, -4.3470412492752075e-05, -3.625452518463135e-05, -2.903863787651062e-05, -2.1822750568389893e-05, -1.4606863260269165e-05, -7.3909759521484375e-06, -1.7508864402770996e-07, 7.040798664093018e-06, 1.4256685972213745e-05, 2.1472573280334473e-05, 2.86884605884552e-05, 3.590434789657593e-05, 4.3120235204696655e-05, 5.033612251281738e-05, 5.755200982093811e-05, 6.476789712905884e-05, 7.198378443717957e-05, 7.919967174530029e-05, 8.641555905342102e-05, 9.363144636154175e-05, 0.00010084733366966248, 0.0001080632209777832, 0.00011527910828590393, 0.00012249499559402466, 0.00012971088290214539, 0.0001369267702102661, 0.00014414265751838684, 0.00015135854482650757, 0.0001585744321346283, 0.00016579031944274902, 0.00017300620675086975, 0.00018022209405899048, 0.0001874379813671112, 0.00019465386867523193, 0.00020186975598335266, 0.0002090856432914734, 0.00021630153059959412, 0.00022351741790771484]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 4.0, 7.0, 4.0, 14.0, 9.0, 24.0, 28.0, 42.0, 69.0, 88.0, 595.0, 2218.0, 256.0, 137.0, 100.0, 90.0, 90.0, 62.0, 60.0, 42.0, 32.0, 23.0, 20.0, 14.0, 14.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0], "bins": [-0.0001010894775390625, -9.881891310214996e-05, -9.654834866523743e-05, -9.427778422832489e-05, -9.200721979141235e-05, -8.973665535449982e-05, -8.746609091758728e-05, -8.519552648067474e-05, -8.292496204376221e-05, -8.065439760684967e-05, -7.838383316993713e-05, -7.61132687330246e-05, -7.384270429611206e-05, -7.157213985919952e-05, -6.930157542228699e-05, -6.703101098537445e-05, -6.476044654846191e-05, -6.248988211154938e-05, -6.021931767463684e-05, -5.7948753237724304e-05, -5.567818880081177e-05, -5.340762436389923e-05, -5.1137059926986694e-05, -4.886649549007416e-05, -4.659593105316162e-05, -4.4325366616249084e-05, -4.205480217933655e-05, -3.978423774242401e-05, -3.7513673305511475e-05, -3.524310886859894e-05, -3.29725444316864e-05, -3.0701979994773865e-05, -2.8431415557861328e-05, -2.616085112094879e-05, -2.3890286684036255e-05, -2.1619722247123718e-05, -1.934915781021118e-05, -1.7078593373298645e-05, -1.4808028936386108e-05, -1.2537464499473572e-05, -1.0266900062561035e-05, -7.996335625648499e-06, -5.725771188735962e-06, -3.4552067518234253e-06, -1.1846423149108887e-06, 1.085922122001648e-06, 3.3564865589141846e-06, 5.627050995826721e-06, 7.897615432739258e-06, 1.0168179869651794e-05, 1.2438744306564331e-05, 1.4709308743476868e-05, 1.6979873180389404e-05, 1.925043761730194e-05, 2.1521002054214478e-05, 2.3791566491127014e-05, 2.606213092803955e-05, 2.8332695364952087e-05, 3.0603259801864624e-05, 3.287382423877716e-05, 3.51443886756897e-05, 3.7414953112602234e-05, 3.968551754951477e-05, 4.195608198642731e-05, 4.4226646423339844e-05]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 30.0, 152.0, 600.0, 173.0, 44.0, 13.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005533511284738779, -0.0004520610673353076, -0.00035077103530056775, -0.0002494810032658279, -0.00014819094212725759, -4.690088098868728e-05, 5.438912194222212e-05, 0.00015567918308079243, 0.00025696924421936274, 0.00035825930535793304, 0.0004595493373926729, 0.0005608393694274127, 0.0006621294305659831, 0.0007634194917045534, 0.0008647094946354628, 0.0009659995557740331, 0.0010672896169126034, 0.0011685796780511737, 0.001269869739189744, 0.0013711596839129925, 0.0014724498614668846, 0.001573739806190133, 0.0016750298673287034, 0.0017763199284672737, 0.001877609989605844, 0.0019789000507444143, 0.002080189995467663, 0.002181480173021555, 0.0022827701177448034, 0.0023840602952986956, 0.002485350240021944, 0.002586640417575836, 0.0026879305951297283, 0.002789220539852977, 0.002890510717406869, 0.0029918006621301174, 0.0030930908396840096, 0.003194380784407258, 0.0032956707291305065, 0.0033969609066843987, 0.003498251084238291, 0.0035995410289615393, 0.0037008312065154314, 0.00380212115123868, 0.003903411328792572, 0.004004701506346464, 0.004105991218239069, 0.004207281395792961, 0.004308571107685566, 0.004409861285239458, 0.004511150997132063, 0.004612441174685955, 0.004713731352239847, 0.004815021529793739, 0.004916311241686344, 0.005017601419240236, 0.005118891596794128, 0.0052201817743480206, 0.005321471486240625, 0.0054227616637945175, 0.00552405184134841, 0.005625342018902302, 0.005726631730794907, 0.005827921908348799, 0.005929212085902691]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 10.0, 8.0, 8.0, 11.0, 14.0, 21.0, 22.0, 25.0, 32.0, 30.0, 48.0, 33.0, 48.0, 57.0, 57.0, 40.0, 48.0, 59.0, 47.0, 38.0, 39.0, 47.0, 43.0, 41.0, 38.0, 26.0, 21.0, 21.0, 15.0, 14.0, 12.0, 6.0, 10.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004980564117431641, -0.00048445630818605423, -0.0004708562046289444, -0.00045725610107183456, -0.00044365599751472473, -0.0004300558939576149, -0.00041645579040050507, -0.00040285568684339523, -0.0003892555832862854, -0.00037565547972917557, -0.00036205537617206573, -0.0003484552726149559, -0.00033485516905784607, -0.00032125506550073624, -0.0003076549619436264, -0.00029405485838651657, -0.00028045475482940674, -0.0002668546512722969, -0.00025325454771518707, -0.00023965444415807724, -0.0002260543406009674, -0.00021245423704385757, -0.00019885413348674774, -0.0001852540299296379, -0.00017165392637252808, -0.00015805382281541824, -0.0001444537192583084, -0.00013085361570119858, -0.00011725351214408875, -0.00010365340858697891, -9.005330502986908e-05, -7.645320147275925e-05, -6.285309791564941e-05, -4.925299435853958e-05, -3.565289080142975e-05, -2.2052787244319916e-05, -8.452683687210083e-06, 5.14741986989975e-06, 1.8747523427009583e-05, 3.2347626984119415e-05, 4.594773054122925e-05, 5.954783409833908e-05, 7.314793765544891e-05, 8.674804121255875e-05, 0.00010034814476966858, 0.00011394824832677841, 0.00012754835188388824, 0.00014114845544099808, 0.0001547485589981079, 0.00016834866255521774, 0.00018194876611232758, 0.0001955488696694374, 0.00020914897322654724, 0.00022274907678365707, 0.0002363491803407669, 0.00024994928389787674, 0.00026354938745498657, 0.0002771494910120964, 0.00029074959456920624, 0.00030434969812631607, 0.0003179498016834259, 0.00033154990524053574, 0.00034515000879764557, 0.0003587501123547554, 0.00037235021591186523]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 7.0, 6.0, 10.0, 12.0, 12.0, 19.0, 24.0, 39.0, 27.0, 82.0, 114.0, 172.0, 318.0, 612.0, 1247.0, 2584.0, 6195.0, 16373.0, 55942.0, 432263.0, 448723.0, 56115.0, 16228.0, 6108.0, 2655.0, 1234.0, 604.0, 315.0, 189.0, 116.0, 62.0, 35.0, 29.0, 17.0, 20.0, 9.0, 6.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028586387634277344, -0.00027693063020706177, -0.0002679973840713501, -0.00025906413793563843, -0.00025013089179992676, -0.0002411976456642151, -0.00023226439952850342, -0.00022333115339279175, -0.00021439790725708008, -0.0002054646611213684, -0.00019653141498565674, -0.00018759816884994507, -0.0001786649227142334, -0.00016973167657852173, -0.00016079843044281006, -0.0001518651843070984, -0.00014293193817138672, -0.00013399869203567505, -0.00012506544589996338, -0.00011613219976425171, -0.00010719895362854004, -9.826570749282837e-05, -8.93324613571167e-05, -8.039921522140503e-05, -7.146596908569336e-05, -6.253272294998169e-05, -5.359947681427002e-05, -4.466623067855835e-05, -3.573298454284668e-05, -2.679973840713501e-05, -1.786649227142334e-05, -8.93324613571167e-06, 0.0, 8.93324613571167e-06, 1.786649227142334e-05, 2.679973840713501e-05, 3.573298454284668e-05, 4.466623067855835e-05, 5.359947681427002e-05, 6.253272294998169e-05, 7.146596908569336e-05, 8.039921522140503e-05, 8.93324613571167e-05, 9.826570749282837e-05, 0.00010719895362854004, 0.00011613219976425171, 0.00012506544589996338, 0.00013399869203567505, 0.00014293193817138672, 0.0001518651843070984, 0.00016079843044281006, 0.00016973167657852173, 0.0001786649227142334, 0.00018759816884994507, 0.00019653141498565674, 0.0002054646611213684, 0.00021439790725708008, 0.00022333115339279175, 0.00023226439952850342, 0.0002411976456642151, 0.00025013089179992676, 0.00025906413793563843, 0.0002679973840713501, 0.00027693063020706177, 0.00028586387634277344]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 5.0, 18.0, 18.0, 24.0, 36.0, 43.0, 73.0, 102.0, 117.0, 112.0, 124.0, 101.0, 58.0, 49.0, 29.0, 20.0, 11.0, 16.0, 13.0, 8.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.239776611328125e-05, -1.1721625924110413e-05, -1.1045485734939575e-05, -1.0369345545768738e-05, -9.6932053565979e-06, -9.017065167427063e-06, -8.340924978256226e-06, -7.664784789085388e-06, -6.988644599914551e-06, -6.312504410743713e-06, -5.636364221572876e-06, -4.9602240324020386e-06, -4.284083843231201e-06, -3.6079436540603638e-06, -2.9318034648895264e-06, -2.255663275718689e-06, -1.5795230865478516e-06, -9.033828973770142e-07, -2.2724270820617676e-07, 4.4889748096466064e-07, 1.125037670135498e-06, 1.8011778593063354e-06, 2.477318048477173e-06, 3.1534582376480103e-06, 3.829598426818848e-06, 4.505738615989685e-06, 5.1818788051605225e-06, 5.85801899433136e-06, 6.534159183502197e-06, 7.210299372673035e-06, 7.886439561843872e-06, 8.56257975101471e-06, 9.238719940185547e-06, 9.914860129356384e-06, 1.0591000318527222e-05, 1.1267140507698059e-05, 1.1943280696868896e-05, 1.2619420886039734e-05, 1.3295561075210571e-05, 1.3971701264381409e-05, 1.4647841453552246e-05, 1.5323981642723083e-05, 1.600012183189392e-05, 1.6676262021064758e-05, 1.7352402210235596e-05, 1.8028542399406433e-05, 1.870468258857727e-05, 1.9380822777748108e-05, 2.0056962966918945e-05, 2.0733103156089783e-05, 2.140924334526062e-05, 2.2085383534431458e-05, 2.2761523723602295e-05, 2.3437663912773132e-05, 2.411380410194397e-05, 2.4789944291114807e-05, 2.5466084480285645e-05, 2.6142224669456482e-05, 2.681836485862732e-05, 2.7494505047798157e-05, 2.8170645236968994e-05, 2.884678542613983e-05, 2.952292561531067e-05, 3.0199065804481506e-05, 3.0875205993652344e-05]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 7.0, 15.0, 18.0, 23.0, 28.0, 42.0, 61.0, 77.0, 136.0, 169.0, 260.0, 362.0, 598.0, 1004.0, 1503.0, 2718.0, 4672.0, 8749.0, 17790.0, 40270.0, 116271.0, 545894.0, 200835.0, 57545.0, 23875.0, 11311.0, 5890.0, 3184.0, 1895.0, 1156.0, 731.0, 473.0, 300.0, 217.0, 120.0, 92.0, 75.0, 54.0, 35.0, 25.0, 23.0, 11.0, 10.0, 4.0, 3.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.00014519691467285156, -0.0001406148076057434, -0.00013603270053863525, -0.0001314505934715271, -0.00012686848640441895, -0.0001222863793373108, -0.00011770427227020264, -0.00011312216520309448, -0.00010854005813598633, -0.00010395795106887817, -9.937584400177002e-05, -9.479373693466187e-05, -9.021162986755371e-05, -8.562952280044556e-05, -8.10474157333374e-05, -7.646530866622925e-05, -7.18832015991211e-05, -6.730109453201294e-05, -6.271898746490479e-05, -5.813688039779663e-05, -5.3554773330688477e-05, -4.897266626358032e-05, -4.439055919647217e-05, -3.9808452129364014e-05, -3.522634506225586e-05, -3.0644237995147705e-05, -2.606213092803955e-05, -2.1480023860931396e-05, -1.6897916793823242e-05, -1.2315809726715088e-05, -7.733702659606934e-06, -3.1515955924987793e-06, 1.430511474609375e-06, 6.012618541717529e-06, 1.0594725608825684e-05, 1.5176832675933838e-05, 1.9758939743041992e-05, 2.4341046810150146e-05, 2.89231538772583e-05, 3.3505260944366455e-05, 3.808736801147461e-05, 4.2669475078582764e-05, 4.725158214569092e-05, 5.183368921279907e-05, 5.6415796279907227e-05, 6.099790334701538e-05, 6.558001041412354e-05, 7.016211748123169e-05, 7.474422454833984e-05, 7.9326331615448e-05, 8.390843868255615e-05, 8.84905457496643e-05, 9.307265281677246e-05, 9.765475988388062e-05, 0.00010223686695098877, 0.00010681897401809692, 0.00011140108108520508, 0.00011598318815231323, 0.00012056529521942139, 0.00012514740228652954, 0.0001297295093536377, 0.00013431161642074585, 0.000138893723487854, 0.00014347583055496216, 0.0001480579376220703]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 4.0, 13.0, 16.0, 17.0, 16.0, 25.0, 26.0, 25.0, 20.0, 21.0, 37.0, 35.0, 50.0, 58.0, 41.0, 57.0, 46.0, 50.0, 43.0, 46.0, 42.0, 37.0, 42.0, 22.0, 23.0, 20.0, 21.0, 22.0, 15.0, 14.0, 11.0, 12.0, 9.0, 4.0, 11.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4405460357666016e-05, -4.303455352783203e-05, -4.166364669799805e-05, -4.029273986816406e-05, -3.892183303833008e-05, -3.7550926208496094e-05, -3.618001937866211e-05, -3.4809112548828125e-05, -3.343820571899414e-05, -3.2067298889160156e-05, -3.069639205932617e-05, -2.9325485229492188e-05, -2.7954578399658203e-05, -2.658367156982422e-05, -2.5212764739990234e-05, -2.384185791015625e-05, -2.2470951080322266e-05, -2.110004425048828e-05, -1.9729137420654297e-05, -1.8358230590820312e-05, -1.6987323760986328e-05, -1.5616416931152344e-05, -1.424551010131836e-05, -1.2874603271484375e-05, -1.150369644165039e-05, -1.0132789611816406e-05, -8.761882781982422e-06, -7.3909759521484375e-06, -6.020069122314453e-06, -4.649162292480469e-06, -3.2782554626464844e-06, -1.9073486328125e-06, -5.364418029785156e-07, 8.344650268554688e-07, 2.205371856689453e-06, 3.5762786865234375e-06, 4.947185516357422e-06, 6.318092346191406e-06, 7.68899917602539e-06, 9.059906005859375e-06, 1.043081283569336e-05, 1.1801719665527344e-05, 1.3172626495361328e-05, 1.4543533325195312e-05, 1.5914440155029297e-05, 1.728534698486328e-05, 1.8656253814697266e-05, 2.002716064453125e-05, 2.1398067474365234e-05, 2.276897430419922e-05, 2.4139881134033203e-05, 2.5510787963867188e-05, 2.6881694793701172e-05, 2.8252601623535156e-05, 2.962350845336914e-05, 3.0994415283203125e-05, 3.236532211303711e-05, 3.3736228942871094e-05, 3.510713577270508e-05, 3.647804260253906e-05, 3.784894943237305e-05, 3.921985626220703e-05, 4.0590763092041016e-05, 4.1961669921875e-05, 4.3332576751708984e-05]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 4.0, 5.0, 7.0, 10.0, 21.0, 30.0, 63.0, 75.0, 163.0, 272.0, 449.0, 949.0, 1842.0, 3723.0, 8496.0, 24603.0, 106719.0, 748640.0, 110788.0, 24911.0, 9065.0, 3735.0, 1865.0, 938.0, 507.0, 292.0, 153.0, 81.0, 51.0, 34.0, 19.0, 14.0, 8.0, 10.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001081228256225586, -0.00010498985648155212, -0.00010185688734054565, -9.872391819953918e-05, -9.559094905853271e-05, -9.245797991752625e-05, -8.932501077651978e-05, -8.61920416355133e-05, -8.305907249450684e-05, -7.992610335350037e-05, -7.67931342124939e-05, -7.366016507148743e-05, -7.052719593048096e-05, -6.739422678947449e-05, -6.426125764846802e-05, -6.112828850746155e-05, -5.799531936645508e-05, -5.486235022544861e-05, -5.172938108444214e-05, -4.859641194343567e-05, -4.54634428024292e-05, -4.233047366142273e-05, -3.919750452041626e-05, -3.606453537940979e-05, -3.293156623840332e-05, -2.979859709739685e-05, -2.666562795639038e-05, -2.353265881538391e-05, -2.039968967437744e-05, -1.726672053337097e-05, -1.4133751392364502e-05, -1.1000782251358032e-05, -7.867813110351562e-06, -4.734843969345093e-06, -1.601874828338623e-06, 1.5310943126678467e-06, 4.664063453674316e-06, 7.797032594680786e-06, 1.0930001735687256e-05, 1.4062970876693726e-05, 1.7195940017700195e-05, 2.0328909158706665e-05, 2.3461878299713135e-05, 2.6594847440719604e-05, 2.9727816581726074e-05, 3.2860785722732544e-05, 3.5993754863739014e-05, 3.9126724004745483e-05, 4.225969314575195e-05, 4.539266228675842e-05, 4.852563142776489e-05, 5.165860056877136e-05, 5.479156970977783e-05, 5.79245388507843e-05, 6.105750799179077e-05, 6.419047713279724e-05, 6.732344627380371e-05, 7.045641541481018e-05, 7.358938455581665e-05, 7.672235369682312e-05, 7.985532283782959e-05, 8.298829197883606e-05, 8.612126111984253e-05, 8.9254230260849e-05, 9.238719940185547e-05]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 2.0, 12.0, 11.0, 12.0, 14.0, 21.0, 27.0, 34.0, 43.0, 51.0, 78.0, 184.0, 200.0, 73.0, 42.0, 32.0, 31.0, 22.0, 28.0, 9.0, 16.0, 9.0, 15.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0907649993896484e-05, -1.0545365512371063e-05, -1.0183081030845642e-05, -9.820796549320221e-06, -9.4585120677948e-06, -9.096227586269379e-06, -8.733943104743958e-06, -8.371658623218536e-06, -8.009374141693115e-06, -7.647089660167694e-06, -7.284805178642273e-06, -6.922520697116852e-06, -6.560236215591431e-06, -6.1979517340660095e-06, -5.835667252540588e-06, -5.473382771015167e-06, -5.111098289489746e-06, -4.748813807964325e-06, -4.386529326438904e-06, -4.024244844913483e-06, -3.6619603633880615e-06, -3.2996758818626404e-06, -2.9373914003372192e-06, -2.575106918811798e-06, -2.212822437286377e-06, -1.8505379557609558e-06, -1.4882534742355347e-06, -1.1259689927101135e-06, -7.636845111846924e-07, -4.0140002965927124e-07, -3.91155481338501e-08, 3.2316893339157104e-07, 6.854534149169922e-07, 1.0477378964424133e-06, 1.4100223779678345e-06, 1.7723068594932556e-06, 2.1345913410186768e-06, 2.496875822544098e-06, 2.859160304069519e-06, 3.22144478559494e-06, 3.5837292671203613e-06, 3.9460137486457825e-06, 4.308298230171204e-06, 4.670582711696625e-06, 5.032867193222046e-06, 5.395151674747467e-06, 5.757436156272888e-06, 6.119720637798309e-06, 6.4820051193237305e-06, 6.844289600849152e-06, 7.206574082374573e-06, 7.568858563899994e-06, 7.931143045425415e-06, 8.293427526950836e-06, 8.655712008476257e-06, 9.017996490001678e-06, 9.3802809715271e-06, 9.74256545305252e-06, 1.0104849934577942e-05, 1.0467134416103363e-05, 1.0829418897628784e-05, 1.1191703379154205e-05, 1.1553987860679626e-05, 1.1916272342205048e-05, 1.2278556823730469e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 6.0, 18.0, 28.0, 25.0, 31.0, 43.0, 50.0, 93.0, 105.0, 175.0, 241.0, 400.0, 576.0, 923.0, 1481.0, 2548.0, 4556.0, 8986.0, 21773.0, 59975.0, 472824.0, 382663.0, 52448.0, 19100.0, 8544.0, 4559.0, 2362.0, 1435.0, 897.0, 568.0, 352.0, 238.0, 150.0, 123.0, 63.0, 43.0, 43.0, 28.0, 16.0, 11.0, 9.0, 12.0, 7.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.594160079956055e-05, -3.485102206468582e-05, -3.3760443329811096e-05, -3.266986459493637e-05, -3.1579285860061646e-05, -3.048870712518692e-05, -2.9398128390312195e-05, -2.830754965543747e-05, -2.7216970920562744e-05, -2.612639218568802e-05, -2.5035813450813293e-05, -2.3945234715938568e-05, -2.2854655981063843e-05, -2.1764077246189117e-05, -2.0673498511314392e-05, -1.9582919776439667e-05, -1.849234104156494e-05, -1.7401762306690216e-05, -1.631118357181549e-05, -1.5220604836940765e-05, -1.413002610206604e-05, -1.3039447367191315e-05, -1.194886863231659e-05, -1.0858289897441864e-05, -9.767711162567139e-06, -8.677132427692413e-06, -7.586553692817688e-06, -6.495974957942963e-06, -5.405396223068237e-06, -4.314817488193512e-06, -3.2242387533187866e-06, -2.1336600184440613e-06, -1.043081283569336e-06, 4.7497451305389404e-08, 1.1380761861801147e-06, 2.22865492105484e-06, 3.3192336559295654e-06, 4.409812390804291e-06, 5.500391125679016e-06, 6.5909698605537415e-06, 7.681548595428467e-06, 8.772127330303192e-06, 9.862706065177917e-06, 1.0953284800052643e-05, 1.2043863534927368e-05, 1.3134442269802094e-05, 1.4225021004676819e-05, 1.5315599739551544e-05, 1.640617847442627e-05, 1.7496757209300995e-05, 1.858733594417572e-05, 1.9677914679050446e-05, 2.076849341392517e-05, 2.1859072148799896e-05, 2.294965088367462e-05, 2.4040229618549347e-05, 2.5130808353424072e-05, 2.6221387088298798e-05, 2.7311965823173523e-05, 2.8402544558048248e-05, 2.9493123292922974e-05, 3.05837020277977e-05, 3.1674280762672424e-05, 3.276485949754715e-05, 3.3855438232421875e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 6.0, 2.0, 4.0, 8.0, 6.0, 12.0, 7.0, 14.0, 13.0, 19.0, 21.0, 39.0, 32.0, 37.0, 37.0, 64.0, 69.0, 107.0, 107.0, 71.0, 61.0, 37.0, 49.0, 24.0, 11.0, 19.0, 25.0, 21.0, 10.0, 13.0, 7.0, 4.0, 7.0, 1.0, 4.0, 7.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.055002212524414e-05, -1.0229647159576416e-05, -9.909272193908691e-06, -9.588897228240967e-06, -9.268522262573242e-06, -8.948147296905518e-06, -8.627772331237793e-06, -8.307397365570068e-06, -7.987022399902344e-06, -7.666647434234619e-06, -7.3462724685668945e-06, -7.02589750289917e-06, -6.705522537231445e-06, -6.385147571563721e-06, -6.064772605895996e-06, -5.7443976402282715e-06, -5.424022674560547e-06, -5.103647708892822e-06, -4.783272743225098e-06, -4.462897777557373e-06, -4.1425228118896484e-06, -3.822147846221924e-06, -3.5017728805541992e-06, -3.1813979148864746e-06, -2.86102294921875e-06, -2.5406479835510254e-06, -2.2202730178833008e-06, -1.8998980522155762e-06, -1.5795230865478516e-06, -1.259148120880127e-06, -9.387731552124023e-07, -6.183981895446777e-07, -2.980232238769531e-07, 2.2351741790771484e-08, 3.427267074584961e-07, 6.631016731262207e-07, 9.834766387939453e-07, 1.30385160446167e-06, 1.6242265701293945e-06, 1.944601535797119e-06, 2.2649765014648438e-06, 2.5853514671325684e-06, 2.905726432800293e-06, 3.2261013984680176e-06, 3.546476364135742e-06, 3.866851329803467e-06, 4.187226295471191e-06, 4.507601261138916e-06, 4.827976226806641e-06, 5.148351192474365e-06, 5.46872615814209e-06, 5.7891011238098145e-06, 6.109476089477539e-06, 6.429851055145264e-06, 6.750226020812988e-06, 7.070600986480713e-06, 7.3909759521484375e-06, 7.711350917816162e-06, 8.031725883483887e-06, 8.352100849151611e-06, 8.672475814819336e-06, 8.99285078048706e-06, 9.313225746154785e-06, 9.63360071182251e-06, 9.953975677490234e-06]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 19.0, 41.0, 100.0, 184.0, 437.0, 162.0, 32.0, 19.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011511954944580793, -0.001085653668269515, -0.0010201118420809507, -0.0009545700158923864, -0.0008890281897038221, -0.0008234863635152578, -0.0007579445373266935, -0.0006924027111381292, -0.0006268608849495649, -0.0005613190587610006, -0.0004957772325724363, -0.00043023540638387203, -0.00036469358019530773, -0.00029915175400674343, -0.00023360992781817913, -0.00016806810162961483, -0.00010252627544105053, -3.698444925248623e-05, 2.855737693607807e-05, 9.409920312464237e-05, 0.00015964102931320667, 0.00022518285550177097, 0.0002907246816903353, 0.0003562665078788996, 0.0004218083340674639, 0.0004873501602560282, 0.0005528919864445925, 0.0006184338126331568, 0.0006839756388217211, 0.0007495174650102854, 0.0008150592911988497, 0.000880601117387414, 0.0009461429435759783, 0.0010116847697645426, 0.0010772265959531069, 0.0011427684221416712, 0.0012083102483302355, 0.0012738520745187998, 0.001339393900707364, 0.0014049357268959284, 0.0014704775530844927, 0.001536019379273057, 0.0016015612054616213, 0.0016671030316501856, 0.0017326448578387499, 0.0017981866840273142, 0.0018637285102158785, 0.0019292703364044428, 0.001994812162593007, 0.0020603539887815714, 0.0021258958149701357, 0.0021914376411587, 0.0022569794673472643, 0.0023225212935358286, 0.002388063119724393, 0.002453604945912957, 0.0025191467721015215, 0.002584688598290086, 0.00265023042447865, 0.0027157722506672144, 0.0027813140768557787, 0.002846855903044343, 0.0029123977292329073, 0.0029779395554214716, 0.003043481381610036]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 6.0, 15.0, 22.0, 13.0, 31.0, 36.0, 36.0, 40.0, 52.0, 56.0, 61.0, 54.0, 54.0, 55.0, 65.0, 40.0, 47.0, 46.0, 52.0, 43.0, 33.0, 46.0, 26.0, 17.0, 23.0, 7.0, 11.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006004571914672852, -0.000584891065955162, -0.0005693249404430389, -0.0005537588149309158, -0.0005381926894187927, -0.0005226265639066696, -0.0005070604383945465, -0.0004914943128824234, -0.0004759281873703003, -0.0004603620618581772, -0.0004447959363460541, -0.00042922981083393097, -0.00041366368532180786, -0.00039809755980968475, -0.00038253143429756165, -0.00036696530878543854, -0.00035139918327331543, -0.0003358330577611923, -0.0003202669322490692, -0.0003047008067369461, -0.000289134681224823, -0.0002735685557126999, -0.0002580024302005768, -0.00024243630468845367, -0.00022687017917633057, -0.00021130405366420746, -0.00019573792815208435, -0.00018017180263996124, -0.00016460567712783813, -0.00014903955161571503, -0.00013347342610359192, -0.00011790730059146881, -0.0001023411750793457, -8.67750495672226e-05, -7.120892405509949e-05, -5.564279854297638e-05, -4.007667303085327e-05, -2.4510547518730164e-05, -8.944422006607056e-06, 6.621703505516052e-06, 2.218782901763916e-05, 3.775395452976227e-05, 5.3320080041885376e-05, 6.888620555400848e-05, 8.445233106613159e-05, 0.0001000184565782547, 0.00011558458209037781, 0.00013115070760250092, 0.00014671683311462402, 0.00016228295862674713, 0.00017784908413887024, 0.00019341520965099335, 0.00020898133516311646, 0.00022454746067523956, 0.00024011358618736267, 0.0002556797116994858, 0.0002712458372116089, 0.000286811962723732, 0.0003023780882358551, 0.0003179442137479782, 0.0003335103392601013, 0.0003490764647722244, 0.00036464259028434753, 0.00038020871579647064, 0.00039577484130859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 5.0, 9.0, 9.0, 9.0, 21.0, 27.0, 42.0, 81.0, 136.0, 227.0, 329.0, 610.0, 1052.0, 1685.0, 3028.0, 5094.0, 9606.0, 19833.0, 46664.0, 145987.0, 3454658.0, 364133.0, 78681.0, 29952.0, 13936.0, 7334.0, 4103.0, 2410.0, 1583.0, 957.0, 708.0, 452.0, 276.0, 194.0, 131.0, 94.0, 66.0, 41.0, 27.0, 22.0, 14.0, 15.0, 9.0, 3.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001628398895263672, -0.00015698187053203583, -0.00015112385153770447, -0.0001452658325433731, -0.00013940781354904175, -0.0001335497945547104, -0.00012769177556037903, -0.00012183375656604767, -0.00011597573757171631, -0.00011011771857738495, -0.00010425969958305359, -9.840168058872223e-05, -9.254366159439087e-05, -8.668564260005951e-05, -8.082762360572815e-05, -7.496960461139679e-05, -6.911158561706543e-05, -6.325356662273407e-05, -5.739554762840271e-05, -5.153752863407135e-05, -4.567950963973999e-05, -3.982149064540863e-05, -3.396347165107727e-05, -2.810545265674591e-05, -2.224743366241455e-05, -1.638941466808319e-05, -1.0531395673751831e-05, -4.673376679420471e-06, 1.1846423149108887e-06, 7.0426613092422485e-06, 1.2900680303573608e-05, 1.8758699297904968e-05, 2.4616718292236328e-05, 3.0474737286567688e-05, 3.633275628089905e-05, 4.219077527523041e-05, 4.804879426956177e-05, 5.390681326389313e-05, 5.976483225822449e-05, 6.562285125255585e-05, 7.148087024688721e-05, 7.733888924121857e-05, 8.319690823554993e-05, 8.905492722988129e-05, 9.491294622421265e-05, 0.000100770965218544, 0.00010662898421287537, 0.00011248700320720673, 0.00011834502220153809, 0.00012420304119586945, 0.0001300610601902008, 0.00013591907918453217, 0.00014177709817886353, 0.00014763511717319489, 0.00015349313616752625, 0.0001593511551618576, 0.00016520917415618896, 0.00017106719315052032, 0.00017692521214485168, 0.00018278323113918304, 0.0001886412501335144, 0.00019449926912784576, 0.00020035728812217712, 0.00020621530711650848, 0.00021207332611083984]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 10.0, 4.0, 9.0, 7.0, 10.0, 27.0, 21.0, 38.0, 31.0, 52.0, 70.0, 86.0, 76.0, 96.0, 73.0, 66.0, 87.0, 47.0, 31.0, 28.0, 28.0, 18.0, 9.0, 14.0, 12.0, 7.0, 3.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2755393981933594e-05, -1.2277625501155853e-05, -1.1799857020378113e-05, -1.1322088539600372e-05, -1.0844320058822632e-05, -1.0366551578044891e-05, -9.888783097267151e-06, -9.41101461648941e-06, -8.93324613571167e-06, -8.45547765493393e-06, -7.977709174156189e-06, -7.4999406933784485e-06, -7.022172212600708e-06, -6.5444037318229675e-06, -6.066635251045227e-06, -5.5888667702674866e-06, -5.111098289489746e-06, -4.633329808712006e-06, -4.155561327934265e-06, -3.6777928471565247e-06, -3.200024366378784e-06, -2.7222558856010437e-06, -2.2444874048233032e-06, -1.7667189240455627e-06, -1.2889504432678223e-06, -8.111819624900818e-07, -3.334134817123413e-07, 1.4435499906539917e-07, 6.221234798431396e-07, 1.0998919606208801e-06, 1.5776604413986206e-06, 2.055428922176361e-06, 2.5331974029541016e-06, 3.010965883731842e-06, 3.4887343645095825e-06, 3.966502845287323e-06, 4.4442713260650635e-06, 4.922039806842804e-06, 5.3998082876205444e-06, 5.877576768398285e-06, 6.355345249176025e-06, 6.833113729953766e-06, 7.310882210731506e-06, 7.788650691509247e-06, 8.266419172286987e-06, 8.744187653064728e-06, 9.221956133842468e-06, 9.699724614620209e-06, 1.017749309539795e-05, 1.065526157617569e-05, 1.113303005695343e-05, 1.161079853773117e-05, 1.2088567018508911e-05, 1.2566335499286652e-05, 1.3044103980064392e-05, 1.3521872460842133e-05, 1.3999640941619873e-05, 1.4477409422397614e-05, 1.4955177903175354e-05, 1.5432946383953094e-05, 1.5910714864730835e-05, 1.6388483345508575e-05, 1.6866251826286316e-05, 1.7344020307064056e-05, 1.7821788787841797e-05]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 12.0, 6.0, 12.0, 12.0, 25.0, 29.0, 33.0, 55.0, 109.0, 197.0, 322.0, 636.0, 1192.0, 2552.0, 5954.0, 15044.0, 46396.0, 202722.0, 3523628.0, 303526.0, 60033.0, 18596.0, 7026.0, 3096.0, 1373.0, 775.0, 380.0, 204.0, 123.0, 76.0, 47.0, 28.0, 19.0, 12.0, 8.0, 8.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.00015246868133544922, -0.00014627166092395782, -0.00014007464051246643, -0.00013387762010097504, -0.00012768059968948364, -0.00012148357927799225, -0.00011528655886650085, -0.00010908953845500946, -0.00010289251804351807, -9.669549763202667e-05, -9.049847722053528e-05, -8.430145680904388e-05, -7.810443639755249e-05, -7.19074159860611e-05, -6.57103955745697e-05, -5.951337516307831e-05, -5.3316354751586914e-05, -4.711933434009552e-05, -4.0922313928604126e-05, -3.472529351711273e-05, -2.8528273105621338e-05, -2.2331252694129944e-05, -1.613423228263855e-05, -9.937211871147156e-06, -3.7401914596557617e-06, 2.4568289518356323e-06, 8.653849363327026e-06, 1.485086977481842e-05, 2.1047890186309814e-05, 2.724491059780121e-05, 3.34419310092926e-05, 3.9638951420783997e-05, 4.583597183227539e-05, 5.2032992243766785e-05, 5.823001265525818e-05, 6.442703306674957e-05, 7.062405347824097e-05, 7.682107388973236e-05, 8.301809430122375e-05, 8.921511471271515e-05, 9.541213512420654e-05, 0.00010160915553569794, 0.00010780617594718933, 0.00011400319635868073, 0.00012020021677017212, 0.0001263972371816635, 0.0001325942575931549, 0.0001387912780046463, 0.0001449882984161377, 0.0001511853188276291, 0.00015738233923912048, 0.00016357935965061188, 0.00016977638006210327, 0.00017597340047359467, 0.00018217042088508606, 0.00018836744129657745, 0.00019456446170806885, 0.00020076148211956024, 0.00020695850253105164, 0.00021315552294254303, 0.00021935254335403442, 0.00022554956376552582, 0.0002317465841770172, 0.0002379436045885086, 0.000244140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 11.0, 8.0, 6.0, 12.0, 19.0, 25.0, 24.0, 36.0, 31.0, 45.0, 46.0, 88.0, 109.0, 146.0, 146.0, 407.0, 1672.0, 470.0, 162.0, 107.0, 82.0, 70.0, 64.0, 60.0, 46.0, 35.0, 28.0, 24.0, 18.0, 16.0, 11.0, 12.0, 8.0, 10.0, 4.0, 4.0, 3.0, 7.0, 3.0, 0.0, 3.0], "bins": [-5.602836608886719e-05, -5.4613687098026276e-05, -5.3199008107185364e-05, -5.178432911634445e-05, -5.036965012550354e-05, -4.895497113466263e-05, -4.7540292143821716e-05, -4.6125613152980804e-05, -4.471093416213989e-05, -4.329625517129898e-05, -4.188157618045807e-05, -4.046689718961716e-05, -3.9052218198776245e-05, -3.763753920793533e-05, -3.622286021709442e-05, -3.480818122625351e-05, -3.33935022354126e-05, -3.1978823244571686e-05, -3.0564144253730774e-05, -2.9149465262889862e-05, -2.773478627204895e-05, -2.632010728120804e-05, -2.4905428290367126e-05, -2.3490749299526215e-05, -2.2076070308685303e-05, -2.066139131784439e-05, -1.924671232700348e-05, -1.7832033336162567e-05, -1.6417354345321655e-05, -1.5002675354480743e-05, -1.3587996363639832e-05, -1.217331737279892e-05, -1.0758638381958008e-05, -9.343959391117096e-06, -7.929280400276184e-06, -6.514601409435272e-06, -5.09992241859436e-06, -3.6852434277534485e-06, -2.2705644369125366e-06, -8.558854460716248e-07, 5.587935447692871e-07, 1.973472535610199e-06, 3.388151526451111e-06, 4.802830517292023e-06, 6.2175095081329346e-06, 7.632188498973846e-06, 9.046867489814758e-06, 1.046154648065567e-05, 1.1876225471496582e-05, 1.3290904462337494e-05, 1.4705583453178406e-05, 1.6120262444019318e-05, 1.753494143486023e-05, 1.894962042570114e-05, 2.0364299416542053e-05, 2.1778978407382965e-05, 2.3193657398223877e-05, 2.460833638906479e-05, 2.60230153799057e-05, 2.7437694370746613e-05, 2.8852373361587524e-05, 3.0267052352428436e-05, 3.168173134326935e-05, 3.309641033411026e-05, 3.451108932495117e-05]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 15.0, 38.0, 104.0, 355.0, 253.0, 127.0, 54.0, 34.0, 16.0, 11.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002162230375688523, -0.0001843953796196729, -0.00015256772167049348, -0.00012074004916939884, -8.891239122021943e-05, -5.708473327104002e-05, -2.5257060769945383e-05, 6.570597179234028e-06, 3.839825512841344e-05, 7.022591307759285e-05, 0.00010205357830272987, 0.0001338812435278669, 0.0001657089014770463, 0.00019753655942622572, 0.00022936423192732036, 0.00026119188987649977, 0.0002930195478256792, 0.0003248472057748586, 0.000356674863724038, 0.00038850255077704787, 0.0004203302087262273, 0.0004521578666754067, 0.0004839855246245861, 0.0005158131825737655, 0.0005476408405229449, 0.0005794684984721243, 0.0006112961564213037, 0.0006431238143704832, 0.0006749514723196626, 0.000706779130268842, 0.0007386067882180214, 0.0007704345043748617, 0.000802262220531702, 0.0008340898784808815, 0.0008659175364300609, 0.0008977451943792403, 0.0009295728523284197, 0.0009614005102775991, 0.0009932281682267785, 0.0010250558843836188, 0.0010568834841251373, 0.0010887112002819777, 0.0011205388000234962, 0.0011523665161803365, 0.001184194115921855, 0.0012160218320786953, 0.0012478494318202138, 0.0012796771479770541, 0.0013115047477185726, 0.001343332463875413, 0.0013751600636169314, 0.0014069877797737718, 0.0014388153795152903, 0.0014706430956721306, 0.001502470695413649, 0.0015342984115704894, 0.0015661261277273297, 0.00159795384388417, 0.0016297814436256886, 0.0016616091597825289, 0.0016934367595240474, 0.0017252644756808877, 0.0017570920754224062, 0.0017889197915792465, 0.001820747391320765]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 5.0, 10.0, 15.0, 8.0, 16.0, 9.0, 31.0, 21.0, 21.0, 23.0, 31.0, 35.0, 36.0, 35.0, 44.0, 42.0, 33.0, 42.0, 49.0, 49.0, 41.0, 56.0, 38.0, 39.0, 46.0, 26.0, 28.0, 29.0, 25.0, 21.0, 12.0, 10.0, 16.0, 14.0, 11.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00018328428268432617, -0.00017753895372152328, -0.0001717936247587204, -0.0001660482957959175, -0.00016030296683311462, -0.00015455763787031174, -0.00014881230890750885, -0.00014306697994470596, -0.00013732165098190308, -0.0001315763220191002, -0.0001258309930562973, -0.00012008566409349442, -0.00011434033513069153, -0.00010859500616788864, -0.00010284967720508575, -9.710434824228287e-05, -9.135901927947998e-05, -8.56136903166771e-05, -7.98683613538742e-05, -7.412303239107132e-05, -6.837770342826843e-05, -6.263237446546555e-05, -5.688704550266266e-05, -5.114171653985977e-05, -4.5396387577056885e-05, -3.9651058614254e-05, -3.390572965145111e-05, -2.8160400688648224e-05, -2.2415071725845337e-05, -1.666974276304245e-05, -1.0924413800239563e-05, -5.179084837436676e-06, 5.662441253662109e-07, 6.311573088169098e-06, 1.2056902050971985e-05, 1.7802231013774872e-05, 2.354755997657776e-05, 2.9292888939380646e-05, 3.503821790218353e-05, 4.078354686498642e-05, 4.652887582778931e-05, 5.2274204790592194e-05, 5.801953375339508e-05, 6.376486271619797e-05, 6.951019167900085e-05, 7.525552064180374e-05, 8.100084960460663e-05, 8.674617856740952e-05, 9.24915075302124e-05, 9.823683649301529e-05, 0.00010398216545581818, 0.00010972749441862106, 0.00011547282338142395, 0.00012121815234422684, 0.00012696348130702972, 0.0001327088102698326, 0.0001384541392326355, 0.00014419946819543839, 0.00014994479715824127, 0.00015569012612104416, 0.00016143545508384705, 0.00016718078404664993, 0.00017292611300945282, 0.0001786714419722557, 0.0001844167709350586]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 11.0, 24.0, 30.0, 49.0, 53.0, 89.0, 142.0, 194.0, 345.0, 517.0, 862.0, 1465.0, 2612.0, 4923.0, 10058.0, 22259.0, 63283.0, 270451.0, 525485.0, 89735.0, 29815.0, 12435.0, 5996.0, 3147.0, 1777.0, 1015.0, 628.0, 375.0, 236.0, 158.0, 113.0, 79.0, 59.0, 41.0, 18.0, 15.0, 11.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.0001475811004638672, -0.00014349818229675293, -0.00013941526412963867, -0.00013533234596252441, -0.00013124942779541016, -0.0001271665096282959, -0.00012308359146118164, -0.00011900067329406738, -0.00011491775512695312, -0.00011083483695983887, -0.00010675191879272461, -0.00010266900062561035, -9.85860824584961e-05, -9.450316429138184e-05, -9.042024612426758e-05, -8.633732795715332e-05, -8.225440979003906e-05, -7.81714916229248e-05, -7.408857345581055e-05, -7.000565528869629e-05, -6.592273712158203e-05, -6.183981895446777e-05, -5.7756900787353516e-05, -5.367398262023926e-05, -4.9591064453125e-05, -4.550814628601074e-05, -4.1425228118896484e-05, -3.7342309951782227e-05, -3.325939178466797e-05, -2.917647361755371e-05, -2.5093555450439453e-05, -2.1010637283325195e-05, -1.6927719116210938e-05, -1.284480094909668e-05, -8.761882781982422e-06, -4.678964614868164e-06, -5.960464477539062e-07, 3.4868717193603516e-06, 7.569789886474609e-06, 1.1652708053588867e-05, 1.5735626220703125e-05, 1.9818544387817383e-05, 2.390146255493164e-05, 2.79843807220459e-05, 3.2067298889160156e-05, 3.6150217056274414e-05, 4.023313522338867e-05, 4.431605339050293e-05, 4.839897155761719e-05, 5.2481889724731445e-05, 5.65648078918457e-05, 6.064772605895996e-05, 6.473064422607422e-05, 6.881356239318848e-05, 7.289648056030273e-05, 7.697939872741699e-05, 8.106231689453125e-05, 8.514523506164551e-05, 8.922815322875977e-05, 9.331107139587402e-05, 9.739398956298828e-05, 0.00010147690773010254, 0.0001055598258972168, 0.00010964274406433105, 0.00011372566223144531]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 9.0, 10.0, 11.0, 20.0, 14.0, 28.0, 34.0, 43.0, 72.0, 73.0, 94.0, 90.0, 89.0, 85.0, 76.0, 53.0, 50.0, 28.0, 26.0, 19.0, 11.0, 14.0, 6.0, 6.0, 11.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5079975128173828e-05, -1.4542602002620697e-05, -1.4005228877067566e-05, -1.3467855751514435e-05, -1.2930482625961304e-05, -1.2393109500408173e-05, -1.1855736374855042e-05, -1.131836324930191e-05, -1.078099012374878e-05, -1.0243616998195648e-05, -9.706243872642517e-06, -9.168870747089386e-06, -8.631497621536255e-06, -8.094124495983124e-06, -7.556751370429993e-06, -7.0193782448768616e-06, -6.4820051193237305e-06, -5.944631993770599e-06, -5.407258868217468e-06, -4.869885742664337e-06, -4.332512617111206e-06, -3.795139491558075e-06, -3.257766366004944e-06, -2.7203932404518127e-06, -2.1830201148986816e-06, -1.6456469893455505e-06, -1.1082738637924194e-06, -5.709007382392883e-07, -3.3527612686157227e-08, 5.038455128669739e-07, 1.041218638420105e-06, 1.578591763973236e-06, 2.115964889526367e-06, 2.6533380150794983e-06, 3.1907111406326294e-06, 3.7280842661857605e-06, 4.265457391738892e-06, 4.802830517292023e-06, 5.340203642845154e-06, 5.877576768398285e-06, 6.414949893951416e-06, 6.952323019504547e-06, 7.489696145057678e-06, 8.02706927061081e-06, 8.56444239616394e-06, 9.101815521717072e-06, 9.639188647270203e-06, 1.0176561772823334e-05, 1.0713934898376465e-05, 1.1251308023929596e-05, 1.1788681149482727e-05, 1.2326054275035858e-05, 1.286342740058899e-05, 1.340080052614212e-05, 1.3938173651695251e-05, 1.4475546777248383e-05, 1.5012919902801514e-05, 1.5550293028354645e-05, 1.6087666153907776e-05, 1.6625039279460907e-05, 1.7162412405014038e-05, 1.769978553056717e-05, 1.82371586561203e-05, 1.877453178167343e-05, 1.9311904907226562e-05]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 11.0, 11.0, 15.0, 26.0, 26.0, 37.0, 66.0, 73.0, 156.0, 163.0, 309.0, 442.0, 575.0, 894.0, 1281.0, 2104.0, 3176.0, 5045.0, 7822.0, 12889.0, 21676.0, 38914.0, 75417.0, 181056.0, 403687.0, 142927.0, 64379.0, 33859.0, 19670.0, 11588.0, 7068.0, 4581.0, 2921.0, 1893.0, 1256.0, 854.0, 538.0, 337.0, 257.0, 191.0, 92.0, 103.0, 44.0, 39.0, 35.0, 19.0, 15.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-7.56978988647461e-05, -7.343105971813202e-05, -7.116422057151794e-05, -6.889738142490387e-05, -6.66305422782898e-05, -6.436370313167572e-05, -6.209686398506165e-05, -5.983002483844757e-05, -5.7563185691833496e-05, -5.529634654521942e-05, -5.302950739860535e-05, -5.076266825199127e-05, -4.84958291053772e-05, -4.622898995876312e-05, -4.396215081214905e-05, -4.169531166553497e-05, -3.94284725189209e-05, -3.7161633372306824e-05, -3.489479422569275e-05, -3.2627955079078674e-05, -3.03611159324646e-05, -2.8094276785850525e-05, -2.582743763923645e-05, -2.3560598492622375e-05, -2.12937593460083e-05, -1.9026920199394226e-05, -1.676008105278015e-05, -1.4493241906166077e-05, -1.2226402759552002e-05, -9.959563612937927e-06, -7.692724466323853e-06, -5.425885319709778e-06, -3.159046173095703e-06, -8.922070264816284e-07, 1.3746321201324463e-06, 3.641471266746521e-06, 5.908310413360596e-06, 8.17514955997467e-06, 1.0441988706588745e-05, 1.270882785320282e-05, 1.4975666999816895e-05, 1.724250614643097e-05, 1.9509345293045044e-05, 2.177618443965912e-05, 2.4043023586273193e-05, 2.6309862732887268e-05, 2.8576701879501343e-05, 3.084354102611542e-05, 3.311038017272949e-05, 3.537721931934357e-05, 3.764405846595764e-05, 3.9910897612571716e-05, 4.217773675918579e-05, 4.4444575905799866e-05, 4.671141505241394e-05, 4.8978254199028015e-05, 5.124509334564209e-05, 5.3511932492256165e-05, 5.577877163887024e-05, 5.8045610785484314e-05, 6.031244993209839e-05, 6.257928907871246e-05, 6.484612822532654e-05, 6.711296737194061e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 4.0, 6.0, 19.0, 10.0, 10.0, 11.0, 20.0, 17.0, 37.0, 32.0, 32.0, 39.0, 35.0, 33.0, 60.0, 36.0, 47.0, 60.0, 38.0, 48.0, 47.0, 39.0, 47.0, 26.0, 24.0, 29.0, 32.0, 10.0, 17.0, 16.0, 17.0, 15.0, 7.0, 21.0, 9.0, 12.0, 4.0, 11.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3974647521972656e-05, -3.2862648367881775e-05, -3.1750649213790894e-05, -3.063865005970001e-05, -2.952665090560913e-05, -2.841465175151825e-05, -2.7302652597427368e-05, -2.6190653443336487e-05, -2.5078654289245605e-05, -2.3966655135154724e-05, -2.2854655981063843e-05, -2.174265682697296e-05, -2.063065767288208e-05, -1.95186585187912e-05, -1.8406659364700317e-05, -1.7294660210609436e-05, -1.6182661056518555e-05, -1.5070661902427673e-05, -1.3958662748336792e-05, -1.284666359424591e-05, -1.173466444015503e-05, -1.0622665286064148e-05, -9.510666131973267e-06, -8.398666977882385e-06, -7.286667823791504e-06, -6.1746686697006226e-06, -5.062669515609741e-06, -3.95067036151886e-06, -2.8386712074279785e-06, -1.7266720533370972e-06, -6.146728992462158e-07, 4.973262548446655e-07, 1.6093254089355469e-06, 2.7213245630264282e-06, 3.8333237171173096e-06, 4.945322871208191e-06, 6.057322025299072e-06, 7.169321179389954e-06, 8.281320333480835e-06, 9.393319487571716e-06, 1.0505318641662598e-05, 1.1617317795753479e-05, 1.272931694984436e-05, 1.3841316103935242e-05, 1.4953315258026123e-05, 1.6065314412117004e-05, 1.7177313566207886e-05, 1.8289312720298767e-05, 1.940131187438965e-05, 2.051331102848053e-05, 2.162531018257141e-05, 2.2737309336662292e-05, 2.3849308490753174e-05, 2.4961307644844055e-05, 2.6073306798934937e-05, 2.7185305953025818e-05, 2.82973051071167e-05, 2.940930426120758e-05, 3.052130341529846e-05, 3.163330256938934e-05, 3.2745301723480225e-05, 3.3857300877571106e-05, 3.496930003166199e-05, 3.608129918575287e-05, 3.719329833984375e-05]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 5.0, 13.0, 9.0, 11.0, 29.0, 30.0, 45.0, 53.0, 97.0, 124.0, 177.0, 313.0, 466.0, 616.0, 1114.0, 1914.0, 2919.0, 6415.0, 14211.0, 31290.0, 129829.0, 629828.0, 161251.0, 36182.0, 15995.0, 7078.0, 3230.0, 2084.0, 1164.0, 601.0, 475.0, 314.0, 211.0, 128.0, 107.0, 57.0, 51.0, 41.0, 26.0, 12.0, 18.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.537799835205078e-05, -1.4919787645339966e-05, -1.446157693862915e-05, -1.4003366231918335e-05, -1.354515552520752e-05, -1.3086944818496704e-05, -1.2628734111785889e-05, -1.2170523405075073e-05, -1.1712312698364258e-05, -1.1254101991653442e-05, -1.0795891284942627e-05, -1.0337680578231812e-05, -9.879469871520996e-06, -9.42125916481018e-06, -8.963048458099365e-06, -8.50483775138855e-06, -8.046627044677734e-06, -7.588416337966919e-06, -7.1302056312561035e-06, -6.671994924545288e-06, -6.213784217834473e-06, -5.755573511123657e-06, -5.297362804412842e-06, -4.839152097702026e-06, -4.380941390991211e-06, -3.9227306842803955e-06, -3.46451997756958e-06, -3.0063092708587646e-06, -2.5480985641479492e-06, -2.089887857437134e-06, -1.6316771507263184e-06, -1.173466444015503e-06, -7.152557373046875e-07, -2.5704503059387207e-07, 2.0116567611694336e-07, 6.593763828277588e-07, 1.1175870895385742e-06, 1.5757977962493896e-06, 2.034008502960205e-06, 2.4922192096710205e-06, 2.950429916381836e-06, 3.4086406230926514e-06, 3.866851329803467e-06, 4.325062036514282e-06, 4.783272743225098e-06, 5.241483449935913e-06, 5.6996941566467285e-06, 6.157904863357544e-06, 6.616115570068359e-06, 7.074326276779175e-06, 7.53253698348999e-06, 7.990747690200806e-06, 8.448958396911621e-06, 8.907169103622437e-06, 9.365379810333252e-06, 9.823590517044067e-06, 1.0281801223754883e-05, 1.0740011930465698e-05, 1.1198222637176514e-05, 1.1656433343887329e-05, 1.2114644050598145e-05, 1.257285475730896e-05, 1.3031065464019775e-05, 1.348927617073059e-05, 1.3947486877441406e-05]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 4.0, 6.0, 14.0, 10.0, 16.0, 32.0, 17.0, 52.0, 45.0, 91.0, 78.0, 159.0, 93.0, 100.0, 55.0, 64.0, 29.0, 36.0, 13.0, 23.0, 11.0, 10.0, 4.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.7220458984375e-06, -5.574896931648254e-06, -5.427747964859009e-06, -5.280598998069763e-06, -5.133450031280518e-06, -4.986301064491272e-06, -4.839152097702026e-06, -4.692003130912781e-06, -4.544854164123535e-06, -4.3977051973342896e-06, -4.250556230545044e-06, -4.103407263755798e-06, -3.956258296966553e-06, -3.809109330177307e-06, -3.6619603633880615e-06, -3.514811396598816e-06, -3.3676624298095703e-06, -3.2205134630203247e-06, -3.073364496231079e-06, -2.9262155294418335e-06, -2.779066562652588e-06, -2.6319175958633423e-06, -2.4847686290740967e-06, -2.337619662284851e-06, -2.1904706954956055e-06, -2.04332172870636e-06, -1.8961727619171143e-06, -1.7490237951278687e-06, -1.601874828338623e-06, -1.4547258615493774e-06, -1.3075768947601318e-06, -1.1604279279708862e-06, -1.0132789611816406e-06, -8.66129994392395e-07, -7.189810276031494e-07, -5.718320608139038e-07, -4.246830940246582e-07, -2.775341272354126e-07, -1.30385160446167e-07, 1.6763806343078613e-08, 1.6391277313232422e-07, 3.110617399215698e-07, 4.5821070671081543e-07, 6.05359673500061e-07, 7.525086402893066e-07, 8.996576070785522e-07, 1.0468065738677979e-06, 1.1939555406570435e-06, 1.341104507446289e-06, 1.4882534742355347e-06, 1.6354024410247803e-06, 1.7825514078140259e-06, 1.9297003746032715e-06, 2.076849341392517e-06, 2.2239983081817627e-06, 2.3711472749710083e-06, 2.518296241760254e-06, 2.6654452085494995e-06, 2.812594175338745e-06, 2.9597431421279907e-06, 3.1068921089172363e-06, 3.254041075706482e-06, 3.4011900424957275e-06, 3.548339009284973e-06, 3.6954879760742188e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 10.0, 8.0, 9.0, 15.0, 23.0, 26.0, 36.0, 44.0, 77.0, 104.0, 176.0, 219.0, 342.0, 509.0, 822.0, 1811.0, 3459.0, 10532.0, 31146.0, 249962.0, 654514.0, 65639.0, 18138.0, 5320.0, 2550.0, 1063.0, 725.0, 405.0, 276.0, 156.0, 105.0, 102.0, 64.0, 51.0, 23.0, 30.0, 17.0, 14.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.519918441772461e-05, -1.4696270227432251e-05, -1.4193356037139893e-05, -1.3690441846847534e-05, -1.3187527656555176e-05, -1.2684613466262817e-05, -1.2181699275970459e-05, -1.16787850856781e-05, -1.1175870895385742e-05, -1.0672956705093384e-05, -1.0170042514801025e-05, -9.667128324508667e-06, -9.164214134216309e-06, -8.66129994392395e-06, -8.158385753631592e-06, -7.655471563339233e-06, -7.152557373046875e-06, -6.649643182754517e-06, -6.146728992462158e-06, -5.6438148021698e-06, -5.140900611877441e-06, -4.637986421585083e-06, -4.135072231292725e-06, -3.632158041000366e-06, -3.129243850708008e-06, -2.6263296604156494e-06, -2.123415470123291e-06, -1.6205012798309326e-06, -1.1175870895385742e-06, -6.146728992462158e-07, -1.1175870895385742e-07, 3.91155481338501e-07, 8.940696716308594e-07, 1.3969838619232178e-06, 1.8998980522155762e-06, 2.4028122425079346e-06, 2.905726432800293e-06, 3.4086406230926514e-06, 3.91155481338501e-06, 4.414469003677368e-06, 4.9173831939697266e-06, 5.420297384262085e-06, 5.923211574554443e-06, 6.426125764846802e-06, 6.92903995513916e-06, 7.4319541454315186e-06, 7.934868335723877e-06, 8.437782526016235e-06, 8.940696716308594e-06, 9.443610906600952e-06, 9.94652509689331e-06, 1.0449439287185669e-05, 1.0952353477478027e-05, 1.1455267667770386e-05, 1.1958181858062744e-05, 1.2461096048355103e-05, 1.2964010238647461e-05, 1.346692442893982e-05, 1.3969838619232178e-05, 1.4472752809524536e-05, 1.4975666999816895e-05, 1.5478581190109253e-05, 1.598149538040161e-05, 1.648440957069397e-05, 1.6987323760986328e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 13.0, 28.0, 27.0, 44.0, 73.0, 117.0, 161.0, 180.0, 131.0, 56.0, 60.0, 22.0, 30.0, 14.0, 10.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.463859558105469e-06, -8.230097591876984e-06, -7.996335625648499e-06, -7.762573659420013e-06, -7.528811693191528e-06, -7.295049726963043e-06, -7.061287760734558e-06, -6.827525794506073e-06, -6.593763828277588e-06, -6.360001862049103e-06, -6.126239895820618e-06, -5.8924779295921326e-06, -5.6587159633636475e-06, -5.424953997135162e-06, -5.191192030906677e-06, -4.957430064678192e-06, -4.723668098449707e-06, -4.489906132221222e-06, -4.256144165992737e-06, -4.022382199764252e-06, -3.7886202335357666e-06, -3.5548582673072815e-06, -3.3210963010787964e-06, -3.0873343348503113e-06, -2.853572368621826e-06, -2.619810402393341e-06, -2.386048436164856e-06, -2.152286469936371e-06, -1.9185245037078857e-06, -1.6847625374794006e-06, -1.4510005712509155e-06, -1.2172386050224304e-06, -9.834766387939453e-07, -7.497146725654602e-07, -5.159527063369751e-07, -2.8219074010849e-07, -4.842877388000488e-08, 1.8533319234848022e-07, 4.1909515857696533e-07, 6.528571248054504e-07, 8.866190910339355e-07, 1.1203810572624207e-06, 1.3541430234909058e-06, 1.5879049897193909e-06, 1.821666955947876e-06, 2.055428922176361e-06, 2.289190888404846e-06, 2.5229528546333313e-06, 2.7567148208618164e-06, 2.9904767870903015e-06, 3.2242387533187866e-06, 3.4580007195472717e-06, 3.691762685775757e-06, 3.925524652004242e-06, 4.159286618232727e-06, 4.393048584461212e-06, 4.626810550689697e-06, 4.860572516918182e-06, 5.0943344831466675e-06, 5.328096449375153e-06, 5.561858415603638e-06, 5.795620381832123e-06, 6.029382348060608e-06, 6.263144314289093e-06, 6.496906280517578e-06]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 37.0, 69.0, 145.0, 378.0, 190.0, 82.0, 46.0, 24.0, 14.0, 7.0, 3.0, 1.0, 1.0], "bins": [-0.00134546949993819, -0.0013208773452788591, -0.0012962851906195283, -0.0012716931523755193, -0.0012471009977161884, -0.0012225088430568576, -0.0011979166883975267, -0.0011733246501535177, -0.0011487324954941869, -0.001124140340834856, -0.0010995481861755252, -0.0010749561479315162, -0.0010503639932721853, -0.0010257718386128545, -0.0010011796839535236, -0.0009765876457095146, -0.0009519954910501838, -0.0009274033363908529, -0.000902811239939183, -0.0008782190852798522, -0.0008536269888281822, -0.0008290348341688514, -0.0008044427377171814, -0.0007798505830578506, -0.0007552584283985198, -0.0007306662737391889, -0.000706074177287519, -0.0006814820226281881, -0.0006568899261765182, -0.0006322977715171874, -0.0006077056750655174, -0.0005831135204061866, -0.0005585214821621776, -0.0005339293275028467, -0.0005093372310511768, -0.0004847451054956764, -0.000460152979940176, -0.00043556082528084517, -0.00041096872882917523, -0.0003863765741698444, -0.00036178441951051354, -0.00033719229395501316, -0.00031260016839951277, -0.0002880080428440124, -0.000263415917288512, -0.00023882377718109637, -0.000214231651625596, -0.0001896395260700956, -0.00016504741506651044, -0.00014045528951101005, -0.00011586316395550966, -9.127103112405166e-05, -6.667890556855127e-05, -4.208677273709327e-05, -1.749464718159288e-05, 7.0974783739075065e-06, 3.1689603929407895e-05, 5.628172948490828e-05, 8.087385504040867e-05, 0.00010546598787186667, 0.00013005812070332468, 0.00015465024625882506, 0.00017924237181432545, 0.00020383449736982584, 0.00022842662292532623]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 8.0, 6.0, 9.0, 13.0, 19.0, 13.0, 13.0, 26.0, 22.0, 27.0, 36.0, 42.0, 38.0, 35.0, 40.0, 40.0, 30.0, 37.0, 30.0, 44.0, 43.0, 39.0, 35.0, 35.0, 33.0, 30.0, 26.0, 30.0, 33.0, 28.0, 27.0, 24.0, 13.0, 17.0, 14.0, 12.0, 10.0, 2.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014394521713256836, -0.00013869162648916245, -0.00013343803584575653, -0.00012818444520235062, -0.0001229308545589447, -0.00011767726391553879, -0.00011242367327213287, -0.00010717008262872696, -0.00010191649198532104, -9.666290134191513e-05, -9.140931069850922e-05, -8.61557200551033e-05, -8.090212941169739e-05, -7.564853876829147e-05, -7.039494812488556e-05, -6.514135748147964e-05, -5.988776683807373e-05, -5.4634176194667816e-05, -4.93805855512619e-05, -4.412699490785599e-05, -3.887340426445007e-05, -3.361981362104416e-05, -2.8366222977638245e-05, -2.311263233423233e-05, -1.7859041690826416e-05, -1.2605451047420502e-05, -7.351860404014587e-06, -2.098269760608673e-06, 3.155320882797241e-06, 8.408911526203156e-06, 1.366250216960907e-05, 1.8916092813014984e-05, 2.41696834564209e-05, 2.9423274099826813e-05, 3.467686474323273e-05, 3.993045538663864e-05, 4.5184046030044556e-05, 5.043763667345047e-05, 5.5691227316856384e-05, 6.09448179602623e-05, 6.619840860366821e-05, 7.145199924707413e-05, 7.670558989048004e-05, 8.195918053388596e-05, 8.721277117729187e-05, 9.246636182069778e-05, 9.77199524641037e-05, 0.00010297354310750961, 0.00010822713375091553, 0.00011348072439432144, 0.00011873431503772736, 0.00012398790568113327, 0.00012924149632453918, 0.0001344950869679451, 0.000139748677611351, 0.00014500226825475693, 0.00015025585889816284, 0.00015550944954156876, 0.00016076304018497467, 0.00016601663082838058, 0.0001712702214717865, 0.0001765238121151924, 0.00018177740275859833, 0.00018703099340200424, 0.00019228458404541016]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 6.0, 17.0, 28.0, 50.0, 120.0, 218.0, 439.0, 897.0, 1837.0, 3952.0, 8950.0, 21846.0, 64043.0, 393311.0, 3518458.0, 117931.0, 36627.0, 13708.0, 5642.0, 2625.0, 1259.0, 719.0, 394.0, 259.0, 188.0, 154.0, 96.0, 102.0, 71.0, 63.0, 55.0, 30.0, 34.0, 34.0, 32.0, 20.0, 21.0, 10.0, 7.0, 13.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.957220077514648e-05, -7.520709186792374e-05, -7.084198296070099e-05, -6.647687405347824e-05, -6.211176514625549e-05, -5.7746656239032745e-05, -5.338154733181e-05, -4.901643842458725e-05, -4.46513295173645e-05, -4.0286220610141754e-05, -3.5921111702919006e-05, -3.155600279569626e-05, -2.719089388847351e-05, -2.2825784981250763e-05, -1.8460676074028015e-05, -1.4095567166805267e-05, -9.73045825958252e-06, -5.365349352359772e-06, -1.000240445137024e-06, 3.364868462085724e-06, 7.729977369308472e-06, 1.209508627653122e-05, 1.6460195183753967e-05, 2.0825304090976715e-05, 2.5190412998199463e-05, 2.955552190542221e-05, 3.392063081264496e-05, 3.8285739719867706e-05, 4.2650848627090454e-05, 4.70159575343132e-05, 5.138106644153595e-05, 5.57461753487587e-05, 6.0111284255981445e-05, 6.447639316320419e-05, 6.884150207042694e-05, 7.320661097764969e-05, 7.757171988487244e-05, 8.193682879209518e-05, 8.630193769931793e-05, 9.066704660654068e-05, 9.503215551376343e-05, 9.939726442098618e-05, 0.00010376237332820892, 0.00010812748223543167, 0.00011249259114265442, 0.00011685770004987717, 0.00012122280895709991, 0.00012558791786432266, 0.0001299530267715454, 0.00013431813567876816, 0.0001386832445859909, 0.00014304835349321365, 0.0001474134624004364, 0.00015177857130765915, 0.0001561436802148819, 0.00016050878912210464, 0.0001648738980293274, 0.00016923900693655014, 0.0001736041158437729, 0.00017796922475099564, 0.00018233433365821838, 0.00018669944256544113, 0.00019106455147266388, 0.00019542966037988663, 0.00019979476928710938]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 11.0, 12.0, 15.0, 16.0, 33.0, 50.0, 57.0, 112.0, 114.0, 148.0, 111.0, 90.0, 66.0, 36.0, 44.0, 23.0, 25.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3649463653564453e-05, -1.2916512787342072e-05, -1.218356192111969e-05, -1.1450611054897308e-05, -1.0717660188674927e-05, -9.984709322452545e-06, -9.251758456230164e-06, -8.518807590007782e-06, -7.7858567237854e-06, -7.052905857563019e-06, -6.319954991340637e-06, -5.587004125118256e-06, -4.854053258895874e-06, -4.1211023926734924e-06, -3.388151526451111e-06, -2.6552006602287292e-06, -1.9222497940063477e-06, -1.189298927783966e-06, -4.5634806156158447e-07, 2.766028046607971e-07, 1.0095536708831787e-06, 1.7425045371055603e-06, 2.475455403327942e-06, 3.2084062695503235e-06, 3.941357135772705e-06, 4.674308001995087e-06, 5.407258868217468e-06, 6.14020973443985e-06, 6.8731606006622314e-06, 7.606111466884613e-06, 8.339062333106995e-06, 9.072013199329376e-06, 9.804964065551758e-06, 1.053791493177414e-05, 1.1270865797996521e-05, 1.2003816664218903e-05, 1.2736767530441284e-05, 1.3469718396663666e-05, 1.4202669262886047e-05, 1.4935620129108429e-05, 1.566857099533081e-05, 1.6401521861553192e-05, 1.7134472727775574e-05, 1.7867423593997955e-05, 1.8600374460220337e-05, 1.933332532644272e-05, 2.00662761926651e-05, 2.079922705888748e-05, 2.1532177925109863e-05, 2.2265128791332245e-05, 2.2998079657554626e-05, 2.3731030523777008e-05, 2.446398138999939e-05, 2.519693225622177e-05, 2.5929883122444153e-05, 2.6662833988666534e-05, 2.7395784854888916e-05, 2.8128735721111298e-05, 2.886168658733368e-05, 2.959463745355606e-05, 3.0327588319778442e-05, 3.1060539186000824e-05, 3.1793490052223206e-05, 3.252644091844559e-05, 3.325939178466797e-05]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 9.0, 8.0, 14.0, 29.0, 33.0, 74.0, 139.0, 241.0, 516.0, 1253.0, 3355.0, 10329.0, 36701.0, 198185.0, 3566080.0, 308565.0, 48989.0, 12841.0, 4139.0, 1527.0, 617.0, 288.0, 147.0, 63.0, 37.0, 27.0, 15.0, 13.0, 9.0, 9.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001423358917236328, -0.0001371782273054123, -0.00013202056288719177, -0.00012686289846897125, -0.00012170523405075073, -0.00011654756963253021, -0.00011138990521430969, -0.00010623224079608917, -0.00010107457637786865, -9.591691195964813e-05, -9.075924754142761e-05, -8.560158312320709e-05, -8.044391870498657e-05, -7.528625428676605e-05, -7.012858986854553e-05, -6.497092545032501e-05, -5.981326103210449e-05, -5.465559661388397e-05, -4.949793219566345e-05, -4.434026777744293e-05, -3.918260335922241e-05, -3.402493894100189e-05, -2.8867274522781372e-05, -2.3709610104560852e-05, -1.8551945686340332e-05, -1.3394281268119812e-05, -8.236616849899292e-06, -3.078952431678772e-06, 2.078711986541748e-06, 7.236376404762268e-06, 1.2394040822982788e-05, 1.7551705241203308e-05, 2.2709369659423828e-05, 2.7867034077644348e-05, 3.302469849586487e-05, 3.818236291408539e-05, 4.334002733230591e-05, 4.849769175052643e-05, 5.365535616874695e-05, 5.881302058696747e-05, 6.397068500518799e-05, 6.912834942340851e-05, 7.428601384162903e-05, 7.944367825984955e-05, 8.460134267807007e-05, 8.975900709629059e-05, 9.491667151451111e-05, 0.00010007433593273163, 0.00010523200035095215, 0.00011038966476917267, 0.00011554732918739319, 0.00012070499360561371, 0.00012586265802383423, 0.00013102032244205475, 0.00013617798686027527, 0.0001413356512784958, 0.0001464933156967163, 0.00015165098011493683, 0.00015680864453315735, 0.00016196630895137787, 0.0001671239733695984, 0.0001722816377878189, 0.00017743930220603943, 0.00018259696662425995, 0.00018775463104248047]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 11.0, 11.0, 9.0, 17.0, 19.0, 27.0, 33.0, 46.0, 54.0, 72.0, 91.0, 141.0, 172.0, 267.0, 770.0, 1262.0, 396.0, 184.0, 121.0, 85.0, 64.0, 52.0, 37.0, 28.0, 33.0, 16.0, 16.0, 12.0, 9.0, 6.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6835670471191406e-05, -3.5177916288375854e-05, -3.35201621055603e-05, -3.186240792274475e-05, -3.02046537399292e-05, -2.8546899557113647e-05, -2.6889145374298096e-05, -2.5231391191482544e-05, -2.3573637008666992e-05, -2.191588282585144e-05, -2.025812864303589e-05, -1.8600374460220337e-05, -1.6942620277404785e-05, -1.5284866094589233e-05, -1.3627111911773682e-05, -1.196935772895813e-05, -1.0311603546142578e-05, -8.653849363327026e-06, -6.996095180511475e-06, -5.338340997695923e-06, -3.680586814880371e-06, -2.0228326320648193e-06, -3.650784492492676e-07, 1.2926757335662842e-06, 2.950429916381836e-06, 4.608184099197388e-06, 6.2659382820129395e-06, 7.923692464828491e-06, 9.581446647644043e-06, 1.1239200830459595e-05, 1.2896955013275146e-05, 1.4554709196090698e-05, 1.621246337890625e-05, 1.7870217561721802e-05, 1.9527971744537354e-05, 2.1185725927352905e-05, 2.2843480110168457e-05, 2.450123429298401e-05, 2.615898847579956e-05, 2.7816742658615112e-05, 2.9474496841430664e-05, 3.1132251024246216e-05, 3.279000520706177e-05, 3.444775938987732e-05, 3.610551357269287e-05, 3.776326775550842e-05, 3.9421021938323975e-05, 4.1078776121139526e-05, 4.273653030395508e-05, 4.439428448677063e-05, 4.605203866958618e-05, 4.7709792852401733e-05, 4.9367547035217285e-05, 5.102530121803284e-05, 5.268305540084839e-05, 5.434080958366394e-05, 5.599856376647949e-05, 5.7656317949295044e-05, 5.9314072132110596e-05, 6.097182631492615e-05, 6.26295804977417e-05, 6.428733468055725e-05, 6.59450888633728e-05, 6.760284304618835e-05, 6.92605972290039e-05]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 12.0, 28.0, 46.0, 141.0, 349.0, 257.0, 106.0, 43.0, 11.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032045351690612733, -0.0002907697344198823, -0.0002610859810374677, -0.00023140219855122268, -0.00020171841606497765, -0.0001720346335787326, -0.0001423508656444028, -0.000112667097710073, -8.298331522382796e-05, -5.3299540013540536e-05, -2.3615764803253114e-05, 6.068010407034308e-06, 3.575178561732173e-05, 6.543556810356677e-05, 9.511933603789657e-05, 0.00012480310397222638, 0.00015448688645847142, 0.00018417066894471645, 0.00021385443687904626, 0.00024353820481337607, 0.0002732219872996211, 0.00030290576978586614, 0.0003325895522721112, 0.00036227330565452576, 0.0003919570881407708, 0.00042164087062701583, 0.0004513246240094304, 0.00048100840649567544, 0.0005106921889819205, 0.0005403759423643351, 0.0005700597539544106, 0.0005997435073368251, 0.0006294272607192397, 0.0006591110141016543, 0.0006887948256917298, 0.0007184785790741444, 0.0007481623906642199, 0.0007778461440466344, 0.000807529897429049, 0.0008372137090191245, 0.0008668974624015391, 0.0008965812157839537, 0.0009262650273740292, 0.0009559487807564437, 0.0009856325341388583, 0.0010153163457289338, 0.0010450001573190093, 0.001074683852493763, 0.0011043676640838385, 0.001134051475673914, 0.0011637351708486676, 0.0011934189824387431, 0.0012231027940288186, 0.0012527864892035723, 0.0012824703007936478, 0.0013121541123837233, 0.0013418379239737988, 0.0013715217355638742, 0.001401205430738628, 0.0014308892423287034, 0.001460573053918779, 0.0014902567490935326, 0.001519940560683608, 0.0015496243722736835, 0.0015793080674484372]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 4.0, 13.0, 19.0, 16.0, 21.0, 30.0, 46.0, 53.0, 52.0, 62.0, 62.0, 66.0, 76.0, 72.0, 68.0, 64.0, 51.0, 38.0, 49.0, 33.0, 27.0, 16.0, 16.0, 15.0, 5.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002200007438659668, -0.00021190103143453598, -0.00020380131900310516, -0.00019570160657167435, -0.00018760189414024353, -0.00017950218170881271, -0.0001714024692773819, -0.00016330275684595108, -0.00015520304441452026, -0.00014710333198308945, -0.00013900361955165863, -0.00013090390712022781, -0.000122804194688797, -0.00011470448225736618, -0.00010660476982593536, -9.850505739450455e-05, -9.040534496307373e-05, -8.230563253164291e-05, -7.42059201002121e-05, -6.610620766878128e-05, -5.8006495237350464e-05, -4.990678280591965e-05, -4.180707037448883e-05, -3.3707357943058014e-05, -2.5607645511627197e-05, -1.750793308019638e-05, -9.408220648765564e-06, -1.3085082173347473e-06, 6.791204214096069e-06, 1.4890916645526886e-05, 2.2990629076957703e-05, 3.109034150838852e-05, 3.9190053939819336e-05, 4.728976637125015e-05, 5.538947880268097e-05, 6.348919123411179e-05, 7.15889036655426e-05, 7.968861609697342e-05, 8.778832852840424e-05, 9.588804095983505e-05, 0.00010398775339126587, 0.00011208746582269669, 0.0001201871782541275, 0.00012828689068555832, 0.00013638660311698914, 0.00014448631554841995, 0.00015258602797985077, 0.00016068574041128159, 0.0001687854528427124, 0.00017688516527414322, 0.00018498487770557404, 0.00019308459013700485, 0.00020118430256843567, 0.00020928401499986649, 0.0002173837274312973, 0.00022548343986272812, 0.00023358315229415894, 0.00024168286472558975, 0.00024978257715702057, 0.0002578822895884514, 0.0002659820020198822, 0.000274081714451313, 0.00028218142688274384, 0.00029028113931417465, 0.00029838085174560547]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 10.0, 13.0, 30.0, 26.0, 45.0, 75.0, 117.0, 173.0, 312.0, 562.0, 1020.0, 2247.0, 6335.0, 20367.0, 88901.0, 709674.0, 171580.0, 31956.0, 9001.0, 3180.0, 1345.0, 628.0, 345.0, 226.0, 122.0, 78.0, 45.0, 31.0, 30.0, 23.0, 12.0, 11.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022161006927490234, -0.00021502748131752014, -0.00020844489336013794, -0.00020186230540275574, -0.00019527971744537354, -0.00018869712948799133, -0.00018211454153060913, -0.00017553195357322693, -0.00016894936561584473, -0.00016236677765846252, -0.00015578418970108032, -0.00014920160174369812, -0.00014261901378631592, -0.00013603642582893372, -0.00012945383787155151, -0.0001228712499141693, -0.00011628866195678711, -0.00010970607399940491, -0.0001031234860420227, -9.65408980846405e-05, -8.99583101272583e-05, -8.33757221698761e-05, -7.67931342124939e-05, -7.02105462551117e-05, -6.362795829772949e-05, -5.704537034034729e-05, -5.046278238296509e-05, -4.3880194425582886e-05, -3.7297606468200684e-05, -3.071501851081848e-05, -2.413243055343628e-05, -1.7549842596054077e-05, -1.0967254638671875e-05, -4.384666681289673e-06, 2.1979212760925293e-06, 8.780509233474731e-06, 1.5363097190856934e-05, 2.1945685148239136e-05, 2.8528273105621338e-05, 3.511086106300354e-05, 4.169344902038574e-05, 4.8276036977767944e-05, 5.4858624935150146e-05, 6.144121289253235e-05, 6.802380084991455e-05, 7.460638880729675e-05, 8.118897676467896e-05, 8.777156472206116e-05, 9.435415267944336e-05, 0.00010093674063682556, 0.00010751932859420776, 0.00011410191655158997, 0.00012068450450897217, 0.00012726709246635437, 0.00013384968042373657, 0.00014043226838111877, 0.00014701485633850098, 0.00015359744429588318, 0.00016018003225326538, 0.00016676262021064758, 0.00017334520816802979, 0.000179927796125412, 0.0001865103840827942, 0.0001930929720401764, 0.0001996755599975586]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 15.0, 23.0, 37.0, 26.0, 51.0, 63.0, 99.0, 107.0, 143.0, 103.0, 100.0, 68.0, 52.0, 28.0, 20.0, 23.0, 9.0, 3.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5735626220703125e-05, -1.5035271644592285e-05, -1.4334917068481445e-05, -1.3634562492370605e-05, -1.2934207916259766e-05, -1.2233853340148926e-05, -1.1533498764038086e-05, -1.0833144187927246e-05, -1.0132789611816406e-05, -9.432435035705566e-06, -8.732080459594727e-06, -8.031725883483887e-06, -7.331371307373047e-06, -6.631016731262207e-06, -5.930662155151367e-06, -5.230307579040527e-06, -4.5299530029296875e-06, -3.829598426818848e-06, -3.129243850708008e-06, -2.428889274597168e-06, -1.7285346984863281e-06, -1.0281801223754883e-06, -3.2782554626464844e-07, 3.725290298461914e-07, 1.0728836059570312e-06, 1.773238182067871e-06, 2.473592758178711e-06, 3.1739473342895508e-06, 3.874301910400391e-06, 4.5746564865112305e-06, 5.27501106262207e-06, 5.97536563873291e-06, 6.67572021484375e-06, 7.37607479095459e-06, 8.07642936706543e-06, 8.77678394317627e-06, 9.47713851928711e-06, 1.017749309539795e-05, 1.0877847671508789e-05, 1.1578202247619629e-05, 1.2278556823730469e-05, 1.2978911399841309e-05, 1.3679265975952148e-05, 1.4379620552062988e-05, 1.5079975128173828e-05, 1.5780329704284668e-05, 1.6480684280395508e-05, 1.7181038856506348e-05, 1.7881393432617188e-05, 1.8581748008728027e-05, 1.9282102584838867e-05, 1.9982457160949707e-05, 2.0682811737060547e-05, 2.1383166313171387e-05, 2.2083520889282227e-05, 2.2783875465393066e-05, 2.3484230041503906e-05, 2.4184584617614746e-05, 2.4884939193725586e-05, 2.5585293769836426e-05, 2.6285648345947266e-05, 2.6986002922058105e-05, 2.7686357498168945e-05, 2.8386712074279785e-05, 2.9087066650390625e-05]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 11.0, 20.0, 14.0, 21.0, 28.0, 48.0, 69.0, 78.0, 109.0, 145.0, 231.0, 310.0, 445.0, 642.0, 947.0, 1451.0, 2111.0, 3305.0, 4832.0, 7817.0, 13028.0, 22214.0, 40288.0, 77669.0, 170858.0, 395572.0, 146863.0, 69618.0, 36396.0, 20303.0, 11825.0, 7391.0, 4655.0, 2966.0, 1921.0, 1333.0, 888.0, 652.0, 432.0, 306.0, 207.0, 132.0, 100.0, 78.0, 57.0, 42.0, 29.0, 24.0, 22.0, 15.0, 6.0, 9.0, 7.0, 2.0, 2.0, 3.0, 3.0], "bins": [-6.771087646484375e-05, -6.562191992998123e-05, -6.353296339511871e-05, -6.14440068602562e-05, -5.935505032539368e-05, -5.726609379053116e-05, -5.517713725566864e-05, -5.308818072080612e-05, -5.0999224185943604e-05, -4.8910267651081085e-05, -4.682131111621857e-05, -4.473235458135605e-05, -4.264339804649353e-05, -4.055444151163101e-05, -3.8465484976768494e-05, -3.6376528441905975e-05, -3.428757190704346e-05, -3.219861537218094e-05, -3.010965883731842e-05, -2.8020702302455902e-05, -2.5931745767593384e-05, -2.3842789232730865e-05, -2.1753832697868347e-05, -1.966487616300583e-05, -1.757591962814331e-05, -1.5486963093280792e-05, -1.3398006558418274e-05, -1.1309050023555756e-05, -9.220093488693237e-06, -7.131136953830719e-06, -5.042180418968201e-06, -2.9532238841056824e-06, -8.642673492431641e-07, 1.2246891856193542e-06, 3.3136457204818726e-06, 5.402602255344391e-06, 7.491558790206909e-06, 9.580515325069427e-06, 1.1669471859931946e-05, 1.3758428394794464e-05, 1.5847384929656982e-05, 1.79363414645195e-05, 2.002529799938202e-05, 2.2114254534244537e-05, 2.4203211069107056e-05, 2.6292167603969574e-05, 2.8381124138832092e-05, 3.047008067369461e-05, 3.255903720855713e-05, 3.464799374341965e-05, 3.6736950278282166e-05, 3.8825906813144684e-05, 4.09148633480072e-05, 4.300381988286972e-05, 4.509277641773224e-05, 4.718173295259476e-05, 4.9270689487457275e-05, 5.1359646022319794e-05, 5.344860255718231e-05, 5.553755909204483e-05, 5.762651562690735e-05, 5.971547216176987e-05, 6.180442869663239e-05, 6.38933852314949e-05, 6.598234176635742e-05]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 19.0, 12.0, 16.0, 17.0, 25.0, 37.0, 32.0, 33.0, 36.0, 32.0, 45.0, 30.0, 40.0, 49.0, 50.0, 40.0, 48.0, 47.0, 43.0, 34.0, 39.0, 33.0, 25.0, 29.0, 15.0, 16.0, 17.0, 19.0, 9.0, 8.0, 8.0, 5.0, 5.0, 7.0, 7.0, 3.0, 5.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.272294998168945e-05, -3.1682662665843964e-05, -3.0642375349998474e-05, -2.9602088034152985e-05, -2.8561800718307495e-05, -2.7521513402462006e-05, -2.6481226086616516e-05, -2.5440938770771027e-05, -2.4400651454925537e-05, -2.3360364139080048e-05, -2.2320076823234558e-05, -2.127978950738907e-05, -2.023950219154358e-05, -1.919921487569809e-05, -1.81589275598526e-05, -1.711864024400711e-05, -1.607835292816162e-05, -1.5038065612316132e-05, -1.3997778296470642e-05, -1.2957490980625153e-05, -1.1917203664779663e-05, -1.0876916348934174e-05, -9.836629033088684e-06, -8.796341717243195e-06, -7.756054401397705e-06, -6.7157670855522156e-06, -5.675479769706726e-06, -4.6351924538612366e-06, -3.594905138015747e-06, -2.5546178221702576e-06, -1.514330506324768e-06, -4.7404319047927856e-07, 5.662441253662109e-07, 1.6065314412117004e-06, 2.64681875705719e-06, 3.6871060729026794e-06, 4.727393388748169e-06, 5.7676807045936584e-06, 6.807968020439148e-06, 7.848255336284637e-06, 8.888542652130127e-06, 9.928829967975616e-06, 1.0969117283821106e-05, 1.2009404599666595e-05, 1.3049691915512085e-05, 1.4089979231357574e-05, 1.5130266547203064e-05, 1.6170553863048553e-05, 1.7210841178894043e-05, 1.8251128494739532e-05, 1.9291415810585022e-05, 2.033170312643051e-05, 2.1371990442276e-05, 2.241227775812149e-05, 2.345256507396698e-05, 2.449285238981247e-05, 2.553313970565796e-05, 2.657342702150345e-05, 2.7613714337348938e-05, 2.8654001653194427e-05, 2.9694288969039917e-05, 3.0734576284885406e-05, 3.1774863600730896e-05, 3.2815150916576385e-05, 3.3855438232421875e-05]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 5.0, 9.0, 16.0, 22.0, 30.0, 35.0, 52.0, 89.0, 121.0, 147.0, 177.0, 343.0, 530.0, 947.0, 1814.0, 4318.0, 12456.0, 49371.0, 356958.0, 530555.0, 65234.0, 15371.0, 5062.0, 1883.0, 1137.0, 676.0, 375.0, 258.0, 161.0, 109.0, 72.0, 57.0, 31.0, 29.0, 23.0, 20.0, 12.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2040138244628906e-05, -1.168716698884964e-05, -1.1334195733070374e-05, -1.0981224477291107e-05, -1.062825322151184e-05, -1.0275281965732574e-05, -9.922310709953308e-06, -9.569339454174042e-06, -9.216368198394775e-06, -8.863396942615509e-06, -8.510425686836243e-06, -8.157454431056976e-06, -7.80448317527771e-06, -7.451511919498444e-06, -7.098540663719177e-06, -6.745569407939911e-06, -6.3925981521606445e-06, -6.039626896381378e-06, -5.686655640602112e-06, -5.3336843848228455e-06, -4.980713129043579e-06, -4.627741873264313e-06, -4.274770617485046e-06, -3.92179936170578e-06, -3.5688281059265137e-06, -3.2158568501472473e-06, -2.862885594367981e-06, -2.5099143385887146e-06, -2.1569430828094482e-06, -1.8039718270301819e-06, -1.4510005712509155e-06, -1.0980293154716492e-06, -7.450580596923828e-07, -3.9208680391311646e-07, -3.91155481338501e-08, 3.1385570764541626e-07, 6.668269634246826e-07, 1.019798219203949e-06, 1.3727694749832153e-06, 1.7257407307624817e-06, 2.078711986541748e-06, 2.4316832423210144e-06, 2.7846544981002808e-06, 3.137625753879547e-06, 3.4905970096588135e-06, 3.84356826543808e-06, 4.196539521217346e-06, 4.5495107769966125e-06, 4.902482032775879e-06, 5.255453288555145e-06, 5.608424544334412e-06, 5.961395800113678e-06, 6.314367055892944e-06, 6.667338311672211e-06, 7.020309567451477e-06, 7.373280823230743e-06, 7.72625207901001e-06, 8.079223334789276e-06, 8.432194590568542e-06, 8.785165846347809e-06, 9.138137102127075e-06, 9.491108357906342e-06, 9.844079613685608e-06, 1.0197050869464874e-05, 1.055002212524414e-05]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 7.0, 0.0, 5.0, 10.0, 0.0, 8.0, 13.0, 0.0, 21.0, 23.0, 0.0, 25.0, 33.0, 0.0, 48.0, 0.0, 62.0, 60.0, 0.0, 79.0, 89.0, 0.0, 77.0, 71.0, 0.0, 79.0, 0.0, 57.0, 49.0, 0.0, 36.0, 30.0, 0.0, 27.0, 18.0, 0.0, 21.0, 18.0, 0.0, 6.0, 0.0, 12.0, 7.0, 0.0, 1.0, 6.0, 0.0, 7.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.3113021850585938e-06, -1.2731179594993591e-06, -1.2349337339401245e-06, -1.1967495083808899e-06, -1.1585652828216553e-06, -1.1203810572624207e-06, -1.082196831703186e-06, -1.0440126061439514e-06, -1.0058283805847168e-06, -9.676441550254822e-07, -9.294599294662476e-07, -8.912757039070129e-07, -8.530914783477783e-07, -8.149072527885437e-07, -7.767230272293091e-07, -7.385388016700745e-07, -7.003545761108398e-07, -6.621703505516052e-07, -6.239861249923706e-07, -5.85801899433136e-07, -5.476176738739014e-07, -5.094334483146667e-07, -4.7124922275543213e-07, -4.330649971961975e-07, -3.948807716369629e-07, -3.5669654607772827e-07, -3.1851232051849365e-07, -2.8032809495925903e-07, -2.421438694000244e-07, -2.039596438407898e-07, -1.6577541828155518e-07, -1.2759119272232056e-07, -8.940696716308594e-08, -5.122274160385132e-08, -1.30385160446167e-08, 2.514570951461792e-08, 6.332993507385254e-08, 1.0151416063308716e-07, 1.3969838619232178e-07, 1.778826117515564e-07, 2.1606683731079102e-07, 2.5425106287002563e-07, 2.9243528842926025e-07, 3.3061951398849487e-07, 3.688037395477295e-07, 4.069879651069641e-07, 4.4517219066619873e-07, 4.833564162254333e-07, 5.21540641784668e-07, 5.597248673439026e-07, 5.979090929031372e-07, 6.360933184623718e-07, 6.742775440216064e-07, 7.124617695808411e-07, 7.506459951400757e-07, 7.888302206993103e-07, 8.270144462585449e-07, 8.651986718177795e-07, 9.033828973770142e-07, 9.415671229362488e-07, 9.797513484954834e-07, 1.017935574054718e-06, 1.0561197996139526e-06, 1.0943040251731873e-06, 1.1324882507324219e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 17.0, 11.0, 27.0, 19.0, 27.0, 72.0, 52.0, 93.0, 105.0, 249.0, 256.0, 367.0, 829.0, 982.0, 1557.0, 2743.0, 7599.0, 12771.0, 31142.0, 98950.0, 650378.0, 159516.0, 44760.0, 20561.0, 6298.0, 3524.0, 1965.0, 1438.0, 705.0, 421.0, 372.0, 201.0, 134.0, 93.0, 106.0, 56.0, 30.0, 31.0, 17.0, 11.0, 18.0, 12.0, 3.0, 4.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.377696990966797e-06, -6.182119250297546e-06, -5.986541509628296e-06, -5.790963768959045e-06, -5.595386028289795e-06, -5.3998082876205444e-06, -5.204230546951294e-06, -5.0086528062820435e-06, -4.813075065612793e-06, -4.6174973249435425e-06, -4.421919584274292e-06, -4.2263418436050415e-06, -4.030764102935791e-06, -3.8351863622665405e-06, -3.63960862159729e-06, -3.4440308809280396e-06, -3.248453140258789e-06, -3.0528753995895386e-06, -2.857297658920288e-06, -2.6617199182510376e-06, -2.466142177581787e-06, -2.2705644369125366e-06, -2.074986696243286e-06, -1.8794089555740356e-06, -1.6838312149047852e-06, -1.4882534742355347e-06, -1.2926757335662842e-06, -1.0970979928970337e-06, -9.015202522277832e-07, -7.059425115585327e-07, -5.103647708892822e-07, -3.1478703022003174e-07, -1.1920928955078125e-07, 7.636845111846924e-08, 2.7194619178771973e-07, 4.675239324569702e-07, 6.631016731262207e-07, 8.586794137954712e-07, 1.0542571544647217e-06, 1.2498348951339722e-06, 1.4454126358032227e-06, 1.6409903764724731e-06, 1.8365681171417236e-06, 2.032145857810974e-06, 2.2277235984802246e-06, 2.423301339149475e-06, 2.6188790798187256e-06, 2.814456820487976e-06, 3.0100345611572266e-06, 3.205612301826477e-06, 3.4011900424957275e-06, 3.596767783164978e-06, 3.7923455238342285e-06, 3.987923264503479e-06, 4.1835010051727295e-06, 4.37907874584198e-06, 4.5746564865112305e-06, 4.770234227180481e-06, 4.9658119678497314e-06, 5.161389708518982e-06, 5.356967449188232e-06, 5.552545189857483e-06, 5.748122930526733e-06, 5.943700671195984e-06, 6.139278411865234e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 12.0, 13.0, 8.0, 18.0, 9.0, 49.0, 50.0, 27.0, 85.0, 59.0, 123.0, 66.0, 140.0, 123.0, 43.0, 50.0, 32.0, 26.0, 15.0, 7.0, 9.0, 2.0, 11.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9802322387695312e-06, -2.8852373361587524e-06, -2.7902424335479736e-06, -2.695247530937195e-06, -2.600252628326416e-06, -2.505257725715637e-06, -2.4102628231048584e-06, -2.3152679204940796e-06, -2.2202730178833008e-06, -2.125278115272522e-06, -2.030283212661743e-06, -1.9352883100509644e-06, -1.8402934074401855e-06, -1.7452985048294067e-06, -1.650303602218628e-06, -1.5553086996078491e-06, -1.4603137969970703e-06, -1.3653188943862915e-06, -1.2703239917755127e-06, -1.1753290891647339e-06, -1.080334186553955e-06, -9.853392839431763e-07, -8.903443813323975e-07, -7.953494787216187e-07, -7.003545761108398e-07, -6.05359673500061e-07, -5.103647708892822e-07, -4.153698682785034e-07, -3.203749656677246e-07, -2.253800630569458e-07, -1.30385160446167e-07, -3.5390257835388184e-08, 5.960464477539063e-08, 1.5459954738616943e-07, 2.4959444999694824e-07, 3.4458935260772705e-07, 4.3958425521850586e-07, 5.345791578292847e-07, 6.295740604400635e-07, 7.245689630508423e-07, 8.195638656616211e-07, 9.145587682723999e-07, 1.0095536708831787e-06, 1.1045485734939575e-06, 1.1995434761047363e-06, 1.2945383787155151e-06, 1.389533281326294e-06, 1.4845281839370728e-06, 1.5795230865478516e-06, 1.6745179891586304e-06, 1.7695128917694092e-06, 1.864507794380188e-06, 1.959502696990967e-06, 2.0544975996017456e-06, 2.1494925022125244e-06, 2.2444874048233032e-06, 2.339482307434082e-06, 2.434477210044861e-06, 2.5294721126556396e-06, 2.6244670152664185e-06, 2.7194619178771973e-06, 2.814456820487976e-06, 2.909451723098755e-06, 3.0044466257095337e-06, 3.0994415283203125e-06]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 12.0, 13.0, 19.0, 42.0, 81.0, 189.0, 336.0, 143.0, 74.0, 38.0, 24.0, 13.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.0008735902956686914, -0.0008565704920329154, -0.0008395506883971393, -0.0008225308847613633, -0.0008055110811255872, -0.0007884912774898112, -0.0007714714738540351, -0.0007544516702182591, -0.000737431866582483, -0.000720412062946707, -0.000703392259310931, -0.0006863724556751549, -0.0006693526520393789, -0.0006523328484036028, -0.0006353130447678268, -0.0006182932411320508, -0.0006012733792886138, -0.0005842535756528378, -0.0005672337720170617, -0.0005502139683812857, -0.0005331941647455096, -0.0005161743611097336, -0.0004991545574739575, -0.0004821347538381815, -0.00046511495020240545, -0.0004480951465666294, -0.00043107534293085337, -0.0004140555392950773, -0.0003970357356593013, -0.00038001593202352524, -0.0003629961283877492, -0.00034597632475197315, -0.000328956579323858, -0.000311936775688082, -0.00029491697205230594, -0.0002778971684165299, -0.00026087736478075385, -0.0002438575611449778, -0.00022683774295728654, -0.0002098179393215105, -0.00019279812113381922, -0.00017577831749804318, -0.00015875851386226714, -0.0001417387102264911, -0.00012471890659071505, -0.0001076990956789814, -9.067928476724774e-05, -7.36594811314717e-05, -5.663967749569565e-05, -3.961987385991961e-05, -2.2600066586164758e-05, -5.580259312409908e-06, 1.1439544323366135e-05, 2.8459347959142178e-05, 4.5479158870875835e-05, 6.249896250665188e-05, 7.951876614242792e-05, 9.653856977820396e-05, 0.00011355837341398001, 0.00013057817704975605, 0.0001475979806855321, 0.00016461778432130814, 0.0001816376025089994, 0.00019865740614477545, 0.0002156772097805515]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 12.0, 11.0, 6.0, 12.0, 11.0, 12.0, 13.0, 15.0, 18.0, 24.0, 24.0, 23.0, 27.0, 31.0, 41.0, 33.0, 39.0, 31.0, 51.0, 24.0, 49.0, 32.0, 31.0, 40.0, 38.0, 47.0, 30.0, 31.0, 27.0, 17.0, 27.0, 22.0, 17.0, 21.0, 17.0, 20.0, 8.0, 13.0, 12.0, 6.0, 7.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011730194091796875, -0.00011329818516969681, -0.00010929442942142487, -0.00010529067367315292, -0.00010128691792488098, -9.728316217660904e-05, -9.32794064283371e-05, -8.927565068006516e-05, -8.527189493179321e-05, -8.126813918352127e-05, -7.726438343524933e-05, -7.326062768697739e-05, -6.925687193870544e-05, -6.52531161904335e-05, -6.124936044216156e-05, -5.724560469388962e-05, -5.3241848945617676e-05, -4.9238093197345734e-05, -4.523433744907379e-05, -4.123058170080185e-05, -3.722682595252991e-05, -3.3223070204257965e-05, -2.9219314455986023e-05, -2.521555870771408e-05, -2.121180295944214e-05, -1.7208047211170197e-05, -1.3204291462898254e-05, -9.200535714626312e-06, -5.19677996635437e-06, -1.193024218082428e-06, 2.810731530189514e-06, 6.814487278461456e-06, 1.0818243026733398e-05, 1.482199877500534e-05, 1.8825754523277283e-05, 2.2829510271549225e-05, 2.6833266019821167e-05, 3.083702176809311e-05, 3.484077751636505e-05, 3.8844533264636993e-05, 4.2848289012908936e-05, 4.685204476118088e-05, 5.085580050945282e-05, 5.485955625772476e-05, 5.8863312005996704e-05, 6.286706775426865e-05, 6.687082350254059e-05, 7.087457925081253e-05, 7.487833499908447e-05, 7.888209074735641e-05, 8.288584649562836e-05, 8.68896022439003e-05, 9.089335799217224e-05, 9.489711374044418e-05, 9.890086948871613e-05, 0.00010290462523698807, 0.00010690838098526001, 0.00011091213673353195, 0.0001149158924818039, 0.00011891964823007584, 0.00012292340397834778, 0.00012692715972661972, 0.00013093091547489166, 0.0001349346712231636, 0.00013893842697143555]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 8.0, 7.0, 8.0, 18.0, 15.0, 21.0, 21.0, 48.0, 55.0, 82.0, 97.0, 117.0, 209.0, 285.0, 475.0, 798.0, 1402.0, 2500.0, 4320.0, 8246.0, 15682.0, 34121.0, 89278.0, 770508.0, 3052759.0, 127430.0, 44259.0, 18797.0, 9207.0, 4947.0, 2909.0, 1893.0, 1181.0, 821.0, 559.0, 336.0, 259.0, 169.0, 129.0, 90.0, 66.0, 33.0, 28.0, 31.0, 18.0, 12.0, 7.0, 12.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.00010186433792114258, -9.878911077976227e-05, -9.571388363838196e-05, -9.263865649700165e-05, -8.956342935562134e-05, -8.648820221424103e-05, -8.341297507286072e-05, -8.033774793148041e-05, -7.72625207901001e-05, -7.418729364871979e-05, -7.111206650733948e-05, -6.803683936595917e-05, -6.496161222457886e-05, -6.188638508319855e-05, -5.881115794181824e-05, -5.573593080043793e-05, -5.266070365905762e-05, -4.958547651767731e-05, -4.6510249376297e-05, -4.343502223491669e-05, -4.035979509353638e-05, -3.728456795215607e-05, -3.420934081077576e-05, -3.113411366939545e-05, -2.8058886528015137e-05, -2.4983659386634827e-05, -2.1908432245254517e-05, -1.8833205103874207e-05, -1.5757977962493896e-05, -1.2682750821113586e-05, -9.607523679733276e-06, -6.532296538352966e-06, -3.4570693969726562e-06, -3.818422555923462e-07, 2.693384885787964e-06, 5.768612027168274e-06, 8.843839168548584e-06, 1.1919066309928894e-05, 1.4994293451309204e-05, 1.8069520592689514e-05, 2.1144747734069824e-05, 2.4219974875450134e-05, 2.7295202016830444e-05, 3.0370429158210754e-05, 3.3445656299591064e-05, 3.6520883440971375e-05, 3.9596110582351685e-05, 4.2671337723731995e-05, 4.5746564865112305e-05, 4.8821792006492615e-05, 5.1897019147872925e-05, 5.4972246289253235e-05, 5.8047473430633545e-05, 6.112270057201385e-05, 6.419792771339417e-05, 6.727315485477448e-05, 7.034838199615479e-05, 7.34236091375351e-05, 7.64988362789154e-05, 7.957406342029572e-05, 8.264929056167603e-05, 8.572451770305634e-05, 8.879974484443665e-05, 9.187497198581696e-05, 9.495019912719727e-05]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 8.0, 8.0, 12.0, 9.0, 12.0, 21.0, 30.0, 35.0, 40.0, 65.0, 105.0, 113.0, 93.0, 119.0, 89.0, 67.0, 42.0, 38.0, 30.0, 16.0, 14.0, 8.0, 10.0, 2.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.906324177980423e-05, -1.8456950783729553e-05, -1.7850659787654877e-05, -1.72443687915802e-05, -1.6638077795505524e-05, -1.6031786799430847e-05, -1.542549580335617e-05, -1.4819204807281494e-05, -1.4212913811206818e-05, -1.3606622815132141e-05, -1.3000331819057465e-05, -1.2394040822982788e-05, -1.1787749826908112e-05, -1.1181458830833435e-05, -1.0575167834758759e-05, -9.968876838684082e-06, -9.362585842609406e-06, -8.756294846534729e-06, -8.150003850460052e-06, -7.543712854385376e-06, -6.9374218583106995e-06, -6.331130862236023e-06, -5.7248398661613464e-06, -5.11854887008667e-06, -4.512257874011993e-06, -3.905966877937317e-06, -3.2996758818626404e-06, -2.693384885787964e-06, -2.0870938897132874e-06, -1.4808028936386108e-06, -8.745118975639343e-07, -2.682209014892578e-07, 3.380700945854187e-07, 9.443610906600952e-07, 1.5506520867347717e-06, 2.1569430828094482e-06, 2.7632340788841248e-06, 3.3695250749588013e-06, 3.975816071033478e-06, 4.582107067108154e-06, 5.188398063182831e-06, 5.794689059257507e-06, 6.400980055332184e-06, 7.00727105140686e-06, 7.613562047481537e-06, 8.219853043556213e-06, 8.82614403963089e-06, 9.432435035705566e-06, 1.0038726031780243e-05, 1.064501702785492e-05, 1.1251308023929596e-05, 1.1857599020004272e-05, 1.2463890016078949e-05, 1.3070181012153625e-05, 1.3676472008228302e-05, 1.4282763004302979e-05, 1.4889054000377655e-05, 1.549534499645233e-05, 1.6101635992527008e-05, 1.6707926988601685e-05, 1.731421798467636e-05, 1.7920508980751038e-05, 1.8526799976825714e-05, 1.913309097290039e-05]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 20.0, 24.0, 31.0, 46.0, 80.0, 126.0, 197.0, 295.0, 528.0, 849.0, 1492.0, 2741.0, 5070.0, 9967.0, 21325.0, 48654.0, 128258.0, 600987.0, 2991211.0, 244899.0, 75856.0, 31589.0, 14383.0, 6985.0, 3780.0, 1933.0, 1154.0, 684.0, 402.0, 221.0, 139.0, 117.0, 69.0, 50.0, 32.0, 20.0, 17.0, 7.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.159875869750977e-05, -7.914472371339798e-05, -7.66906887292862e-05, -7.423665374517441e-05, -7.178261876106262e-05, -6.932858377695084e-05, -6.687454879283905e-05, -6.442051380872726e-05, -6.196647882461548e-05, -5.951244384050369e-05, -5.705840885639191e-05, -5.460437387228012e-05, -5.2150338888168335e-05, -4.969630390405655e-05, -4.724226891994476e-05, -4.478823393583298e-05, -4.233419895172119e-05, -3.9880163967609406e-05, -3.742612898349762e-05, -3.4972093999385834e-05, -3.251805901527405e-05, -3.0064024031162262e-05, -2.7609989047050476e-05, -2.515595406293869e-05, -2.2701919078826904e-05, -2.024788409471512e-05, -1.7793849110603333e-05, -1.5339814126491547e-05, -1.288577914237976e-05, -1.0431744158267975e-05, -7.977709174156189e-06, -5.523674190044403e-06, -3.069639205932617e-06, -6.156042218208313e-07, 1.8384307622909546e-06, 4.2924657464027405e-06, 6.746500730514526e-06, 9.200535714626312e-06, 1.1654570698738098e-05, 1.4108605682849884e-05, 1.656264066696167e-05, 1.9016675651073456e-05, 2.1470710635185242e-05, 2.3924745619297028e-05, 2.6378780603408813e-05, 2.88328155875206e-05, 3.1286850571632385e-05, 3.374088555574417e-05, 3.619492053985596e-05, 3.864895552396774e-05, 4.110299050807953e-05, 4.3557025492191315e-05, 4.60110604763031e-05, 4.8465095460414886e-05, 5.091913044452667e-05, 5.337316542863846e-05, 5.5827200412750244e-05, 5.828123539686203e-05, 6.0735270380973816e-05, 6.31893053650856e-05, 6.564334034919739e-05, 6.809737533330917e-05, 7.055141031742096e-05, 7.300544530153275e-05, 7.545948028564453e-05]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 10.0, 9.0, 21.0, 26.0, 29.0, 40.0, 53.0, 63.0, 79.0, 102.0, 151.0, 253.0, 654.0, 1275.0, 474.0, 202.0, 121.0, 100.0, 91.0, 60.0, 46.0, 51.0, 42.0, 24.0, 25.0, 20.0, 9.0, 15.0, 10.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.112774670124054e-05, -4.968419671058655e-05, -4.8240646719932556e-05, -4.6797096729278564e-05, -4.535354673862457e-05, -4.390999674797058e-05, -4.246644675731659e-05, -4.10228967666626e-05, -3.9579346776008606e-05, -3.8135796785354614e-05, -3.669224679470062e-05, -3.524869680404663e-05, -3.380514681339264e-05, -3.236159682273865e-05, -3.0918046832084656e-05, -2.9474496841430664e-05, -2.8030946850776672e-05, -2.658739686012268e-05, -2.514384686946869e-05, -2.3700296878814697e-05, -2.2256746888160706e-05, -2.0813196897506714e-05, -1.9369646906852722e-05, -1.792609691619873e-05, -1.648254692554474e-05, -1.5038996934890747e-05, -1.3595446944236755e-05, -1.2151896953582764e-05, -1.0708346962928772e-05, -9.26479697227478e-06, -7.821246981620789e-06, -6.377696990966797e-06, -4.934147000312805e-06, -3.4905970096588135e-06, -2.0470470190048218e-06, -6.034970283508301e-07, 8.400529623031616e-07, 2.2836029529571533e-06, 3.727152943611145e-06, 5.170702934265137e-06, 6.614252924919128e-06, 8.05780291557312e-06, 9.501352906227112e-06, 1.0944902896881104e-05, 1.2388452887535095e-05, 1.3832002878189087e-05, 1.527555286884308e-05, 1.671910285949707e-05, 1.8162652850151062e-05, 1.9606202840805054e-05, 2.1049752831459045e-05, 2.2493302822113037e-05, 2.393685281276703e-05, 2.538040280342102e-05, 2.6823952794075012e-05, 2.8267502784729004e-05, 2.9711052775382996e-05, 3.115460276603699e-05, 3.259815275669098e-05, 3.404170274734497e-05, 3.548525273799896e-05, 3.6928802728652954e-05, 3.8372352719306946e-05, 3.981590270996094e-05]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 24.0, 84.0, 288.0, 356.0, 129.0, 62.0, 27.0, 23.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003272871836088598, -0.00029459752840921283, -0.0002619078441057354, -0.00022921817435417324, -0.00019652850460261106, -0.0001638388348510489, -0.0001311491650994867, -9.845949534792453e-05, -6.576982559636235e-05, -3.3080155844800174e-05, -3.904860932379961e-07, 3.229918365832418e-05, 6.498885340988636e-05, 9.767852316144854e-05, 0.00013036819291301072, 0.0001630578626645729, 0.00019574753241613507, 0.00022843720216769725, 0.00026112687191925943, 0.00029381655622273684, 0.0003265062114223838, 0.00035919586662203074, 0.00039188555092550814, 0.00042457523522898555, 0.0004572648904286325, 0.0004899545456282794, 0.0005226442590355873, 0.0005553339142352343, 0.0005880235694348812, 0.0006207132246345282, 0.0006534028798341751, 0.000686092593241483, 0.0007187823066487908, 0.0007514719618484378, 0.0007841616170480847, 0.0008168513304553926, 0.0008495409856550395, 0.0008822306408546865, 0.0009149203542619944, 0.0009476100094616413, 0.0009802996646612883, 0.0010129893198609352, 0.0010456789750605822, 0.0010783686302602291, 0.001111058285459876, 0.0011437480570748448, 0.0011764377122744918, 0.0012091273674741387, 0.0012418170226737857, 0.0012745066778734326, 0.0013071963330730796, 0.0013398859882727265, 0.0013725757598876953, 0.0014052654150873423, 0.0014379550702869892, 0.0014706447254866362, 0.0015033343806862831, 0.00153602403588593, 0.001568713691085577, 0.001601403346285224, 0.001634093001484871, 0.0016667827730998397, 0.0016994724282994866, 0.0017321620834991336, 0.0017648517386987805]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 12.0, 12.0, 10.0, 17.0, 11.0, 14.0, 18.0, 19.0, 43.0, 32.0, 38.0, 33.0, 47.0, 55.0, 53.0, 55.0, 55.0, 52.0, 54.0, 55.0, 37.0, 34.0, 38.0, 34.0, 28.0, 24.0, 24.0, 20.0, 10.0, 15.0, 13.0, 10.0, 5.0, 6.0, 6.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00024056434631347656, -0.00023416057229042053, -0.0002277567982673645, -0.00022135302424430847, -0.00021494925022125244, -0.0002085454761981964, -0.00020214170217514038, -0.00019573792815208435, -0.00018933415412902832, -0.0001829303801059723, -0.00017652660608291626, -0.00017012283205986023, -0.0001637190580368042, -0.00015731528401374817, -0.00015091150999069214, -0.0001445077359676361, -0.00013810396194458008, -0.00013170018792152405, -0.00012529641389846802, -0.00011889263987541199, -0.00011248886585235596, -0.00010608509182929993, -9.96813178062439e-05, -9.327754378318787e-05, -8.687376976013184e-05, -8.04699957370758e-05, -7.406622171401978e-05, -6.766244769096375e-05, -6.125867366790771e-05, -5.4854899644851685e-05, -4.8451125621795654e-05, -4.2047351598739624e-05, -3.5643577575683594e-05, -2.9239803552627563e-05, -2.2836029529571533e-05, -1.6432255506515503e-05, -1.0028481483459473e-05, -3.6247074604034424e-06, 2.779066562652588e-06, 9.182840585708618e-06, 1.558661460876465e-05, 2.199038863182068e-05, 2.839416265487671e-05, 3.479793667793274e-05, 4.120171070098877e-05, 4.76054847240448e-05, 5.400925874710083e-05, 6.041303277015686e-05, 6.681680679321289e-05, 7.322058081626892e-05, 7.962435483932495e-05, 8.602812886238098e-05, 9.243190288543701e-05, 9.883567690849304e-05, 0.00010523945093154907, 0.0001116432249546051, 0.00011804699897766113, 0.00012445077300071716, 0.0001308545470237732, 0.00013725832104682922, 0.00014366209506988525, 0.00015006586909294128, 0.00015646964311599731, 0.00016287341713905334, 0.00016927719116210938]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 6.0, 10.0, 15.0, 13.0, 17.0, 26.0, 21.0, 39.0, 45.0, 81.0, 129.0, 195.0, 368.0, 641.0, 1191.0, 2298.0, 4860.0, 12481.0, 36727.0, 158675.0, 668289.0, 114094.0, 29540.0, 10002.0, 4204.0, 1976.0, 1070.0, 584.0, 318.0, 201.0, 117.0, 69.0, 44.0, 46.0, 28.0, 21.0, 22.0, 12.0, 11.0, 14.0, 7.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.00016295909881591797, -0.00015792995691299438, -0.0001529008150100708, -0.00014787167310714722, -0.00014284253120422363, -0.00013781338930130005, -0.00013278424739837646, -0.00012775510549545288, -0.0001227259635925293, -0.00011769682168960571, -0.00011266767978668213, -0.00010763853788375854, -0.00010260939598083496, -9.758025407791138e-05, -9.255111217498779e-05, -8.752197027206421e-05, -8.249282836914062e-05, -7.746368646621704e-05, -7.243454456329346e-05, -6.740540266036987e-05, -6.237626075744629e-05, -5.7347118854522705e-05, -5.231797695159912e-05, -4.728883504867554e-05, -4.225969314575195e-05, -3.723055124282837e-05, -3.2201409339904785e-05, -2.71722674369812e-05, -2.2143125534057617e-05, -1.7113983631134033e-05, -1.208484172821045e-05, -7.055699825286865e-06, -2.0265579223632812e-06, 3.0025839805603027e-06, 8.031725883483887e-06, 1.306086778640747e-05, 1.8090009689331055e-05, 2.311915159225464e-05, 2.8148293495178223e-05, 3.317743539810181e-05, 3.820657730102539e-05, 4.3235719203948975e-05, 4.826486110687256e-05, 5.329400300979614e-05, 5.8323144912719727e-05, 6.335228681564331e-05, 6.83814287185669e-05, 7.341057062149048e-05, 7.843971252441406e-05, 8.346885442733765e-05, 8.849799633026123e-05, 9.352713823318481e-05, 9.85562801361084e-05, 0.00010358542203903198, 0.00010861456394195557, 0.00011364370584487915, 0.00011867284774780273, 0.00012370198965072632, 0.0001287311315536499, 0.00013376027345657349, 0.00013878941535949707, 0.00014381855726242065, 0.00014884769916534424, 0.00015387684106826782, 0.0001589059829711914]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 15.0, 29.0, 23.0, 48.0, 58.0, 94.0, 129.0, 138.0, 119.0, 109.0, 73.0, 45.0, 35.0, 22.0, 16.0, 9.0, 6.0, 3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3768672943115234e-05, -1.3032928109169006e-05, -1.2297183275222778e-05, -1.156143844127655e-05, -1.0825693607330322e-05, -1.0089948773384094e-05, -9.354203939437866e-06, -8.618459105491638e-06, -7.88271427154541e-06, -7.146969437599182e-06, -6.411224603652954e-06, -5.675479769706726e-06, -4.939734935760498e-06, -4.20399010181427e-06, -3.468245267868042e-06, -2.732500433921814e-06, -1.996755599975586e-06, -1.261010766029358e-06, -5.252659320831299e-07, 2.1047890186309814e-07, 9.462237358093262e-07, 1.6819685697555542e-06, 2.4177134037017822e-06, 3.1534582376480103e-06, 3.889203071594238e-06, 4.624947905540466e-06, 5.360692739486694e-06, 6.096437573432922e-06, 6.83218240737915e-06, 7.567927241325378e-06, 8.303672075271606e-06, 9.039416909217834e-06, 9.775161743164062e-06, 1.051090657711029e-05, 1.1246651411056519e-05, 1.1982396245002747e-05, 1.2718141078948975e-05, 1.3453885912895203e-05, 1.418963074684143e-05, 1.4925375580787659e-05, 1.5661120414733887e-05, 1.6396865248680115e-05, 1.7132610082626343e-05, 1.786835491657257e-05, 1.86040997505188e-05, 1.9339844584465027e-05, 2.0075589418411255e-05, 2.0811334252357483e-05, 2.154707908630371e-05, 2.228282392024994e-05, 2.3018568754196167e-05, 2.3754313588142395e-05, 2.4490058422088623e-05, 2.522580325603485e-05, 2.596154808998108e-05, 2.6697292923927307e-05, 2.7433037757873535e-05, 2.8168782591819763e-05, 2.890452742576599e-05, 2.964027225971222e-05, 3.0376017093658447e-05, 3.1111761927604675e-05, 3.18475067615509e-05, 3.258325159549713e-05, 3.331899642944336e-05]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 19.0, 20.0, 32.0, 47.0, 81.0, 135.0, 179.0, 306.0, 473.0, 730.0, 1223.0, 1903.0, 3181.0, 5599.0, 9596.0, 17017.0, 31089.0, 57098.0, 120866.0, 364020.0, 234432.0, 94541.0, 46198.0, 25618.0, 14133.0, 8050.0, 4694.0, 2781.0, 1648.0, 1029.0, 638.0, 436.0, 260.0, 157.0, 113.0, 60.0, 56.0, 32.0, 23.0, 14.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.40256330370903e-05, -6.19497150182724e-05, -5.98737969994545e-05, -5.77978789806366e-05, -5.5721960961818695e-05, -5.3646042943000793e-05, -5.157012492418289e-05, -4.949420690536499e-05, -4.741828888654709e-05, -4.534237086772919e-05, -4.3266452848911285e-05, -4.1190534830093384e-05, -3.911461681127548e-05, -3.703869879245758e-05, -3.496278077363968e-05, -3.288686275482178e-05, -3.0810944736003876e-05, -2.8735026717185974e-05, -2.6659108698368073e-05, -2.458319067955017e-05, -2.250727266073227e-05, -2.0431354641914368e-05, -1.8355436623096466e-05, -1.6279518604278564e-05, -1.4203600585460663e-05, -1.2127682566642761e-05, -1.005176454782486e-05, -7.975846529006958e-06, -5.899928510189056e-06, -3.824010491371155e-06, -1.7480924725532532e-06, 3.2782554626464844e-07, 2.40374356508255e-06, 4.479661583900452e-06, 6.555579602718353e-06, 8.631497621536255e-06, 1.0707415640354156e-05, 1.2783333659172058e-05, 1.485925167798996e-05, 1.693516969680786e-05, 1.9011087715625763e-05, 2.1087005734443665e-05, 2.3162923753261566e-05, 2.5238841772079468e-05, 2.731475979089737e-05, 2.939067780971527e-05, 3.146659582853317e-05, 3.3542513847351074e-05, 3.5618431866168976e-05, 3.769434988498688e-05, 3.977026790380478e-05, 4.184618592262268e-05, 4.392210394144058e-05, 4.5998021960258484e-05, 4.8073939979076385e-05, 5.014985799789429e-05, 5.222577601671219e-05, 5.430169403553009e-05, 5.637761205434799e-05, 5.8453530073165894e-05, 6.0529448091983795e-05, 6.26053661108017e-05, 6.46812841296196e-05, 6.67572021484375e-05]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 7.0, 4.0, 9.0, 8.0, 13.0, 12.0, 16.0, 19.0, 17.0, 28.0, 21.0, 33.0, 42.0, 30.0, 35.0, 41.0, 38.0, 43.0, 50.0, 41.0, 41.0, 46.0, 56.0, 38.0, 47.0, 27.0, 30.0, 25.0, 21.0, 29.0, 22.0, 14.0, 25.0, 18.0, 5.0, 13.0, 11.0, 7.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.9587186872959137e-05, -2.841837704181671e-05, -2.7249567210674286e-05, -2.608075737953186e-05, -2.4911947548389435e-05, -2.374313771724701e-05, -2.2574327886104584e-05, -2.1405518054962158e-05, -2.0236708223819733e-05, -1.9067898392677307e-05, -1.789908856153488e-05, -1.6730278730392456e-05, -1.556146889925003e-05, -1.4392659068107605e-05, -1.322384923696518e-05, -1.2055039405822754e-05, -1.0886229574680328e-05, -9.717419743537903e-06, -8.548609912395477e-06, -7.379800081253052e-06, -6.210990250110626e-06, -5.042180418968201e-06, -3.873370587825775e-06, -2.7045607566833496e-06, -1.535750925540924e-06, -3.6694109439849854e-07, 8.01868736743927e-07, 1.9706785678863525e-06, 3.139488399028778e-06, 4.308298230171204e-06, 5.477108061313629e-06, 6.645917892456055e-06, 7.81472772359848e-06, 8.983537554740906e-06, 1.0152347385883331e-05, 1.1321157217025757e-05, 1.2489967048168182e-05, 1.3658776879310608e-05, 1.4827586710453033e-05, 1.599639654159546e-05, 1.7165206372737885e-05, 1.833401620388031e-05, 1.9502826035022736e-05, 2.067163586616516e-05, 2.1840445697307587e-05, 2.3009255528450012e-05, 2.4178065359592438e-05, 2.5346875190734863e-05, 2.651568502187729e-05, 2.7684494853019714e-05, 2.885330468416214e-05, 3.0022114515304565e-05, 3.119092434644699e-05, 3.2359734177589417e-05, 3.352854400873184e-05, 3.469735383987427e-05, 3.586616367101669e-05, 3.703497350215912e-05, 3.8203783333301544e-05, 3.937259316444397e-05, 4.0541402995586395e-05, 4.171021282672882e-05, 4.2879022657871246e-05, 4.404783248901367e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 13.0, 15.0, 11.0, 37.0, 40.0, 62.0, 92.0, 173.0, 216.0, 309.0, 487.0, 1083.0, 1387.0, 2192.0, 3641.0, 10747.0, 19292.0, 49544.0, 317244.0, 467052.0, 108156.0, 35164.0, 17609.0, 5663.0, 3188.0, 1853.0, 1343.0, 638.0, 439.0, 255.0, 238.0, 115.0, 59.0, 60.0, 42.0, 31.0, 15.0, 14.0, 7.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.67572021484375e-06, -6.481073796749115e-06, -6.28642737865448e-06, -6.091780960559845e-06, -5.89713454246521e-06, -5.702488124370575e-06, -5.50784170627594e-06, -5.313195288181305e-06, -5.11854887008667e-06, -4.923902451992035e-06, -4.7292560338974e-06, -4.534609615802765e-06, -4.33996319770813e-06, -4.145316779613495e-06, -3.95067036151886e-06, -3.756023943424225e-06, -3.56137752532959e-06, -3.366731107234955e-06, -3.17208468914032e-06, -2.977438271045685e-06, -2.78279185295105e-06, -2.588145434856415e-06, -2.3934990167617798e-06, -2.1988525986671448e-06, -2.0042061805725098e-06, -1.8095597624778748e-06, -1.6149133443832397e-06, -1.4202669262886047e-06, -1.2256205081939697e-06, -1.0309740900993347e-06, -8.363276720046997e-07, -6.416812539100647e-07, -4.470348358154297e-07, -2.523884177207947e-07, -5.774199962615967e-08, 1.3690441846847534e-07, 3.3155083656311035e-07, 5.261972546577454e-07, 7.208436727523804e-07, 9.154900908470154e-07, 1.1101365089416504e-06, 1.3047829270362854e-06, 1.4994293451309204e-06, 1.6940757632255554e-06, 1.8887221813201904e-06, 2.0833685994148254e-06, 2.2780150175094604e-06, 2.4726614356040955e-06, 2.6673078536987305e-06, 2.8619542717933655e-06, 3.0566006898880005e-06, 3.2512471079826355e-06, 3.4458935260772705e-06, 3.6405399441719055e-06, 3.8351863622665405e-06, 4.0298327803611755e-06, 4.2244791984558105e-06, 4.4191256165504456e-06, 4.6137720346450806e-06, 4.8084184527397156e-06, 5.003064870834351e-06, 5.197711288928986e-06, 5.392357707023621e-06, 5.587004125118256e-06, 5.781650543212891e-06]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 22.0, 30.0, 37.0, 33.0, 47.0, 66.0, 78.0, 91.0, 100.0, 88.0, 67.0, 60.0, 52.0, 39.0, 31.0, 27.0, 18.0, 16.0, 16.0, 5.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.0274892449378967e-06, -1.9688159227371216e-06, -1.9101426005363464e-06, -1.8514692783355713e-06, -1.7927959561347961e-06, -1.734122633934021e-06, -1.6754493117332458e-06, -1.6167759895324707e-06, -1.5581026673316956e-06, -1.4994293451309204e-06, -1.4407560229301453e-06, -1.3820827007293701e-06, -1.323409378528595e-06, -1.2647360563278198e-06, -1.2060627341270447e-06, -1.1473894119262695e-06, -1.0887160897254944e-06, -1.0300427675247192e-06, -9.71369445323944e-07, -9.126961231231689e-07, -8.540228009223938e-07, -7.953494787216187e-07, -7.366761565208435e-07, -6.780028343200684e-07, -6.193295121192932e-07, -5.606561899185181e-07, -5.019828677177429e-07, -4.4330954551696777e-07, -3.8463622331619263e-07, -3.259629011154175e-07, -2.6728957891464233e-07, -2.086162567138672e-07, -1.4994293451309204e-07, -9.12696123123169e-08, -3.259629011154175e-08, 2.60770320892334e-08, 8.475035429000854e-08, 1.434236764907837e-07, 2.0209699869155884e-07, 2.60770320892334e-07, 3.1944364309310913e-07, 3.781169652938843e-07, 4.367902874946594e-07, 4.954636096954346e-07, 5.541369318962097e-07, 6.128102540969849e-07, 6.7148357629776e-07, 7.301568984985352e-07, 7.888302206993103e-07, 8.475035429000854e-07, 9.061768651008606e-07, 9.648501873016357e-07, 1.0235235095024109e-06, 1.082196831703186e-06, 1.1408701539039612e-06, 1.1995434761047363e-06, 1.2582167983055115e-06, 1.3168901205062866e-06, 1.3755634427070618e-06, 1.434236764907837e-06, 1.492910087108612e-06, 1.5515834093093872e-06, 1.6102567315101624e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 17.0, 9.0, 18.0, 29.0, 31.0, 34.0, 69.0, 88.0, 103.0, 142.0, 191.0, 288.0, 333.0, 578.0, 823.0, 1069.0, 2726.0, 3057.0, 4530.0, 7491.0, 12702.0, 23119.0, 48146.0, 122209.0, 441460.0, 228577.0, 73682.0, 32865.0, 17012.0, 12929.0, 4685.0, 2963.0, 1956.0, 1388.0, 943.0, 631.0, 456.0, 329.0, 222.0, 173.0, 126.0, 101.0, 86.0, 50.0, 34.0, 24.0, 17.0, 16.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0], "bins": [-4.172325134277344e-06, -4.048459231853485e-06, -3.9245933294296265e-06, -3.800727427005768e-06, -3.676861524581909e-06, -3.5529956221580505e-06, -3.429129719734192e-06, -3.3052638173103333e-06, -3.1813979148864746e-06, -3.057532012462616e-06, -2.9336661100387573e-06, -2.8098002076148987e-06, -2.68593430519104e-06, -2.5620684027671814e-06, -2.4382025003433228e-06, -2.314336597919464e-06, -2.1904706954956055e-06, -2.066604793071747e-06, -1.942738890647888e-06, -1.8188729882240295e-06, -1.695007085800171e-06, -1.5711411833763123e-06, -1.4472752809524536e-06, -1.323409378528595e-06, -1.1995434761047363e-06, -1.0756775736808777e-06, -9.51811671257019e-07, -8.279457688331604e-07, -7.040798664093018e-07, -5.802139639854431e-07, -4.5634806156158447e-07, -3.3248215913772583e-07, -2.086162567138672e-07, -8.475035429000854e-08, 3.91155481338501e-08, 1.6298145055770874e-07, 2.868473529815674e-07, 4.10713255405426e-07, 5.345791578292847e-07, 6.584450602531433e-07, 7.82310962677002e-07, 9.061768651008606e-07, 1.0300427675247192e-06, 1.1539086699485779e-06, 1.2777745723724365e-06, 1.4016404747962952e-06, 1.5255063772201538e-06, 1.6493722796440125e-06, 1.773238182067871e-06, 1.8971040844917297e-06, 2.0209699869155884e-06, 2.144835889339447e-06, 2.2687017917633057e-06, 2.3925676941871643e-06, 2.516433596611023e-06, 2.6402994990348816e-06, 2.7641654014587402e-06, 2.888031303882599e-06, 3.0118972063064575e-06, 3.135763108730316e-06, 3.259629011154175e-06, 3.3834949135780334e-06, 3.507360816001892e-06, 3.6312267184257507e-06, 3.7550926208496094e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 2.0, 9.0, 12.0, 6.0, 11.0, 21.0, 18.0, 15.0, 49.0, 20.0, 31.0, 65.0, 51.0, 62.0, 134.0, 63.0, 111.0, 48.0, 41.0, 64.0, 29.0, 18.0, 23.0, 16.0, 7.0, 14.0, 4.0, 8.0, 7.0, 2.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5425106287002563e-06, -2.462416887283325e-06, -2.382323145866394e-06, -2.302229404449463e-06, -2.2221356630325317e-06, -2.1420419216156006e-06, -2.0619481801986694e-06, -1.9818544387817383e-06, -1.9017606973648071e-06, -1.821666955947876e-06, -1.7415732145309448e-06, -1.6614794731140137e-06, -1.5813857316970825e-06, -1.5012919902801514e-06, -1.4211982488632202e-06, -1.341104507446289e-06, -1.261010766029358e-06, -1.1809170246124268e-06, -1.1008232831954956e-06, -1.0207295417785645e-06, -9.406358003616333e-07, -8.605420589447021e-07, -7.80448317527771e-07, -7.003545761108398e-07, -6.202608346939087e-07, -5.401670932769775e-07, -4.600733518600464e-07, -3.7997961044311523e-07, -2.998858690261841e-07, -2.1979212760925293e-07, -1.3969838619232178e-07, -5.960464477539063e-08, 2.0489096641540527e-08, 1.0058283805847168e-07, 1.8067657947540283e-07, 2.60770320892334e-07, 3.4086406230926514e-07, 4.209578037261963e-07, 5.010515451431274e-07, 5.811452865600586e-07, 6.612390279769897e-07, 7.413327693939209e-07, 8.21426510810852e-07, 9.015202522277832e-07, 9.816139936447144e-07, 1.0617077350616455e-06, 1.1418014764785767e-06, 1.2218952178955078e-06, 1.301988959312439e-06, 1.3820827007293701e-06, 1.4621764421463013e-06, 1.5422701835632324e-06, 1.6223639249801636e-06, 1.7024576663970947e-06, 1.7825514078140259e-06, 1.862645149230957e-06, 1.942738890647888e-06, 2.0228326320648193e-06, 2.1029263734817505e-06, 2.1830201148986816e-06, 2.263113856315613e-06, 2.343207597732544e-06, 2.423301339149475e-06, 2.5033950805664062e-06]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 12.0, 15.0, 24.0, 41.0, 90.0, 171.0, 340.0, 139.0, 66.0, 41.0, 27.0, 14.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0008525124285370111, -0.0008359133498743176, -0.0008193142130039632, -0.0008027150761336088, -0.0007861159974709153, -0.0007695169188082218, -0.0007529177819378674, -0.000736318645067513, -0.0007197195664048195, -0.000703120487742126, -0.0006865213508717716, -0.0006699222140014172, -0.0006533231353387237, -0.0006367240566760302, -0.0006201249198056757, -0.0006035257829353213, -0.0005869267042726278, -0.0005703276256099343, -0.0005537284887395799, -0.0005371293518692255, -0.000520530273206532, -0.0005039311945438385, -0.0004873320576734841, -0.00047073294990696013, -0.00045413384214043617, -0.0004375347343739122, -0.00042093562660738826, -0.0004043365188408643, -0.00038773741107434034, -0.0003711383033078164, -0.00035453919554129243, -0.00033794008777476847, -0.0003213409800082445, -0.00030474187224172056, -0.0002881427644751966, -0.00027154365670867264, -0.0002549445489421487, -0.00023834544117562473, -0.00022174633340910077, -0.00020514722564257681, -0.00018854813242796808, -0.00017194902466144413, -0.00015534991689492017, -0.0001387508091283962, -0.00012215170136187226, -0.0001055525935953483, -8.895348582882434e-05, -7.235437806230038e-05, -5.575527029577643e-05, -3.915616252925247e-05, -2.2557054762728512e-05, -5.957946996204555e-06, 1.0641160770319402e-05, 2.724026853684336e-05, 4.383937630336732e-05, 6.0438484069891274e-05, 7.703759183641523e-05, 9.363669960293919e-05, 0.00011023580736946315, 0.0001268349151359871, 0.00014343402290251106, 0.00016003313066903502, 0.00017663223843555897, 0.00019323134620208293, 0.0002098304539686069]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 5.0, 7.0, 6.0, 10.0, 16.0, 11.0, 19.0, 29.0, 28.0, 26.0, 24.0, 22.0, 45.0, 34.0, 42.0, 38.0, 64.0, 40.0, 54.0, 46.0, 41.0, 37.0, 31.0, 49.0, 33.0, 38.0, 33.0, 24.0, 18.0, 19.0, 25.0, 13.0, 13.0, 15.0, 13.0, 11.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001245737075805664, -0.00011979695409536362, -0.00011502020061016083, -0.00011024344712495804, -0.00010546669363975525, -0.00010068994015455246, -9.591318666934967e-05, -9.113643318414688e-05, -8.635967969894409e-05, -8.15829262137413e-05, -7.680617272853851e-05, -7.202941924333572e-05, -6.725266575813293e-05, -6.247591227293015e-05, -5.7699158787727356e-05, -5.292240530252457e-05, -4.814565181732178e-05, -4.336889833211899e-05, -3.85921448469162e-05, -3.381539136171341e-05, -2.903863787651062e-05, -2.426188439130783e-05, -1.948513090610504e-05, -1.4708377420902252e-05, -9.931623935699463e-06, -5.154870450496674e-06, -3.781169652938843e-07, 4.398636519908905e-06, 9.175390005111694e-06, 1.3952143490314484e-05, 1.8728896975517273e-05, 2.3505650460720062e-05, 2.828240394592285e-05, 3.305915743112564e-05, 3.783591091632843e-05, 4.261266440153122e-05, 4.738941788673401e-05, 5.21661713719368e-05, 5.694292485713959e-05, 6.171967834234238e-05, 6.649643182754517e-05, 7.127318531274796e-05, 7.604993879795074e-05, 8.082669228315353e-05, 8.560344576835632e-05, 9.038019925355911e-05, 9.51569527387619e-05, 9.993370622396469e-05, 0.00010471045970916748, 0.00010948721319437027, 0.00011426396667957306, 0.00011904072016477585, 0.00012381747364997864, 0.00012859422713518143, 0.00013337098062038422, 0.000138147734105587, 0.0001429244875907898, 0.00014770124107599258, 0.00015247799456119537, 0.00015725474804639816, 0.00016203150153160095, 0.00016680825501680374, 0.00017158500850200653, 0.00017636176198720932, 0.0001811385154724121]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 7.0, 28.0, 40.0, 56.0, 107.0, 160.0, 285.0, 499.0, 780.0, 1454.0, 2779.0, 5560.0, 12899.0, 34595.0, 128537.0, 3457191.0, 430684.0, 73320.0, 24187.0, 10025.0, 4773.0, 2638.0, 1417.0, 769.0, 448.0, 279.0, 227.0, 127.0, 82.0, 62.0, 59.0, 41.0, 39.0, 32.0, 22.0, 17.0, 13.0, 13.0, 8.0, 4.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.612871170043945e-05, -8.217524737119675e-05, -7.822178304195404e-05, -7.426831871271133e-05, -7.031485438346863e-05, -6.636139005422592e-05, -6.240792572498322e-05, -5.845446139574051e-05, -5.45009970664978e-05, -5.0547532737255096e-05, -4.659406840801239e-05, -4.2640604078769684e-05, -3.868713974952698e-05, -3.473367542028427e-05, -3.0780211091041565e-05, -2.682674676179886e-05, -2.2873282432556152e-05, -1.8919818103313446e-05, -1.496635377407074e-05, -1.1012889444828033e-05, -7.059425115585327e-06, -3.105960786342621e-06, 8.475035429000854e-07, 4.800967872142792e-06, 8.754432201385498e-06, 1.2707896530628204e-05, 1.666136085987091e-05, 2.0614825189113617e-05, 2.4568289518356323e-05, 2.852175384759903e-05, 3.2475218176841736e-05, 3.642868250608444e-05, 4.038214683532715e-05, 4.4335611164569855e-05, 4.828907549381256e-05, 5.224253982305527e-05, 5.6196004152297974e-05, 6.014946848154068e-05, 6.410293281078339e-05, 6.805639714002609e-05, 7.20098614692688e-05, 7.59633257985115e-05, 7.991679012775421e-05, 8.387025445699692e-05, 8.782371878623962e-05, 9.177718311548233e-05, 9.573064744472504e-05, 9.968411177396774e-05, 0.00010363757610321045, 0.00010759104043245316, 0.00011154450476169586, 0.00011549796909093857, 0.00011945143342018127, 0.00012340489774942398, 0.0001273583620786667, 0.0001313118264079094, 0.0001352652907371521, 0.0001392187550663948, 0.0001431722193956375, 0.00014712568372488022, 0.00015107914805412292, 0.00015503261238336563, 0.00015898607671260834, 0.00016293954104185104, 0.00016689300537109375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 17.0, 10.0, 16.0, 31.0, 42.0, 49.0, 77.0, 115.0, 111.0, 98.0, 111.0, 74.0, 73.0, 47.0, 39.0, 13.0, 17.0, 13.0, 5.0, 13.0, 4.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4007091522216797e-05, -1.3346783816814423e-05, -1.2686476111412048e-05, -1.2026168406009674e-05, -1.13658607006073e-05, -1.0705552995204926e-05, -1.0045245289802551e-05, -9.384937584400177e-06, -8.724629878997803e-06, -8.064322173595428e-06, -7.404014468193054e-06, -6.74370676279068e-06, -6.083399057388306e-06, -5.423091351985931e-06, -4.762783646583557e-06, -4.102475941181183e-06, -3.4421682357788086e-06, -2.7818605303764343e-06, -2.12155282497406e-06, -1.4612451195716858e-06, -8.009374141693115e-07, -1.4062970876693726e-07, 5.19677996635437e-07, 1.1799857020378113e-06, 1.8402934074401855e-06, 2.50060111284256e-06, 3.160908818244934e-06, 3.821216523647308e-06, 4.481524229049683e-06, 5.141831934452057e-06, 5.802139639854431e-06, 6.462447345256805e-06, 7.12275505065918e-06, 7.783062756061554e-06, 8.443370461463928e-06, 9.103678166866302e-06, 9.763985872268677e-06, 1.0424293577671051e-05, 1.1084601283073425e-05, 1.17449089884758e-05, 1.2405216693878174e-05, 1.3065524399280548e-05, 1.3725832104682922e-05, 1.4386139810085297e-05, 1.5046447515487671e-05, 1.5706755220890045e-05, 1.636706292629242e-05, 1.7027370631694794e-05, 1.7687678337097168e-05, 1.8347986042499542e-05, 1.9008293747901917e-05, 1.966860145330429e-05, 2.0328909158706665e-05, 2.098921686410904e-05, 2.1649524569511414e-05, 2.2309832274913788e-05, 2.2970139980316162e-05, 2.3630447685718536e-05, 2.429075539112091e-05, 2.4951063096523285e-05, 2.561137080192566e-05, 2.6271678507328033e-05, 2.6931986212730408e-05, 2.7592293918132782e-05, 2.8252601623535156e-05]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 11.0, 15.0, 10.0, 19.0, 29.0, 50.0, 79.0, 90.0, 150.0, 227.0, 339.0, 470.0, 729.0, 1181.0, 1795.0, 2693.0, 4354.0, 7024.0, 11513.0, 20624.0, 35191.0, 65967.0, 139786.0, 402309.0, 2671618.0, 494146.0, 166636.0, 73792.0, 38452.0, 21535.0, 12810.0, 7424.0, 4676.0, 2946.0, 1864.0, 1284.0, 789.0, 539.0, 359.0, 240.0, 184.0, 122.0, 83.0, 39.0, 26.0, 26.0, 14.0, 11.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.137920379638672e-05, -4.975218325853348e-05, -4.812516272068024e-05, -4.6498142182826996e-05, -4.4871121644973755e-05, -4.3244101107120514e-05, -4.161708056926727e-05, -3.999006003141403e-05, -3.836303949356079e-05, -3.673601895570755e-05, -3.510899841785431e-05, -3.348197788000107e-05, -3.185495734214783e-05, -3.0227936804294586e-05, -2.8600916266441345e-05, -2.6973895728588104e-05, -2.5346875190734863e-05, -2.3719854652881622e-05, -2.209283411502838e-05, -2.046581357717514e-05, -1.88387930393219e-05, -1.721177250146866e-05, -1.5584751963615417e-05, -1.3957731425762177e-05, -1.2330710887908936e-05, -1.0703690350055695e-05, -9.076669812202454e-06, -7.449649274349213e-06, -5.822628736495972e-06, -4.195608198642731e-06, -2.5685876607894897e-06, -9.415671229362488e-07, 6.854534149169922e-07, 2.312473952770233e-06, 3.939494490623474e-06, 5.566515028476715e-06, 7.193535566329956e-06, 8.820556104183197e-06, 1.0447576642036438e-05, 1.2074597179889679e-05, 1.370161771774292e-05, 1.532863825559616e-05, 1.6955658793449402e-05, 1.8582679331302643e-05, 2.0209699869155884e-05, 2.1836720407009125e-05, 2.3463740944862366e-05, 2.5090761482715607e-05, 2.6717782020568848e-05, 2.834480255842209e-05, 2.997182309627533e-05, 3.159884363412857e-05, 3.322586417198181e-05, 3.485288470983505e-05, 3.6479905247688293e-05, 3.8106925785541534e-05, 3.9733946323394775e-05, 4.1360966861248016e-05, 4.298798739910126e-05, 4.46150079369545e-05, 4.624202847480774e-05, 4.786904901266098e-05, 4.949606955051422e-05, 5.112309008836746e-05, 5.27501106262207e-05]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 8.0, 6.0, 14.0, 14.0, 19.0, 19.0, 29.0, 29.0, 44.0, 48.0, 55.0, 83.0, 95.0, 105.0, 130.0, 158.0, 263.0, 582.0, 960.0, 458.0, 186.0, 129.0, 112.0, 86.0, 68.0, 64.0, 44.0, 30.0, 34.0, 35.0, 18.0, 22.0, 27.0, 19.0, 11.0, 14.0, 13.0, 6.0, 5.0, 6.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.082918167114258e-05, -3.967713564634323e-05, -3.8525089621543884e-05, -3.737304359674454e-05, -3.622099757194519e-05, -3.5068951547145844e-05, -3.3916905522346497e-05, -3.276485949754715e-05, -3.16128134727478e-05, -3.0460767447948456e-05, -2.930872142314911e-05, -2.8156675398349762e-05, -2.7004629373550415e-05, -2.5852583348751068e-05, -2.470053732395172e-05, -2.3548491299152374e-05, -2.2396445274353027e-05, -2.124439924955368e-05, -2.0092353224754333e-05, -1.8940307199954987e-05, -1.778826117515564e-05, -1.6636215150356293e-05, -1.5484169125556946e-05, -1.4332123100757599e-05, -1.3180077075958252e-05, -1.2028031051158905e-05, -1.0875985026359558e-05, -9.723939001560211e-06, -8.571892976760864e-06, -7.419846951961517e-06, -6.26780092716217e-06, -5.1157549023628235e-06, -3.9637088775634766e-06, -2.8116628527641296e-06, -1.6596168279647827e-06, -5.075708031654358e-07, 6.444752216339111e-07, 1.796521246433258e-06, 2.948567271232605e-06, 4.100613296031952e-06, 5.252659320831299e-06, 6.404705345630646e-06, 7.556751370429993e-06, 8.70879739522934e-06, 9.860843420028687e-06, 1.1012889444828033e-05, 1.216493546962738e-05, 1.3316981494426727e-05, 1.4469027519226074e-05, 1.562107354402542e-05, 1.6773119568824768e-05, 1.7925165593624115e-05, 1.9077211618423462e-05, 2.022925764322281e-05, 2.1381303668022156e-05, 2.2533349692821503e-05, 2.368539571762085e-05, 2.4837441742420197e-05, 2.5989487767219543e-05, 2.714153379201889e-05, 2.8293579816818237e-05, 2.9445625841617584e-05, 3.059767186641693e-05, 3.174971789121628e-05, 3.2901763916015625e-05]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 9.0, 11.0, 14.0, 19.0, 47.0, 46.0, 69.0, 132.0, 170.0, 141.0, 95.0, 58.0, 57.0, 34.0, 23.0, 21.0, 12.0, 10.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002866583818104118, -0.0002739180054049939, -0.00026117762899957597, -0.0002484372234903276, -0.00023569684708490968, -0.00022295647067949176, -0.00021021609427407384, -0.00019747571786865592, -0.00018473532691132277, -0.00017199495050590485, -0.0001592545595485717, -0.0001465141831431538, -0.00013377380673773587, -0.00012103341578040272, -0.0001082930393749848, -9.555265569360927e-05, -8.281227201223373e-05, -7.00718883308582e-05, -5.7331508287461475e-05, -4.459112824406475e-05, -3.1850744562689215e-05, -1.911036088131368e-05, -6.3699844758957624e-06, 6.370399205479771e-06, 1.9110782886855304e-05, 3.185116656823084e-05, 4.4591546611627564e-05, 5.733192665502429e-05, 7.007231033639982e-05, 8.281269401777536e-05, 9.555307042319328e-05, 0.00010829345410456881, 0.00012103380868211389, 0.0001337741850875318, 0.00014651457604486495, 0.00015925495245028287, 0.00017199534340761602, 0.00018473571981303394, 0.00019747609621845186, 0.00021021647262386978, 0.00022295686358120292, 0.00023569723998662084, 0.000248437630943954, 0.0002611780073493719, 0.00027391838375478983, 0.00028665876016020775, 0.00029939913656562567, 0.00031213954207487404, 0.00032487991848029196, 0.0003376202948857099, 0.0003503606712911278, 0.0003631010768003762, 0.0003758414532057941, 0.000388581829611212, 0.00040132220601662993, 0.00041406258242204785, 0.00042680295882746577, 0.0004395433352328837, 0.0004522837116383016, 0.00046502408804371953, 0.0004777644935529679, 0.0004905048990622163, 0.0005032452754676342, 0.0005159856518730521, 0.00052872602827847]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 8.0, 16.0, 16.0, 16.0, 20.0, 21.0, 28.0, 26.0, 23.0, 31.0, 34.0, 27.0, 30.0, 32.0, 44.0, 40.0, 44.0, 37.0, 46.0, 31.0, 37.0, 35.0, 34.0, 29.0, 26.0, 30.0, 23.0, 17.0, 29.0, 23.0, 20.0, 11.0, 12.0, 12.0, 14.0, 14.0, 6.0, 5.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013560056686401367, -0.0001307651400566101, -0.00012592971324920654, -0.00012109428644180298, -0.00011625885963439941, -0.00011142343282699585, -0.00010658800601959229, -0.00010175257921218872, -9.691715240478516e-05, -9.208172559738159e-05, -8.724629878997803e-05, -8.241087198257446e-05, -7.75754451751709e-05, -7.274001836776733e-05, -6.790459156036377e-05, -6.30691647529602e-05, -5.823373794555664e-05, -5.3398311138153076e-05, -4.856288433074951e-05, -4.372745752334595e-05, -3.889203071594238e-05, -3.405660390853882e-05, -2.9221177101135254e-05, -2.438575029373169e-05, -1.9550323486328125e-05, -1.471489667892456e-05, -9.879469871520996e-06, -5.044043064117432e-06, -2.086162567138672e-07, 4.626810550689697e-06, 9.462237358093262e-06, 1.4297664165496826e-05, 1.913309097290039e-05, 2.3968517780303955e-05, 2.880394458770752e-05, 3.3639371395111084e-05, 3.847479820251465e-05, 4.331022500991821e-05, 4.814565181732178e-05, 5.298107862472534e-05, 5.7816505432128906e-05, 6.265193223953247e-05, 6.748735904693604e-05, 7.23227858543396e-05, 7.715821266174316e-05, 8.199363946914673e-05, 8.682906627655029e-05, 9.166449308395386e-05, 9.649991989135742e-05, 0.00010133534669876099, 0.00010617077350616455, 0.00011100620031356812, 0.00011584162712097168, 0.00012067705392837524, 0.0001255124807357788, 0.00013034790754318237, 0.00013518333435058594, 0.0001400187611579895, 0.00014485418796539307, 0.00014968961477279663, 0.0001545250415802002, 0.00015936046838760376, 0.00016419589519500732, 0.0001690313220024109, 0.00017386674880981445]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 6.0, 7.0, 4.0, 9.0, 17.0, 23.0, 23.0, 35.0, 57.0, 71.0, 112.0, 207.0, 373.0, 592.0, 1235.0, 2832.0, 6961.0, 19686.0, 77562.0, 651626.0, 226351.0, 40087.0, 11980.0, 4602.0, 1950.0, 924.0, 466.0, 260.0, 167.0, 105.0, 71.0, 34.0, 24.0, 17.0, 21.0, 20.0, 9.0, 10.0, 3.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00020384788513183594, -0.00019743293523788452, -0.0001910179853439331, -0.0001846030354499817, -0.00017818808555603027, -0.00017177313566207886, -0.00016535818576812744, -0.00015894323587417603, -0.0001525282859802246, -0.0001461133360862732, -0.00013969838619232178, -0.00013328343629837036, -0.00012686848640441895, -0.00012045353651046753, -0.00011403858661651611, -0.0001076236367225647, -0.00010120868682861328, -9.479373693466187e-05, -8.837878704071045e-05, -8.196383714675903e-05, -7.554888725280762e-05, -6.91339373588562e-05, -6.271898746490479e-05, -5.630403757095337e-05, -4.988908767700195e-05, -4.347413778305054e-05, -3.705918788909912e-05, -3.0644237995147705e-05, -2.422928810119629e-05, -1.7814338207244873e-05, -1.1399388313293457e-05, -4.984438419342041e-06, 1.430511474609375e-06, 7.845461368560791e-06, 1.4260411262512207e-05, 2.0675361156463623e-05, 2.709031105041504e-05, 3.3505260944366455e-05, 3.992021083831787e-05, 4.633516073226929e-05, 5.27501106262207e-05, 5.916506052017212e-05, 6.558001041412354e-05, 7.199496030807495e-05, 7.840991020202637e-05, 8.482486009597778e-05, 9.12398099899292e-05, 9.765475988388062e-05, 0.00010406970977783203, 0.00011048465967178345, 0.00011689960956573486, 0.00012331455945968628, 0.0001297295093536377, 0.0001361444592475891, 0.00014255940914154053, 0.00014897435903549194, 0.00015538930892944336, 0.00016180425882339478, 0.0001682192087173462, 0.0001746341586112976, 0.00018104910850524902, 0.00018746405839920044, 0.00019387900829315186, 0.00020029395818710327, 0.0002067089080810547]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 11.0, 15.0, 17.0, 29.0, 31.0, 66.0, 79.0, 116.0, 133.0, 125.0, 111.0, 75.0, 50.0, 45.0, 20.0, 19.0, 13.0, 8.0, 10.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.5157274901866913e-05, -1.4400109648704529e-05, -1.3642944395542145e-05, -1.288577914237976e-05, -1.2128613889217377e-05, -1.1371448636054993e-05, -1.0614283382892609e-05, -9.857118129730225e-06, -9.09995287656784e-06, -8.342787623405457e-06, -7.5856223702430725e-06, -6.8284571170806885e-06, -6.0712918639183044e-06, -5.31412661075592e-06, -4.556961357593536e-06, -3.7997961044311523e-06, -3.0426308512687683e-06, -2.2854655981063843e-06, -1.5283003449440002e-06, -7.711350917816162e-07, -1.3969838619232178e-08, 7.431954145431519e-07, 1.5003606677055359e-06, 2.25752592086792e-06, 3.014691174030304e-06, 3.771856427192688e-06, 4.529021680355072e-06, 5.286186933517456e-06, 6.04335218667984e-06, 6.800517439842224e-06, 7.557682693004608e-06, 8.314847946166992e-06, 9.072013199329376e-06, 9.82917845249176e-06, 1.0586343705654144e-05, 1.1343508958816528e-05, 1.2100674211978912e-05, 1.2857839465141296e-05, 1.361500471830368e-05, 1.4372169971466064e-05, 1.5129335224628448e-05, 1.5886500477790833e-05, 1.6643665730953217e-05, 1.74008309841156e-05, 1.8157996237277985e-05, 1.891516149044037e-05, 1.9672326743602753e-05, 2.0429491996765137e-05, 2.118665724992752e-05, 2.1943822503089905e-05, 2.270098775625229e-05, 2.3458153009414673e-05, 2.4215318262577057e-05, 2.497248351573944e-05, 2.5729648768901825e-05, 2.648681402206421e-05, 2.7243979275226593e-05, 2.8001144528388977e-05, 2.875830978155136e-05, 2.9515475034713745e-05, 3.027264028787613e-05, 3.102980554103851e-05, 3.17869707942009e-05, 3.254413604736328e-05]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 7.0, 18.0, 12.0, 16.0, 25.0, 34.0, 54.0, 75.0, 99.0, 148.0, 203.0, 232.0, 358.0, 494.0, 749.0, 999.0, 1409.0, 1968.0, 3116.0, 4264.0, 6376.0, 10089.0, 15037.0, 24528.0, 38798.0, 68187.0, 124260.0, 334529.0, 189785.0, 86537.0, 51010.0, 29433.0, 19044.0, 11668.0, 7994.0, 5214.0, 3553.0, 2491.0, 1643.0, 1212.0, 832.0, 595.0, 387.0, 304.0, 226.0, 155.0, 118.0, 76.0, 60.0, 47.0, 27.0, 23.0, 16.0, 14.0, 8.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-5.5670738220214844e-05, -5.391612648963928e-05, -5.216151475906372e-05, -5.040690302848816e-05, -4.86522912979126e-05, -4.6897679567337036e-05, -4.5143067836761475e-05, -4.338845610618591e-05, -4.163384437561035e-05, -3.987923264503479e-05, -3.812462091445923e-05, -3.637000918388367e-05, -3.4615397453308105e-05, -3.2860785722732544e-05, -3.110617399215698e-05, -2.935156226158142e-05, -2.759695053100586e-05, -2.5842338800430298e-05, -2.4087727069854736e-05, -2.2333115339279175e-05, -2.0578503608703613e-05, -1.8823891878128052e-05, -1.706928014755249e-05, -1.531466841697693e-05, -1.3560056686401367e-05, -1.1805444955825806e-05, -1.0050833225250244e-05, -8.296221494674683e-06, -6.541609764099121e-06, -4.7869980335235596e-06, -3.032386302947998e-06, -1.2777745723724365e-06, 4.76837158203125e-07, 2.2314488887786865e-06, 3.986060619354248e-06, 5.7406723499298096e-06, 7.495284080505371e-06, 9.249895811080933e-06, 1.1004507541656494e-05, 1.2759119272232056e-05, 1.4513731002807617e-05, 1.626834273338318e-05, 1.802295446395874e-05, 1.9777566194534302e-05, 2.1532177925109863e-05, 2.3286789655685425e-05, 2.5041401386260986e-05, 2.6796013116836548e-05, 2.855062484741211e-05, 3.030523657798767e-05, 3.205984830856323e-05, 3.3814460039138794e-05, 3.5569071769714355e-05, 3.732368350028992e-05, 3.907829523086548e-05, 4.083290696144104e-05, 4.25875186920166e-05, 4.434213042259216e-05, 4.6096742153167725e-05, 4.7851353883743286e-05, 4.960596561431885e-05, 5.136057734489441e-05, 5.311518907546997e-05, 5.486980080604553e-05, 5.6624412536621094e-05]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 7.0, 6.0, 3.0, 9.0, 10.0, 13.0, 13.0, 17.0, 16.0, 20.0, 23.0, 30.0, 28.0, 37.0, 32.0, 39.0, 37.0, 44.0, 47.0, 50.0, 42.0, 48.0, 36.0, 36.0, 36.0, 29.0, 38.0, 28.0, 39.0, 25.0, 20.0, 20.0, 18.0, 16.0, 16.0, 12.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.225969314575195e-05, -4.10228967666626e-05, -3.978610038757324e-05, -3.854930400848389e-05, -3.731250762939453e-05, -3.6075711250305176e-05, -3.483891487121582e-05, -3.3602118492126465e-05, -3.236532211303711e-05, -3.1128525733947754e-05, -2.98917293548584e-05, -2.8654932975769043e-05, -2.7418136596679688e-05, -2.6181340217590332e-05, -2.4944543838500977e-05, -2.370774745941162e-05, -2.2470951080322266e-05, -2.123415470123291e-05, -1.9997358322143555e-05, -1.87605619430542e-05, -1.7523765563964844e-05, -1.6286969184875488e-05, -1.5050172805786133e-05, -1.3813376426696777e-05, -1.2576580047607422e-05, -1.1339783668518066e-05, -1.0102987289428711e-05, -8.866190910339355e-06, -7.62939453125e-06, -6.3925981521606445e-06, -5.155801773071289e-06, -3.919005393981934e-06, -2.682209014892578e-06, -1.4454126358032227e-06, -2.086162567138672e-07, 1.0281801223754883e-06, 2.2649765014648438e-06, 3.5017728805541992e-06, 4.738569259643555e-06, 5.97536563873291e-06, 7.212162017822266e-06, 8.448958396911621e-06, 9.685754776000977e-06, 1.0922551155090332e-05, 1.2159347534179688e-05, 1.3396143913269043e-05, 1.4632940292358398e-05, 1.5869736671447754e-05, 1.710653305053711e-05, 1.8343329429626465e-05, 1.958012580871582e-05, 2.0816922187805176e-05, 2.205371856689453e-05, 2.3290514945983887e-05, 2.4527311325073242e-05, 2.5764107704162598e-05, 2.7000904083251953e-05, 2.823770046234131e-05, 2.9474496841430664e-05, 3.071129322052002e-05, 3.1948089599609375e-05, 3.318488597869873e-05, 3.4421682357788086e-05, 3.565847873687744e-05, 3.68952751159668e-05]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 14.0, 14.0, 17.0, 30.0, 32.0, 53.0, 98.0, 112.0, 152.0, 282.0, 388.0, 510.0, 1263.0, 1670.0, 2891.0, 8380.0, 14568.0, 35461.0, 196907.0, 523949.0, 172795.0, 58578.0, 14495.0, 6780.0, 4308.0, 1642.0, 1060.0, 821.0, 375.0, 268.0, 222.0, 112.0, 83.0, 77.0, 41.0, 26.0, 27.0, 6.0, 11.0, 9.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.854534149169922e-06, -6.656162440776825e-06, -6.457790732383728e-06, -6.259419023990631e-06, -6.061047315597534e-06, -5.862675607204437e-06, -5.66430389881134e-06, -5.465932190418243e-06, -5.2675604820251465e-06, -5.0691887736320496e-06, -4.870817065238953e-06, -4.672445356845856e-06, -4.474073648452759e-06, -4.275701940059662e-06, -4.077330231666565e-06, -3.878958523273468e-06, -3.680586814880371e-06, -3.482215106487274e-06, -3.2838433980941772e-06, -3.0854716897010803e-06, -2.8870999813079834e-06, -2.6887282729148865e-06, -2.4903565645217896e-06, -2.2919848561286926e-06, -2.0936131477355957e-06, -1.8952414393424988e-06, -1.6968697309494019e-06, -1.498498022556305e-06, -1.300126314163208e-06, -1.101754605770111e-06, -9.033828973770142e-07, -7.050111889839172e-07, -5.066394805908203e-07, -3.082677721977234e-07, -1.0989606380462646e-07, 8.847564458847046e-08, 2.868473529815674e-07, 4.852190613746643e-07, 6.835907697677612e-07, 8.819624781608582e-07, 1.080334186553955e-06, 1.278705894947052e-06, 1.477077603340149e-06, 1.6754493117332458e-06, 1.8738210201263428e-06, 2.0721927285194397e-06, 2.2705644369125366e-06, 2.4689361453056335e-06, 2.6673078536987305e-06, 2.8656795620918274e-06, 3.0640512704849243e-06, 3.2624229788780212e-06, 3.460794687271118e-06, 3.659166395664215e-06, 3.857538104057312e-06, 4.055909812450409e-06, 4.254281520843506e-06, 4.452653229236603e-06, 4.6510249376297e-06, 4.849396646022797e-06, 5.0477683544158936e-06, 5.2461400628089905e-06, 5.444511771202087e-06, 5.642883479595184e-06, 5.841255187988281e-06]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 0.0, 7.0, 0.0, 6.0, 0.0, 13.0, 0.0, 22.0, 0.0, 12.0, 18.0, 0.0, 41.0, 0.0, 32.0, 0.0, 42.0, 0.0, 54.0, 0.0, 62.0, 0.0, 74.0, 0.0, 81.0, 0.0, 70.0, 72.0, 0.0, 77.0, 0.0, 76.0, 0.0, 58.0, 0.0, 46.0, 0.0, 45.0, 0.0, 23.0, 0.0, 29.0, 14.0, 0.0, 10.0, 0.0, 13.0, 0.0, 2.0, 0.0, 5.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0132789611816406e-06, -9.816139936447144e-07, -9.499490261077881e-07, -9.182840585708618e-07, -8.866190910339355e-07, -8.549541234970093e-07, -8.23289155960083e-07, -7.916241884231567e-07, -7.599592208862305e-07, -7.282942533493042e-07, -6.966292858123779e-07, -6.649643182754517e-07, -6.332993507385254e-07, -6.016343832015991e-07, -5.699694156646729e-07, -5.383044481277466e-07, -5.066394805908203e-07, -4.7497451305389404e-07, -4.4330954551696777e-07, -4.116445779800415e-07, -3.7997961044311523e-07, -3.4831464290618896e-07, -3.166496753692627e-07, -2.849847078323364e-07, -2.5331974029541016e-07, -2.2165477275848389e-07, -1.8998980522155762e-07, -1.5832483768463135e-07, -1.2665987014770508e-07, -9.499490261077881e-08, -6.332993507385254e-08, -3.166496753692627e-08, 0.0, 3.166496753692627e-08, 6.332993507385254e-08, 9.499490261077881e-08, 1.2665987014770508e-07, 1.5832483768463135e-07, 1.8998980522155762e-07, 2.2165477275848389e-07, 2.5331974029541016e-07, 2.849847078323364e-07, 3.166496753692627e-07, 3.4831464290618896e-07, 3.7997961044311523e-07, 4.116445779800415e-07, 4.4330954551696777e-07, 4.7497451305389404e-07, 5.066394805908203e-07, 5.383044481277466e-07, 5.699694156646729e-07, 6.016343832015991e-07, 6.332993507385254e-07, 6.649643182754517e-07, 6.966292858123779e-07, 7.282942533493042e-07, 7.599592208862305e-07, 7.916241884231567e-07, 8.23289155960083e-07, 8.549541234970093e-07, 8.866190910339355e-07, 9.182840585708618e-07, 9.499490261077881e-07, 9.816139936447144e-07, 1.0132789611816406e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 10.0, 4.0, 16.0, 9.0, 20.0, 34.0, 42.0, 52.0, 43.0, 106.0, 157.0, 252.0, 317.0, 241.0, 611.0, 902.0, 1337.0, 2216.0, 1496.0, 4482.0, 7752.0, 14506.0, 29341.0, 26862.0, 120884.0, 464824.0, 237897.0, 70000.0, 17563.0, 20346.0, 10670.0, 5983.0, 3392.0, 1170.0, 1683.0, 1036.0, 705.0, 467.0, 186.0, 280.0, 195.0, 125.0, 101.0, 42.0, 47.0, 43.0, 28.0, 24.0, 10.0, 14.0, 9.0, 11.0, 5.0, 0.0, 4.0, 0.0, 4.0, 2.0], "bins": [-3.3974647521972656e-06, -3.2903626561164856e-06, -3.1832605600357056e-06, -3.0761584639549255e-06, -2.9690563678741455e-06, -2.8619542717933655e-06, -2.7548521757125854e-06, -2.6477500796318054e-06, -2.5406479835510254e-06, -2.4335458874702454e-06, -2.3264437913894653e-06, -2.2193416953086853e-06, -2.1122395992279053e-06, -2.0051375031471252e-06, -1.8980354070663452e-06, -1.7909333109855652e-06, -1.6838312149047852e-06, -1.5767291188240051e-06, -1.469627022743225e-06, -1.362524926662445e-06, -1.255422830581665e-06, -1.148320734500885e-06, -1.041218638420105e-06, -9.34116542339325e-07, -8.270144462585449e-07, -7.199123501777649e-07, -6.128102540969849e-07, -5.057081580162048e-07, -3.986060619354248e-07, -2.915039658546448e-07, -1.8440186977386475e-07, -7.729977369308472e-08, 2.9802322387695312e-08, 1.3690441846847534e-07, 2.4400651454925537e-07, 3.511086106300354e-07, 4.5821070671081543e-07, 5.653128027915955e-07, 6.724148988723755e-07, 7.795169949531555e-07, 8.866190910339355e-07, 9.937211871147156e-07, 1.1008232831954956e-06, 1.2079253792762756e-06, 1.3150274753570557e-06, 1.4221295714378357e-06, 1.5292316675186157e-06, 1.6363337635993958e-06, 1.7434358596801758e-06, 1.8505379557609558e-06, 1.957640051841736e-06, 2.064742147922516e-06, 2.171844244003296e-06, 2.278946340084076e-06, 2.386048436164856e-06, 2.493150532245636e-06, 2.600252628326416e-06, 2.707354724407196e-06, 2.814456820487976e-06, 2.921558916568756e-06, 3.028661012649536e-06, 3.135763108730316e-06, 3.242865204811096e-06, 3.3499673008918762e-06, 3.4570693969726562e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 2.0, 10.0, 7.0, 13.0, 30.0, 19.0, 20.0, 54.0, 30.0, 38.0, 107.0, 46.0, 71.0, 78.0, 125.0, 63.0, 53.0, 65.0, 23.0, 19.0, 40.0, 6.0, 17.0, 10.0, 6.0, 5.0, 6.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3655593395233154e-06, -2.2873282432556152e-06, -2.209097146987915e-06, -2.130866050720215e-06, -2.0526349544525146e-06, -1.9744038581848145e-06, -1.8961727619171143e-06, -1.817941665649414e-06, -1.7397105693817139e-06, -1.6614794731140137e-06, -1.5832483768463135e-06, -1.5050172805786133e-06, -1.426786184310913e-06, -1.3485550880432129e-06, -1.2703239917755127e-06, -1.1920928955078125e-06, -1.1138617992401123e-06, -1.0356307029724121e-06, -9.57399606704712e-07, -8.791685104370117e-07, -8.009374141693115e-07, -7.227063179016113e-07, -6.444752216339111e-07, -5.662441253662109e-07, -4.880130290985107e-07, -4.0978193283081055e-07, -3.3155083656311035e-07, -2.5331974029541016e-07, -1.7508864402770996e-07, -9.685754776000977e-08, -1.862645149230957e-08, 5.960464477539063e-08, 1.3783574104309082e-07, 2.1606683731079102e-07, 2.942979335784912e-07, 3.725290298461914e-07, 4.507601261138916e-07, 5.289912223815918e-07, 6.07222318649292e-07, 6.854534149169922e-07, 7.636845111846924e-07, 8.419156074523926e-07, 9.201467037200928e-07, 9.98377799987793e-07, 1.0766088962554932e-06, 1.1548399925231934e-06, 1.2330710887908936e-06, 1.3113021850585938e-06, 1.389533281326294e-06, 1.4677643775939941e-06, 1.5459954738616943e-06, 1.6242265701293945e-06, 1.7024576663970947e-06, 1.780688762664795e-06, 1.8589198589324951e-06, 1.9371509552001953e-06, 2.0153820514678955e-06, 2.0936131477355957e-06, 2.171844244003296e-06, 2.250075340270996e-06, 2.3283064365386963e-06, 2.4065375328063965e-06, 2.4847686290740967e-06, 2.562999725341797e-06]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 9.0, 7.0, 9.0, 17.0, 22.0, 46.0, 62.0, 105.0, 238.0, 200.0, 97.0, 76.0, 31.0, 24.0, 21.0, 11.0, 5.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0], "bins": [-0.0006909047369845212, -0.0006770605687052011, -0.0006632164004258811, -0.0006493722903542221, -0.0006355281220749021, -0.0006216839537955821, -0.0006078397855162621, -0.000593995675444603, -0.000580151507165283, -0.000566307338885963, -0.000552463170606643, -0.0005386190605349839, -0.0005247748922556639, -0.0005109307239763439, -0.0004970865556970239, -0.0004832424165215343, -0.0004693982773460448, -0.0004555541090667248, -0.00044170996989123523, -0.00042786580161191523, -0.0004140216624364257, -0.0004001774941571057, -0.00038633335498161614, -0.00037248918670229614, -0.00035864501842297614, -0.00034480085014365613, -0.0003309567109681666, -0.0003171125426888466, -0.00030326840351335704, -0.00028942423523403704, -0.0002755800960585475, -0.0002617359277792275, -0.00024789178860373795, -0.00023404763487633318, -0.0002202034811489284, -0.00020635932742152363, -0.00019251517369411886, -0.00017867100541479886, -0.0001648268662393093, -0.0001509826979599893, -0.00013713855878449976, -0.000123294405057095, -0.00010945025132969022, -9.560609760228544e-05, -8.176194387488067e-05, -6.791778287151828e-05, -5.407362914411351e-05, -4.022947541670874e-05, -2.638531441334635e-05, -1.2541159776446875e-05, 1.3029948604525998e-06, 1.5147150406846777e-05, 2.899130413425155e-05, 4.283546149963513e-05, 5.6679615227039903e-05, 7.052376895444468e-05, 8.436792268184945e-05, 9.821207640925422e-05, 0.000112056230136659, 0.00012590039114002138, 0.00013974454486742616, 0.00015358869859483093, 0.0001674328523222357, 0.00018127700604964048, 0.00019512115977704525]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 10.0, 7.0, 17.0, 15.0, 19.0, 26.0, 20.0, 25.0, 40.0, 32.0, 31.0, 37.0, 33.0, 40.0, 43.0, 56.0, 49.0, 42.0, 34.0, 45.0, 51.0, 38.0, 30.0, 33.0, 33.0, 31.0, 22.0, 21.0, 20.0, 15.0, 12.0, 10.0, 12.0, 12.0, 7.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001723170280456543, -0.00016692373901605606, -0.00016153044998645782, -0.0001561371609568596, -0.00015074387192726135, -0.00014535058289766312, -0.00013995729386806488, -0.00013456400483846664, -0.0001291707158088684, -0.00012377742677927017, -0.00011838413774967194, -0.0001129908487200737, -0.00010759755969047546, -0.00010220427066087723, -9.681098163127899e-05, -9.141769260168076e-05, -8.602440357208252e-05, -8.063111454248428e-05, -7.523782551288605e-05, -6.984453648328781e-05, -6.445124745368958e-05, -5.905795842409134e-05, -5.36646693944931e-05, -4.827138036489487e-05, -4.287809133529663e-05, -3.7484802305698395e-05, -3.209151327610016e-05, -2.6698224246501923e-05, -2.1304935216903687e-05, -1.591164618730545e-05, -1.0518357157707214e-05, -5.125068128108978e-06, 2.682209014892578e-07, 5.661509931087494e-06, 1.105479896068573e-05, 1.6448087990283966e-05, 2.1841377019882202e-05, 2.7234666049480438e-05, 3.2627955079078674e-05, 3.802124410867691e-05, 4.3414533138275146e-05, 4.880782216787338e-05, 5.420111119747162e-05, 5.9594400227069855e-05, 6.498768925666809e-05, 7.038097828626633e-05, 7.577426731586456e-05, 8.11675563454628e-05, 8.656084537506104e-05, 9.195413440465927e-05, 9.734742343425751e-05, 0.00010274071246385574, 0.00010813400149345398, 0.00011352729052305222, 0.00011892057955265045, 0.0001243138685822487, 0.00012970715761184692, 0.00013510044664144516, 0.0001404937356710434, 0.00014588702470064163, 0.00015128031373023987, 0.0001566736027598381, 0.00016206689178943634, 0.00016746018081903458, 0.0001728534698486328]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 10.0, 10.0, 19.0, 41.0, 64.0, 86.0, 127.0, 244.0, 364.0, 620.0, 1032.0, 1691.0, 2811.0, 5051.0, 9277.0, 18833.0, 45325.0, 159814.0, 3504397.0, 323779.0, 66485.0, 25835.0, 12079.0, 6324.0, 3633.0, 2164.0, 1318.0, 876.0, 608.0, 379.0, 253.0, 165.0, 116.0, 87.0, 61.0, 64.0, 44.0, 28.0, 32.0, 15.0, 21.0, 19.0, 15.0, 16.0, 12.0, 13.0, 6.0, 4.0, 6.0, 2.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.443262100219727e-05, -6.146077066659927e-05, -5.848892033100128e-05, -5.551706999540329e-05, -5.25452196598053e-05, -4.9573369324207306e-05, -4.6601518988609314e-05, -4.362966865301132e-05, -4.065781831741333e-05, -3.768596798181534e-05, -3.4714117646217346e-05, -3.1742267310619354e-05, -2.8770416975021362e-05, -2.579856663942337e-05, -2.282671630382538e-05, -1.9854865968227386e-05, -1.6883015632629395e-05, -1.3911165297031403e-05, -1.093931496143341e-05, -7.967464625835419e-06, -4.995614290237427e-06, -2.023763954639435e-06, 9.480863809585571e-07, 3.919936716556549e-06, 6.891787052154541e-06, 9.863637387752533e-06, 1.2835487723350525e-05, 1.5807338058948517e-05, 1.877918839454651e-05, 2.17510387301445e-05, 2.4722889065742493e-05, 2.7694739401340485e-05, 3.0666589736938477e-05, 3.363844007253647e-05, 3.661029040813446e-05, 3.958214074373245e-05, 4.2553991079330444e-05, 4.5525841414928436e-05, 4.849769175052643e-05, 5.146954208612442e-05, 5.444139242172241e-05, 5.7413242757320404e-05, 6.0385093092918396e-05, 6.335694342851639e-05, 6.632879376411438e-05, 6.930064409971237e-05, 7.227249443531036e-05, 7.524434477090836e-05, 7.821619510650635e-05, 8.118804544210434e-05, 8.415989577770233e-05, 8.713174611330032e-05, 9.010359644889832e-05, 9.307544678449631e-05, 9.60472971200943e-05, 9.901914745569229e-05, 0.00010199099779129028, 0.00010496284812688828, 0.00010793469846248627, 0.00011090654879808426, 0.00011387839913368225, 0.00011685024946928024, 0.00011982209980487823, 0.00012279395014047623, 0.00012576580047607422]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 10.0, 9.0, 24.0, 18.0, 35.0, 44.0, 73.0, 117.0, 124.0, 110.0, 97.0, 82.0, 71.0, 38.0, 36.0, 24.0, 19.0, 9.0, 5.0, 5.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33514404296875e-05, -1.2695789337158203e-05, -1.2040138244628906e-05, -1.138448715209961e-05, -1.0728836059570312e-05, -1.0073184967041016e-05, -9.417533874511719e-06, -8.761882781982422e-06, -8.106231689453125e-06, -7.450580596923828e-06, -6.794929504394531e-06, -6.139278411865234e-06, -5.4836273193359375e-06, -4.827976226806641e-06, -4.172325134277344e-06, -3.516674041748047e-06, -2.86102294921875e-06, -2.205371856689453e-06, -1.5497207641601562e-06, -8.940696716308594e-07, -2.384185791015625e-07, 4.172325134277344e-07, 1.0728836059570312e-06, 1.7285346984863281e-06, 2.384185791015625e-06, 3.039836883544922e-06, 3.6954879760742188e-06, 4.351139068603516e-06, 5.0067901611328125e-06, 5.662441253662109e-06, 6.318092346191406e-06, 6.973743438720703e-06, 7.62939453125e-06, 8.285045623779297e-06, 8.940696716308594e-06, 9.59634780883789e-06, 1.0251998901367188e-05, 1.0907649993896484e-05, 1.1563301086425781e-05, 1.2218952178955078e-05, 1.2874603271484375e-05, 1.3530254364013672e-05, 1.4185905456542969e-05, 1.4841556549072266e-05, 1.5497207641601562e-05, 1.615285873413086e-05, 1.6808509826660156e-05, 1.7464160919189453e-05, 1.811981201171875e-05, 1.8775463104248047e-05, 1.9431114196777344e-05, 2.008676528930664e-05, 2.0742416381835938e-05, 2.1398067474365234e-05, 2.205371856689453e-05, 2.2709369659423828e-05, 2.3365020751953125e-05, 2.4020671844482422e-05, 2.467632293701172e-05, 2.5331974029541016e-05, 2.5987625122070312e-05, 2.664327621459961e-05, 2.7298927307128906e-05, 2.7954578399658203e-05, 2.86102294921875e-05]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 10.0, 9.0, 21.0, 37.0, 41.0, 63.0, 84.0, 129.0, 184.0, 320.0, 458.0, 788.0, 1186.0, 1990.0, 3204.0, 5548.0, 9683.0, 17558.0, 34857.0, 68763.0, 171192.0, 939001.0, 2560463.0, 208381.0, 82300.0, 40746.0, 20155.0, 11414.0, 6148.0, 3594.0, 2222.0, 1273.0, 884.0, 521.0, 342.0, 221.0, 159.0, 99.0, 64.0, 46.0, 35.0, 33.0, 17.0, 10.0, 9.0, 2.0, 6.0, 5.0, 2.0, 3.0], "bins": [-6.54458999633789e-05, -6.363354623317719e-05, -6.182119250297546e-05, -6.000883877277374e-05, -5.819648504257202e-05, -5.63841313123703e-05, -5.457177758216858e-05, -5.275942385196686e-05, -5.094707012176514e-05, -4.9134716391563416e-05, -4.7322362661361694e-05, -4.551000893115997e-05, -4.369765520095825e-05, -4.188530147075653e-05, -4.007294774055481e-05, -3.826059401035309e-05, -3.644824028015137e-05, -3.4635886549949646e-05, -3.2823532819747925e-05, -3.1011179089546204e-05, -2.9198825359344482e-05, -2.738647162914276e-05, -2.557411789894104e-05, -2.376176416873932e-05, -2.1949410438537598e-05, -2.0137056708335876e-05, -1.8324702978134155e-05, -1.6512349247932434e-05, -1.4699995517730713e-05, -1.2887641787528992e-05, -1.107528805732727e-05, -9.26293432712555e-06, -7.450580596923828e-06, -5.638226866722107e-06, -3.825873136520386e-06, -2.0135194063186646e-06, -2.0116567611694336e-07, 1.6111880540847778e-06, 3.423541784286499e-06, 5.23589551448822e-06, 7.048249244689941e-06, 8.860602974891663e-06, 1.0672956705093384e-05, 1.2485310435295105e-05, 1.4297664165496826e-05, 1.6110017895698547e-05, 1.792237162590027e-05, 1.973472535610199e-05, 2.154707908630371e-05, 2.3359432816505432e-05, 2.5171786546707153e-05, 2.6984140276908875e-05, 2.8796494007110596e-05, 3.060884773731232e-05, 3.242120146751404e-05, 3.423355519771576e-05, 3.604590892791748e-05, 3.78582626581192e-05, 3.967061638832092e-05, 4.1482970118522644e-05, 4.3295323848724365e-05, 4.5107677578926086e-05, 4.692003130912781e-05, 4.873238503932953e-05, 5.054473876953125e-05]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 6.0, 7.0, 5.0, 10.0, 20.0, 13.0, 21.0, 27.0, 32.0, 44.0, 53.0, 59.0, 83.0, 105.0, 143.0, 277.0, 733.0, 1281.0, 426.0, 151.0, 112.0, 82.0, 82.0, 57.0, 50.0, 51.0, 34.0, 31.0, 16.0, 16.0, 11.0, 11.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.947185516357422e-05, -4.802923649549484e-05, -4.6586617827415466e-05, -4.514399915933609e-05, -4.3701380491256714e-05, -4.225876182317734e-05, -4.081614315509796e-05, -3.9373524487018585e-05, -3.793090581893921e-05, -3.648828715085983e-05, -3.5045668482780457e-05, -3.360304981470108e-05, -3.2160431146621704e-05, -3.071781247854233e-05, -2.927519381046295e-05, -2.7832575142383575e-05, -2.63899564743042e-05, -2.4947337806224823e-05, -2.3504719138145447e-05, -2.206210047006607e-05, -2.0619481801986694e-05, -1.9176863133907318e-05, -1.7734244465827942e-05, -1.6291625797748566e-05, -1.484900712966919e-05, -1.3406388461589813e-05, -1.1963769793510437e-05, -1.052115112543106e-05, -9.078532457351685e-06, -7.635913789272308e-06, -6.193295121192932e-06, -4.750676453113556e-06, -3.3080577850341797e-06, -1.8654391169548035e-06, -4.2282044887542725e-07, 1.019798219203949e-06, 2.462416887283325e-06, 3.905035555362701e-06, 5.347654223442078e-06, 6.790272891521454e-06, 8.23289155960083e-06, 9.675510227680206e-06, 1.1118128895759583e-05, 1.2560747563838959e-05, 1.4003366231918335e-05, 1.544598489999771e-05, 1.6888603568077087e-05, 1.8331222236156464e-05, 1.977384090423584e-05, 2.1216459572315216e-05, 2.2659078240394592e-05, 2.410169690847397e-05, 2.5544315576553345e-05, 2.698693424463272e-05, 2.8429552912712097e-05, 2.9872171580791473e-05, 3.131479024887085e-05, 3.2757408916950226e-05, 3.42000275850296e-05, 3.564264625310898e-05, 3.7085264921188354e-05, 3.852788358926773e-05, 3.997050225734711e-05, 4.141312092542648e-05, 4.285573959350586e-05]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 6.0, 9.0, 9.0, 22.0, 38.0, 52.0, 83.0, 140.0, 197.0, 141.0, 93.0, 56.0, 44.0, 27.0, 21.0, 27.0, 11.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002161163283744827, -0.0002035608922597021, -0.00019100545614492148, -0.00017845002003014088, -0.00016589458391536027, -0.00015333914780057967, -0.0001407837262377143, -0.00012822827557101846, -0.00011567284673219547, -0.00010311741061741486, -9.056197450263426e-05, -7.800654566381127e-05, -6.545110954903066e-05, -5.289567343425006e-05, -4.034023731946945e-05, -2.7784801204688847e-05, -1.5229365089908242e-05, -2.673929884622339e-06, 9.881505320663564e-06, 2.2436939616454765e-05, 3.499237573123537e-05, 4.754780820803717e-05, 6.010324432281777e-05, 7.265868043759838e-05, 8.521411655237898e-05, 9.776955266715959e-05, 0.00011032498878194019, 0.00012288041762076318, 0.0001354358537355438, 0.0001479912898503244, 0.000160546725965105, 0.0001731021620798856, 0.00018565761274658144, 0.00019821304886136204, 0.00021076848497614264, 0.00022332392109092325, 0.00023587935720570385, 0.00024843477876856923, 0.00026099022943526506, 0.00027354565099813044, 0.0002861011016648263, 0.00029865652322769165, 0.0003112119738943875, 0.00032376739545725286, 0.0003363228461239487, 0.00034887826768681407, 0.0003614337183535099, 0.0003739891399163753, 0.00038654456147924066, 0.00039909998304210603, 0.00041165543370880187, 0.00042421085527166724, 0.0004367663059383631, 0.00044932172750122845, 0.0004618771781679243, 0.00047443259973078966, 0.0004869880503974855, 0.0004995435010641813, 0.0005120988935232162, 0.0005246543441899121, 0.0005372097948566079, 0.0005497652455233037, 0.0005623206379823387, 0.0005748760886490345, 0.0005874315393157303]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 14.0, 3.0, 9.0, 8.0, 12.0, 12.0, 12.0, 13.0, 15.0, 25.0, 22.0, 31.0, 36.0, 26.0, 31.0, 31.0, 37.0, 23.0, 44.0, 39.0, 52.0, 38.0, 36.0, 51.0, 39.0, 43.0, 39.0, 27.0, 30.0, 23.0, 21.0, 17.0, 19.0, 13.0, 19.0, 12.0, 9.0, 15.0, 11.0, 7.0, 9.0, 5.0, 7.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00014591217041015625, -0.00014131423085927963, -0.00013671629130840302, -0.0001321183517575264, -0.00012752041220664978, -0.00012292247265577316, -0.00011832453310489655, -0.00011372659355401993, -0.00010912865400314331, -0.00010453071445226669, -9.993277490139008e-05, -9.533483535051346e-05, -9.073689579963684e-05, -8.613895624876022e-05, -8.15410166978836e-05, -7.694307714700699e-05, -7.234513759613037e-05, -6.774719804525375e-05, -6.314925849437714e-05, -5.855131894350052e-05, -5.39533793926239e-05, -4.9355439841747284e-05, -4.4757500290870667e-05, -4.015956073999405e-05, -3.556162118911743e-05, -3.0963681638240814e-05, -2.6365742087364197e-05, -2.176780253648758e-05, -1.7169862985610962e-05, -1.2571923434734344e-05, -7.973983883857727e-06, -3.3760443329811096e-06, 1.2218952178955078e-06, 5.819834768772125e-06, 1.0417774319648743e-05, 1.501571387052536e-05, 1.9613653421401978e-05, 2.4211592972278595e-05, 2.8809532523155212e-05, 3.340747207403183e-05, 3.800541162490845e-05, 4.2603351175785065e-05, 4.720129072666168e-05, 5.17992302775383e-05, 5.639716982841492e-05, 6.0995109379291534e-05, 6.559304893016815e-05, 7.019098848104477e-05, 7.478892803192139e-05, 7.9386867582798e-05, 8.398480713367462e-05, 8.858274668455124e-05, 9.318068623542786e-05, 9.777862578630447e-05, 0.00010237656533718109, 0.00010697450488805771, 0.00011157244443893433, 0.00011617038398981094, 0.00012076832354068756, 0.00012536626309156418, 0.0001299642026424408, 0.0001345621421933174, 0.00013916008174419403, 0.00014375802129507065, 0.00014835596084594727]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 4.0, 15.0, 12.0, 10.0, 16.0, 22.0, 27.0, 48.0, 90.0, 105.0, 228.0, 332.0, 659.0, 1612.0, 3462.0, 9636.0, 30361.0, 167328.0, 717866.0, 85421.0, 19484.0, 6805.0, 2508.0, 1215.0, 523.0, 272.0, 152.0, 92.0, 65.0, 39.0, 34.0, 30.0, 9.0, 10.0, 5.0, 8.0, 12.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.0001882314682006836, -0.00018258392810821533, -0.00017693638801574707, -0.0001712888479232788, -0.00016564130783081055, -0.00015999376773834229, -0.00015434622764587402, -0.00014869868755340576, -0.0001430511474609375, -0.00013740360736846924, -0.00013175606727600098, -0.00012610852718353271, -0.00012046098709106445, -0.00011481344699859619, -0.00010916590690612793, -0.00010351836681365967, -9.78708267211914e-05, -9.222328662872314e-05, -8.657574653625488e-05, -8.092820644378662e-05, -7.528066635131836e-05, -6.96331262588501e-05, -6.398558616638184e-05, -5.8338046073913574e-05, -5.269050598144531e-05, -4.704296588897705e-05, -4.139542579650879e-05, -3.574788570404053e-05, -3.0100345611572266e-05, -2.4452805519104004e-05, -1.8805265426635742e-05, -1.315772533416748e-05, -7.510185241699219e-06, -1.862645149230957e-06, 3.7848949432373047e-06, 9.432435035705566e-06, 1.5079975128173828e-05, 2.072751522064209e-05, 2.637505531311035e-05, 3.202259540557861e-05, 3.7670135498046875e-05, 4.331767559051514e-05, 4.89652156829834e-05, 5.461275577545166e-05, 6.026029586791992e-05, 6.590783596038818e-05, 7.155537605285645e-05, 7.720291614532471e-05, 8.285045623779297e-05, 8.849799633026123e-05, 9.414553642272949e-05, 9.979307651519775e-05, 0.00010544061660766602, 0.00011108815670013428, 0.00011673569679260254, 0.0001223832368850708, 0.00012803077697753906, 0.00013367831707000732, 0.00013932585716247559, 0.00014497339725494385, 0.0001506209373474121, 0.00015626847743988037, 0.00016191601753234863, 0.0001675635576248169, 0.00017321109771728516]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 5.0, 19.0, 18.0, 17.0, 32.0, 56.0, 76.0, 111.0, 137.0, 139.0, 110.0, 82.0, 63.0, 34.0, 22.0, 23.0, 15.0, 10.0, 9.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1072494089603424e-05, -1.0343268513679504e-05, -9.614042937755585e-06, -8.884817361831665e-06, -8.155591785907745e-06, -7.426366209983826e-06, -6.697140634059906e-06, -5.967915058135986e-06, -5.238689482212067e-06, -4.509463906288147e-06, -3.7802383303642273e-06, -3.0510127544403076e-06, -2.321787178516388e-06, -1.5925616025924683e-06, -8.633360266685486e-07, -1.341104507446289e-07, 5.951151251792908e-07, 1.3243407011032104e-06, 2.05356627702713e-06, 2.78279185295105e-06, 3.5120174288749695e-06, 4.241243004798889e-06, 4.970468580722809e-06, 5.6996941566467285e-06, 6.428919732570648e-06, 7.158145308494568e-06, 7.887370884418488e-06, 8.616596460342407e-06, 9.345822036266327e-06, 1.0075047612190247e-05, 1.0804273188114166e-05, 1.1533498764038086e-05, 1.2262724339962006e-05, 1.2991949915885925e-05, 1.3721175491809845e-05, 1.4450401067733765e-05, 1.5179626643657684e-05, 1.5908852219581604e-05, 1.6638077795505524e-05, 1.7367303371429443e-05, 1.8096528947353363e-05, 1.8825754523277283e-05, 1.9554980099201202e-05, 2.0284205675125122e-05, 2.1013431251049042e-05, 2.174265682697296e-05, 2.247188240289688e-05, 2.32011079788208e-05, 2.393033355474472e-05, 2.465955913066864e-05, 2.538878470659256e-05, 2.611801028251648e-05, 2.68472358584404e-05, 2.757646143436432e-05, 2.830568701028824e-05, 2.9034912586212158e-05, 2.9764138162136078e-05, 3.0493363738059998e-05, 3.122258931398392e-05, 3.195181488990784e-05, 3.2681040465831757e-05, 3.3410266041755676e-05, 3.4139491617679596e-05, 3.4868717193603516e-05]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 1.0, 10.0, 7.0, 13.0, 14.0, 25.0, 42.0, 61.0, 77.0, 116.0, 150.0, 211.0, 306.0, 409.0, 641.0, 915.0, 1294.0, 2017.0, 2872.0, 4316.0, 6412.0, 9803.0, 15254.0, 24313.0, 42160.0, 69959.0, 134985.0, 342297.0, 175221.0, 85179.0, 48096.0, 29840.0, 17636.0, 11280.0, 7437.0, 4776.0, 3251.0, 2166.0, 1573.0, 1062.0, 698.0, 485.0, 363.0, 250.0, 157.0, 126.0, 91.0, 58.0, 56.0, 19.0, 21.0, 15.0, 8.0, 8.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-4.744529724121094e-05, -4.594679921865463e-05, -4.444830119609833e-05, -4.294980317354202e-05, -4.145130515098572e-05, -3.995280712842941e-05, -3.845430910587311e-05, -3.69558110833168e-05, -3.54573130607605e-05, -3.395881503820419e-05, -3.246031701564789e-05, -3.096181899309158e-05, -2.946332097053528e-05, -2.7964822947978973e-05, -2.646632492542267e-05, -2.4967826902866364e-05, -2.346932888031006e-05, -2.1970830857753754e-05, -2.047233283519745e-05, -1.8973834812641144e-05, -1.747533679008484e-05, -1.5976838767528534e-05, -1.4478340744972229e-05, -1.2979842722415924e-05, -1.1481344699859619e-05, -9.982846677303314e-06, -8.48434865474701e-06, -6.985850632190704e-06, -5.487352609634399e-06, -3.9888545870780945e-06, -2.4903565645217896e-06, -9.918585419654846e-07, 5.066394805908203e-07, 2.0051375031471252e-06, 3.50363552570343e-06, 5.002133548259735e-06, 6.50063157081604e-06, 7.999129593372345e-06, 9.49762761592865e-06, 1.0996125638484955e-05, 1.249462366104126e-05, 1.3993121683597565e-05, 1.549161970615387e-05, 1.6990117728710175e-05, 1.848861575126648e-05, 1.9987113773822784e-05, 2.148561179637909e-05, 2.2984109818935394e-05, 2.44826078414917e-05, 2.5981105864048004e-05, 2.747960388660431e-05, 2.8978101909160614e-05, 3.047659993171692e-05, 3.1975097954273224e-05, 3.347359597682953e-05, 3.4972093999385834e-05, 3.647059202194214e-05, 3.7969090044498444e-05, 3.946758806705475e-05, 4.0966086089611053e-05, 4.246458411216736e-05, 4.396308213472366e-05, 4.546158015727997e-05, 4.696007817983627e-05, 4.845857620239258e-05]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 6.0, 5.0, 10.0, 8.0, 13.0, 13.0, 17.0, 21.0, 25.0, 23.0, 28.0, 31.0, 41.0, 42.0, 44.0, 30.0, 43.0, 50.0, 47.0, 52.0, 42.0, 52.0, 42.0, 39.0, 31.0, 41.0, 28.0, 23.0, 31.0, 19.0, 17.0, 18.0, 11.0, 6.0, 9.0, 6.0, 5.0, 5.0, 8.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7789344787597656e-05, -3.6627985537052155e-05, -3.546662628650665e-05, -3.430526703596115e-05, -3.314390778541565e-05, -3.198254853487015e-05, -3.0821189284324646e-05, -2.9659830033779144e-05, -2.8498470783233643e-05, -2.733711153268814e-05, -2.617575228214264e-05, -2.5014393031597137e-05, -2.3853033781051636e-05, -2.2691674530506134e-05, -2.1530315279960632e-05, -2.036895602941513e-05, -1.920759677886963e-05, -1.8046237528324127e-05, -1.6884878277778625e-05, -1.5723519027233124e-05, -1.4562159776687622e-05, -1.340080052614212e-05, -1.2239441275596619e-05, -1.1078082025051117e-05, -9.916722774505615e-06, -8.755363523960114e-06, -7.594004273414612e-06, -6.43264502286911e-06, -5.271285772323608e-06, -4.109926521778107e-06, -2.948567271232605e-06, -1.7872080206871033e-06, -6.258487701416016e-07, 5.355104804039001e-07, 1.6968697309494019e-06, 2.8582289814949036e-06, 4.019588232040405e-06, 5.180947482585907e-06, 6.342306733131409e-06, 7.50366598367691e-06, 8.665025234222412e-06, 9.826384484767914e-06, 1.0987743735313416e-05, 1.2149102985858917e-05, 1.3310462236404419e-05, 1.447182148694992e-05, 1.5633180737495422e-05, 1.6794539988040924e-05, 1.7955899238586426e-05, 1.9117258489131927e-05, 2.027861773967743e-05, 2.143997699022293e-05, 2.2601336240768433e-05, 2.3762695491313934e-05, 2.4924054741859436e-05, 2.6085413992404938e-05, 2.724677324295044e-05, 2.840813249349594e-05, 2.9569491744041443e-05, 3.0730850994586945e-05, 3.1892210245132446e-05, 3.305356949567795e-05, 3.421492874622345e-05, 3.537628799676895e-05, 3.653764724731445e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 9.0, 4.0, 4.0, 16.0, 14.0, 19.0, 28.0, 22.0, 44.0, 71.0, 107.0, 238.0, 256.0, 403.0, 598.0, 920.0, 1485.0, 2342.0, 3845.0, 6633.0, 12591.0, 24525.0, 105974.0, 243963.0, 397206.0, 139357.0, 53770.0, 24410.0, 12504.0, 6728.0, 3858.0, 2328.0, 1997.0, 743.0, 516.0, 317.0, 219.0, 149.0, 99.0, 67.0, 52.0, 29.0, 24.0, 32.0, 16.0, 7.0, 11.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-4.291534423828125e-06, -4.166737198829651e-06, -4.041939973831177e-06, -3.917142748832703e-06, -3.7923455238342285e-06, -3.6675482988357544e-06, -3.5427510738372803e-06, -3.417953848838806e-06, -3.293156623840332e-06, -3.168359398841858e-06, -3.043562173843384e-06, -2.9187649488449097e-06, -2.7939677238464355e-06, -2.6691704988479614e-06, -2.5443732738494873e-06, -2.419576048851013e-06, -2.294778823852539e-06, -2.169981598854065e-06, -2.045184373855591e-06, -1.9203871488571167e-06, -1.7955899238586426e-06, -1.6707926988601685e-06, -1.5459954738616943e-06, -1.4211982488632202e-06, -1.296401023864746e-06, -1.171603798866272e-06, -1.0468065738677979e-06, -9.220093488693237e-07, -7.972121238708496e-07, -6.724148988723755e-07, -5.476176738739014e-07, -4.2282044887542725e-07, -2.980232238769531e-07, -1.73225998878479e-07, -4.842877388000488e-08, 7.636845111846924e-08, 2.0116567611694336e-07, 3.259629011154175e-07, 4.507601261138916e-07, 5.755573511123657e-07, 7.003545761108398e-07, 8.25151801109314e-07, 9.499490261077881e-07, 1.0747462511062622e-06, 1.1995434761047363e-06, 1.3243407011032104e-06, 1.4491379261016846e-06, 1.5739351511001587e-06, 1.6987323760986328e-06, 1.823529601097107e-06, 1.948326826095581e-06, 2.073124051094055e-06, 2.1979212760925293e-06, 2.3227185010910034e-06, 2.4475157260894775e-06, 2.5723129510879517e-06, 2.6971101760864258e-06, 2.8219074010849e-06, 2.946704626083374e-06, 3.071501851081848e-06, 3.1962990760803223e-06, 3.3210963010787964e-06, 3.4458935260772705e-06, 3.5706907510757446e-06, 3.6954879760742188e-06]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 8.0, 0.0, 19.0, 17.0, 0.0, 28.0, 23.0, 0.0, 43.0, 50.0, 0.0, 51.0, 95.0, 0.0, 71.0, 0.0, 74.0, 94.0, 0.0, 87.0, 81.0, 0.0, 66.0, 55.0, 0.0, 41.0, 21.0, 0.0, 19.0, 16.0, 0.0, 10.0, 14.0, 0.0, 10.0, 9.0, 0.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3113021850585938e-06, -1.2721866369247437e-06, -1.2330710887908936e-06, -1.1939555406570435e-06, -1.1548399925231934e-06, -1.1157244443893433e-06, -1.0766088962554932e-06, -1.037493348121643e-06, -9.98377799987793e-07, -9.592622518539429e-07, -9.201467037200928e-07, -8.810311555862427e-07, -8.419156074523926e-07, -8.028000593185425e-07, -7.636845111846924e-07, -7.245689630508423e-07, -6.854534149169922e-07, -6.463378667831421e-07, -6.07222318649292e-07, -5.681067705154419e-07, -5.289912223815918e-07, -4.898756742477417e-07, -4.507601261138916e-07, -4.116445779800415e-07, -3.725290298461914e-07, -3.334134817123413e-07, -2.942979335784912e-07, -2.551823854446411e-07, -2.1606683731079102e-07, -1.7695128917694092e-07, -1.3783574104309082e-07, -9.872019290924072e-08, -5.960464477539063e-08, -2.0489096641540527e-08, 1.862645149230957e-08, 5.774199962615967e-08, 9.685754776000977e-08, 1.3597309589385986e-07, 1.7508864402770996e-07, 2.1420419216156006e-07, 2.5331974029541016e-07, 2.9243528842926025e-07, 3.3155083656311035e-07, 3.7066638469696045e-07, 4.0978193283081055e-07, 4.4889748096466064e-07, 4.880130290985107e-07, 5.271285772323608e-07, 5.662441253662109e-07, 6.05359673500061e-07, 6.444752216339111e-07, 6.835907697677612e-07, 7.227063179016113e-07, 7.618218660354614e-07, 8.009374141693115e-07, 8.400529623031616e-07, 8.791685104370117e-07, 9.182840585708618e-07, 9.57399606704712e-07, 9.96515154838562e-07, 1.0356307029724121e-06, 1.0747462511062622e-06, 1.1138617992401123e-06, 1.1529773473739624e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 10.0, 4.0, 21.0, 31.0, 21.0, 71.0, 54.0, 127.0, 228.0, 144.0, 459.0, 324.0, 987.0, 1648.0, 1274.0, 3881.0, 3004.0, 9444.0, 19274.0, 17027.0, 69032.0, 77830.0, 475106.0, 163792.0, 120572.0, 43127.0, 11362.0, 13398.0, 4059.0, 5171.0, 2862.0, 973.0, 1295.0, 412.0, 603.0, 365.0, 130.0, 163.0, 66.0, 83.0, 39.0, 18.0, 30.0, 7.0, 13.0, 8.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.825632691383362e-06, -2.730637788772583e-06, -2.635642886161804e-06, -2.5406479835510254e-06, -2.4456530809402466e-06, -2.3506581783294678e-06, -2.255663275718689e-06, -2.16066837310791e-06, -2.0656734704971313e-06, -1.9706785678863525e-06, -1.8756836652755737e-06, -1.780688762664795e-06, -1.6856938600540161e-06, -1.5906989574432373e-06, -1.4957040548324585e-06, -1.4007091522216797e-06, -1.3057142496109009e-06, -1.210719347000122e-06, -1.1157244443893433e-06, -1.0207295417785645e-06, -9.257346391677856e-07, -8.307397365570068e-07, -7.35744833946228e-07, -6.407499313354492e-07, -5.457550287246704e-07, -4.507601261138916e-07, -3.557652235031128e-07, -2.60770320892334e-07, -1.6577541828155518e-07, -7.078051567077637e-08, 2.421438694000244e-08, 1.1920928955078125e-07, 2.1420419216156006e-07, 3.0919909477233887e-07, 4.041939973831177e-07, 4.991888999938965e-07, 5.941838026046753e-07, 6.891787052154541e-07, 7.841736078262329e-07, 8.791685104370117e-07, 9.741634130477905e-07, 1.0691583156585693e-06, 1.1641532182693481e-06, 1.259148120880127e-06, 1.3541430234909058e-06, 1.4491379261016846e-06, 1.5441328287124634e-06, 1.6391277313232422e-06, 1.734122633934021e-06, 1.8291175365447998e-06, 1.9241124391555786e-06, 2.0191073417663574e-06, 2.1141022443771362e-06, 2.209097146987915e-06, 2.304092049598694e-06, 2.3990869522094727e-06, 2.4940818548202515e-06, 2.5890767574310303e-06, 2.684071660041809e-06, 2.779066562652588e-06, 2.8740614652633667e-06, 2.9690563678741455e-06, 3.0640512704849243e-06, 3.159046173095703e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 11.0, 21.0, 17.0, 22.0, 22.0, 35.0, 46.0, 59.0, 47.0, 60.0, 67.0, 74.0, 60.0, 67.0, 52.0, 54.0, 40.0, 40.0, 24.0, 15.0, 19.0, 14.0, 16.0, 14.0, 8.0, 12.0, 6.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.1457672119140625e-06, -2.086162567138672e-06, -2.0265579223632812e-06, -1.9669532775878906e-06, -1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 15.0, 33.0, 60.0, 155.0, 359.0, 188.0, 82.0, 38.0, 36.0, 18.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008392405579797924, -0.0008219002047553658, -0.0008045599097386003, -0.0007872195565141737, -0.0007698792032897472, -0.0007525389082729816, -0.0007351985550485551, -0.0007178582018241286, -0.000700517906807363, -0.0006831775535829365, -0.0006658372585661709, -0.0006484969053417444, -0.0006311565521173179, -0.0006138161988928914, -0.0005964759038761258, -0.0005791355506516993, -0.0005617951974272728, -0.0005444548442028463, -0.0005271145491860807, -0.0005097741959616542, -0.0004924338427372277, -0.0004750935186166316, -0.0004577531944960356, -0.00044041284127160907, -0.000423072517151013, -0.00040573219303041697, -0.00038839183980599046, -0.0003710515156853944, -0.00035371119156479836, -0.00033637083834037185, -0.0003190305142197758, -0.00030169019009917974, -0.0002843498077709228, -0.00026700948365032673, -0.0002496691304259002, -0.00023232880630530417, -0.0002149884676327929, -0.0001976481289602816, -0.00018030780483968556, -0.00016296746616717428, -0.000145627127494663, -0.00012828678882215172, -0.00011094645742559806, -9.360612602904439e-05, -7.626578735653311e-05, -5.892544868402183e-05, -4.1585117287468165e-05, -2.42447858909145e-05, -6.90444721840322e-06, 1.0435887816129252e-05, 2.7776222850661725e-05, 4.51165578851942e-05, 6.245689291972667e-05, 7.979723159223795e-05, 9.713756298879161e-05, 0.00011447789438534528, 0.00013181823305785656, 0.00014915857173036784, 0.00016649891040287912, 0.00018383923452347517, 0.00020117957319598645, 0.00021851991186849773, 0.00023586023598909378, 0.0002532005892135203, 0.00027054091333411634]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 3.0, 7.0, 4.0, 6.0, 8.0, 12.0, 15.0, 17.0, 18.0, 19.0, 19.0, 33.0, 33.0, 35.0, 45.0, 39.0, 45.0, 41.0, 48.0, 46.0, 46.0, 39.0, 45.0, 38.0, 40.0, 48.0, 45.0, 29.0, 30.0, 17.0, 21.0, 30.0, 11.0, 18.0, 12.0, 10.0, 6.0, 4.0, 8.0, 3.0, 5.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001074671745300293, -0.00010298844426870346, -9.850971400737762e-05, -9.403098374605179e-05, -8.955225348472595e-05, -8.507352322340012e-05, -8.059479296207428e-05, -7.611606270074844e-05, -7.163733243942261e-05, -6.715860217809677e-05, -6.267987191677094e-05, -5.82011416554451e-05, -5.372241139411926e-05, -4.9243681132793427e-05, -4.476495087146759e-05, -4.0286220610141754e-05, -3.580749034881592e-05, -3.132876008749008e-05, -2.6850029826164246e-05, -2.237129956483841e-05, -1.7892569303512573e-05, -1.3413839042186737e-05, -8.935108780860901e-06, -4.456378519535065e-06, 2.2351741790771484e-08, 4.501082003116608e-06, 8.979812264442444e-06, 1.345854252576828e-05, 1.7937272787094116e-05, 2.2416003048419952e-05, 2.689473330974579e-05, 3.1373463571071625e-05, 3.585219383239746e-05, 4.03309240937233e-05, 4.480965435504913e-05, 4.928838461637497e-05, 5.3767114877700806e-05, 5.824584513902664e-05, 6.272457540035248e-05, 6.720330566167831e-05, 7.168203592300415e-05, 7.616076618432999e-05, 8.063949644565582e-05, 8.511822670698166e-05, 8.95969569683075e-05, 9.407568722963333e-05, 9.855441749095917e-05, 0.000103033147752285, 0.00010751187801361084, 0.00011199060827493668, 0.00011646933853626251, 0.00012094806879758835, 0.00012542679905891418, 0.00012990552932024002, 0.00013438425958156586, 0.0001388629898428917, 0.00014334172010421753, 0.00014782045036554337, 0.0001522991806268692, 0.00015677791088819504, 0.00016125664114952087, 0.0001657353714108467, 0.00017021410167217255, 0.00017469283193349838, 0.00017917156219482422]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 9.0, 20.0, 34.0, 44.0, 65.0, 93.0, 157.0, 283.0, 453.0, 716.0, 1339.0, 2197.0, 4080.0, 7792.0, 16147.0, 36405.0, 106914.0, 2131257.0, 1716641.0, 94247.0, 36333.0, 17270.0, 8693.0, 5109.0, 2982.0, 1702.0, 1079.0, 672.0, 410.0, 308.0, 214.0, 125.0, 72.0, 73.0, 53.0, 45.0, 38.0, 32.0, 35.0, 27.0, 17.0, 14.0, 17.0, 9.0, 12.0, 11.0, 6.0, 6.0, 5.0, 6.0, 3.0, 8.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.692243576049805e-05, -5.4333359003067017e-05, -5.1744282245635986e-05, -4.9155205488204956e-05, -4.6566128730773926e-05, -4.3977051973342896e-05, -4.1387975215911865e-05, -3.8798898458480835e-05, -3.6209821701049805e-05, -3.3620744943618774e-05, -3.1031668186187744e-05, -2.8442591428756714e-05, -2.5853514671325684e-05, -2.3264437913894653e-05, -2.0675361156463623e-05, -1.8086284399032593e-05, -1.5497207641601562e-05, -1.2908130884170532e-05, -1.0319054126739502e-05, -7.729977369308472e-06, -5.140900611877441e-06, -2.551823854446411e-06, 3.725290298461914e-08, 2.6263296604156494e-06, 5.21540641784668e-06, 7.80448317527771e-06, 1.039355993270874e-05, 1.298263669013977e-05, 1.55717134475708e-05, 1.816079020500183e-05, 2.074986696243286e-05, 2.333894371986389e-05, 2.5928020477294922e-05, 2.8517097234725952e-05, 3.110617399215698e-05, 3.369525074958801e-05, 3.628432750701904e-05, 3.887340426445007e-05, 4.1462481021881104e-05, 4.4051557779312134e-05, 4.6640634536743164e-05, 4.9229711294174194e-05, 5.1818788051605225e-05, 5.4407864809036255e-05, 5.6996941566467285e-05, 5.9586018323898315e-05, 6.217509508132935e-05, 6.476417183876038e-05, 6.73532485961914e-05, 6.994232535362244e-05, 7.253140211105347e-05, 7.51204788684845e-05, 7.770955562591553e-05, 8.029863238334656e-05, 8.288770914077759e-05, 8.547678589820862e-05, 8.806586265563965e-05, 9.065493941307068e-05, 9.324401617050171e-05, 9.583309292793274e-05, 9.842216968536377e-05, 0.0001010112464427948, 0.00010360032320022583, 0.00010618939995765686, 0.00010877847671508789]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 13.0, 17.0, 26.0, 36.0, 44.0, 66.0, 103.0, 97.0, 108.0, 116.0, 79.0, 56.0, 67.0, 42.0, 26.0, 19.0, 21.0, 15.0, 5.0, 9.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2874603271484375e-05, -1.2256205081939697e-05, -1.163780689239502e-05, -1.1019408702850342e-05, -1.0401010513305664e-05, -9.782612323760986e-06, -9.164214134216309e-06, -8.545815944671631e-06, -7.927417755126953e-06, -7.309019565582275e-06, -6.690621376037598e-06, -6.07222318649292e-06, -5.453824996948242e-06, -4.8354268074035645e-06, -4.217028617858887e-06, -3.598630428314209e-06, -2.9802322387695312e-06, -2.3618340492248535e-06, -1.7434358596801758e-06, -1.125037670135498e-06, -5.066394805908203e-07, 1.1175870895385742e-07, 7.301568984985352e-07, 1.3485550880432129e-06, 1.9669532775878906e-06, 2.5853514671325684e-06, 3.203749656677246e-06, 3.822147846221924e-06, 4.4405460357666016e-06, 5.058944225311279e-06, 5.677342414855957e-06, 6.295740604400635e-06, 6.9141387939453125e-06, 7.53253698348999e-06, 8.150935173034668e-06, 8.769333362579346e-06, 9.387731552124023e-06, 1.0006129741668701e-05, 1.0624527931213379e-05, 1.1242926120758057e-05, 1.1861324310302734e-05, 1.2479722499847412e-05, 1.309812068939209e-05, 1.3716518878936768e-05, 1.4334917068481445e-05, 1.4953315258026123e-05, 1.55717134475708e-05, 1.619011163711548e-05, 1.6808509826660156e-05, 1.7426908016204834e-05, 1.8045306205749512e-05, 1.866370439529419e-05, 1.9282102584838867e-05, 1.9900500774383545e-05, 2.0518898963928223e-05, 2.11372971534729e-05, 2.1755695343017578e-05, 2.2374093532562256e-05, 2.2992491722106934e-05, 2.361088991165161e-05, 2.422928810119629e-05, 2.4847686290740967e-05, 2.5466084480285645e-05, 2.6084482669830322e-05, 2.6702880859375e-05]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 8.0, 9.0, 14.0, 26.0, 33.0, 49.0, 82.0, 127.0, 151.0, 238.0, 370.0, 584.0, 797.0, 1309.0, 1817.0, 3112.0, 4846.0, 7457.0, 12720.0, 21896.0, 37170.0, 75822.0, 173187.0, 842449.0, 2545382.0, 253280.0, 98144.0, 46734.0, 26717.0, 15244.0, 9177.0, 5339.0, 3521.0, 2216.0, 1400.0, 977.0, 611.0, 403.0, 274.0, 196.0, 142.0, 79.0, 57.0, 38.0, 28.0, 19.0, 10.0, 6.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082918167114258e-05, -3.947596997022629e-05, -3.812275826931e-05, -3.676954656839371e-05, -3.541633486747742e-05, -3.406312316656113e-05, -3.2709911465644836e-05, -3.1356699764728546e-05, -3.0003488063812256e-05, -2.8650276362895966e-05, -2.7297064661979675e-05, -2.5943852961063385e-05, -2.4590641260147095e-05, -2.3237429559230804e-05, -2.1884217858314514e-05, -2.0531006157398224e-05, -1.9177794456481934e-05, -1.7824582755565643e-05, -1.6471371054649353e-05, -1.5118159353733063e-05, -1.3764947652816772e-05, -1.2411735951900482e-05, -1.1058524250984192e-05, -9.705312550067902e-06, -8.352100849151611e-06, -6.998889148235321e-06, -5.645677447319031e-06, -4.2924657464027405e-06, -2.93925404548645e-06, -1.58604234457016e-06, -2.3283064365386963e-07, 1.1203810572624207e-06, 2.473592758178711e-06, 3.826804459095001e-06, 5.1800161600112915e-06, 6.533227860927582e-06, 7.886439561843872e-06, 9.239651262760162e-06, 1.0592862963676453e-05, 1.1946074664592743e-05, 1.3299286365509033e-05, 1.4652498066425323e-05, 1.6005709767341614e-05, 1.7358921468257904e-05, 1.8712133169174194e-05, 2.0065344870090485e-05, 2.1418556571006775e-05, 2.2771768271923065e-05, 2.4124979972839355e-05, 2.5478191673755646e-05, 2.6831403374671936e-05, 2.8184615075588226e-05, 2.9537826776504517e-05, 3.089103847742081e-05, 3.22442501783371e-05, 3.359746187925339e-05, 3.495067358016968e-05, 3.630388528108597e-05, 3.765709698200226e-05, 3.901030868291855e-05, 4.036352038383484e-05, 4.171673208475113e-05, 4.306994378566742e-05, 4.442315548658371e-05, 4.57763671875e-05]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 13.0, 15.0, 12.0, 13.0, 25.0, 19.0, 25.0, 48.0, 48.0, 74.0, 57.0, 87.0, 100.0, 139.0, 259.0, 561.0, 1243.0, 479.0, 200.0, 121.0, 75.0, 90.0, 56.0, 49.0, 48.0, 32.0, 27.0, 23.0, 20.0, 17.0, 18.0, 13.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.600120544433594e-05, -3.489293158054352e-05, -3.37846577167511e-05, -3.267638385295868e-05, -3.156810998916626e-05, -3.045983612537384e-05, -2.935156226158142e-05, -2.8243288397789e-05, -2.7135014533996582e-05, -2.6026740670204163e-05, -2.4918466806411743e-05, -2.3810192942619324e-05, -2.2701919078826904e-05, -2.1593645215034485e-05, -2.0485371351242065e-05, -1.9377097487449646e-05, -1.8268823623657227e-05, -1.7160549759864807e-05, -1.6052275896072388e-05, -1.4944002032279968e-05, -1.3835728168487549e-05, -1.272745430469513e-05, -1.161918044090271e-05, -1.051090657711029e-05, -9.402632713317871e-06, -8.294358849525452e-06, -7.186084985733032e-06, -6.077811121940613e-06, -4.969537258148193e-06, -3.861263394355774e-06, -2.7529895305633545e-06, -1.644715666770935e-06, -5.364418029785156e-07, 5.718320608139038e-07, 1.6801059246063232e-06, 2.7883797883987427e-06, 3.896653652191162e-06, 5.0049275159835815e-06, 6.113201379776001e-06, 7.22147524356842e-06, 8.32974910736084e-06, 9.43802297115326e-06, 1.0546296834945679e-05, 1.1654570698738098e-05, 1.2762844562530518e-05, 1.3871118426322937e-05, 1.4979392290115356e-05, 1.6087666153907776e-05, 1.7195940017700195e-05, 1.8304213881492615e-05, 1.9412487745285034e-05, 2.0520761609077454e-05, 2.1629035472869873e-05, 2.2737309336662292e-05, 2.3845583200454712e-05, 2.495385706424713e-05, 2.606213092803955e-05, 2.717040479183197e-05, 2.827867865562439e-05, 2.938695251941681e-05, 3.049522638320923e-05, 3.160350024700165e-05, 3.271177411079407e-05, 3.382004797458649e-05, 3.4928321838378906e-05]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 4.0, 3.0, 9.0, 13.0, 12.0, 21.0, 11.0, 22.0, 40.0, 54.0, 70.0, 81.0, 121.0, 119.0, 97.0, 68.0, 57.0, 33.0, 35.0, 17.0, 25.0, 17.0, 17.0, 9.0, 9.0, 6.0, 3.0, 6.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020833007874898612, -0.0002008856099564582, -0.0001934411411639303, -0.00018599667237140238, -0.00017855218902695924, -0.00017110772023443133, -0.0001636632514419034, -0.0001562187826493755, -0.00014877429930493236, -0.00014132983051240444, -0.00013388536171987653, -0.00012644089292734861, -0.00011899640958290547, -0.00011155194079037756, -0.00010410747199784964, -9.666300320532173e-05, -8.921853441279382e-05, -8.17740656202659e-05, -7.432958955178037e-05, -6.688512075925246e-05, -5.944064832874574e-05, -5.1996175898239017e-05, -4.45517071057111e-05, -3.710723467520438e-05, -2.966276224469766e-05, -2.221828981419094e-05, -1.4773819202673621e-05, -7.329348591156304e-06, 1.1512383935041726e-07, 7.559596269857138e-06, 1.5004065062385052e-05, 2.2448537492891774e-05, 2.9893009923398495e-05, 3.7337482353905216e-05, 4.478195478441194e-05, 5.222642357693985e-05, 5.967089600744657e-05, 6.71153684379533e-05, 7.455983723048121e-05, 8.200430602300912e-05, 8.944878209149465e-05, 9.689325088402256e-05, 0.00010433772695250809, 0.000111782195745036, 0.00011922666453756392, 0.00012667113333009183, 0.00013411560212261975, 0.0001415600854670629, 0.0001490045542595908, 0.00015644902305211872, 0.00016389349184464663, 0.00017133797518908978, 0.0001787824439816177, 0.0001862269127741456, 0.00019367138156667352, 0.00020111585035920143, 0.00020856031915172935, 0.00021600478794425726, 0.00022344925673678517, 0.0002308937255293131, 0.00023833820887375623, 0.0002457826631143689, 0.00025322713190689683, 0.0002606716298032552, 0.0002681160985957831]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 9.0, 9.0, 10.0, 17.0, 15.0, 17.0, 15.0, 19.0, 23.0, 25.0, 29.0, 37.0, 26.0, 35.0, 27.0, 37.0, 62.0, 31.0, 45.0, 35.0, 48.0, 41.0, 37.0, 35.0, 41.0, 30.0, 34.0, 26.0, 29.0, 21.0, 16.0, 19.0, 16.0, 16.0, 8.0, 9.0, 9.0, 4.0, 7.0, 2.0, 4.0, 6.0, 4.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00012624263763427734, -0.00012203399091959, -0.00011782534420490265, -0.0001136166974902153, -0.00010940805077552795, -0.0001051994040608406, -0.00010099075734615326, -9.678211063146591e-05, -9.257346391677856e-05, -8.836481720209122e-05, -8.415617048740387e-05, -7.994752377271652e-05, -7.573887705802917e-05, -7.153023034334183e-05, -6.732158362865448e-05, -6.311293691396713e-05, -5.8904290199279785e-05, -5.469564348459244e-05, -5.048699676990509e-05, -4.627835005521774e-05, -4.2069703340530396e-05, -3.786105662584305e-05, -3.36524099111557e-05, -2.9443763196468353e-05, -2.5235116481781006e-05, -2.102646976709366e-05, -1.681782305240631e-05, -1.2609176337718964e-05, -8.400529623031616e-06, -4.191882908344269e-06, 1.6763806343078613e-08, 4.225410521030426e-06, 8.434057235717773e-06, 1.2642703950405121e-05, 1.6851350665092468e-05, 2.1059997379779816e-05, 2.5268644094467163e-05, 2.947729080915451e-05, 3.368593752384186e-05, 3.7894584238529205e-05, 4.210323095321655e-05, 4.63118776679039e-05, 5.052052438259125e-05, 5.4729171097278595e-05, 5.893781781196594e-05, 6.314646452665329e-05, 6.735511124134064e-05, 7.156375795602798e-05, 7.577240467071533e-05, 7.998105138540268e-05, 8.418969810009003e-05, 8.839834481477737e-05, 9.260699152946472e-05, 9.681563824415207e-05, 0.00010102428495883942, 0.00010523293167352676, 0.00010944157838821411, 0.00011365022510290146, 0.0001178588718175888, 0.00012206751853227615, 0.0001262761652469635, 0.00013048481196165085, 0.0001346934586763382, 0.00013890210539102554, 0.0001431107521057129]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 7.0, 7.0, 8.0, 10.0, 14.0, 14.0, 28.0, 41.0, 46.0, 68.0, 93.0, 151.0, 277.0, 431.0, 759.0, 1156.0, 2103.0, 3827.0, 7343.0, 15857.0, 40156.0, 131510.0, 610379.0, 155684.0, 43873.0, 17269.0, 7901.0, 3985.0, 2271.0, 1231.0, 766.0, 483.0, 279.0, 161.0, 105.0, 57.0, 58.0, 43.0, 28.0, 24.0, 12.0, 9.0, 8.0, 6.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010985136032104492, -0.00010647624731063843, -0.00010310113430023193, -9.972602128982544e-05, -9.635090827941895e-05, -9.297579526901245e-05, -8.960068225860596e-05, -8.622556924819946e-05, -8.285045623779297e-05, -7.947534322738647e-05, -7.610023021697998e-05, -7.272511720657349e-05, -6.935000419616699e-05, -6.59748911857605e-05, -6.2599778175354e-05, -5.922466516494751e-05, -5.5849552154541016e-05, -5.247443914413452e-05, -4.909932613372803e-05, -4.572421312332153e-05, -4.234910011291504e-05, -3.8973987102508545e-05, -3.559887409210205e-05, -3.222376108169556e-05, -2.8848648071289062e-05, -2.547353506088257e-05, -2.2098422050476074e-05, -1.872330904006958e-05, -1.5348196029663086e-05, -1.1973083019256592e-05, -8.597970008850098e-06, -5.2228569984436035e-06, -1.8477439880371094e-06, 1.5273690223693848e-06, 4.902482032775879e-06, 8.277595043182373e-06, 1.1652708053588867e-05, 1.5027821063995361e-05, 1.8402934074401855e-05, 2.177804708480835e-05, 2.5153160095214844e-05, 2.8528273105621338e-05, 3.190338611602783e-05, 3.5278499126434326e-05, 3.865361213684082e-05, 4.2028725147247314e-05, 4.540383815765381e-05, 4.87789511680603e-05, 5.21540641784668e-05, 5.552917718887329e-05, 5.8904290199279785e-05, 6.227940320968628e-05, 6.565451622009277e-05, 6.902962923049927e-05, 7.240474224090576e-05, 7.577985525131226e-05, 7.915496826171875e-05, 8.253008127212524e-05, 8.590519428253174e-05, 8.928030729293823e-05, 9.265542030334473e-05, 9.603053331375122e-05, 9.940564632415771e-05, 0.00010278075933456421, 0.0001061558723449707]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 3.0, 7.0, 10.0, 18.0, 10.0, 14.0, 38.0, 51.0, 60.0, 77.0, 122.0, 91.0, 128.0, 91.0, 63.0, 64.0, 39.0, 34.0, 19.0, 9.0, 8.0, 11.0, 10.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6808509826660156e-05, -1.6179867088794708e-05, -1.555122435092926e-05, -1.4922581613063812e-05, -1.4293938875198364e-05, -1.3665296137332916e-05, -1.3036653399467468e-05, -1.240801066160202e-05, -1.1779367923736572e-05, -1.1150725185871124e-05, -1.0522082448005676e-05, -9.893439710140228e-06, -9.26479697227478e-06, -8.636154234409332e-06, -8.007511496543884e-06, -7.378868758678436e-06, -6.750226020812988e-06, -6.12158328294754e-06, -5.492940545082092e-06, -4.864297807216644e-06, -4.235655069351196e-06, -3.6070123314857483e-06, -2.9783695936203003e-06, -2.3497268557548523e-06, -1.7210841178894043e-06, -1.0924413800239563e-06, -4.637986421585083e-07, 1.648440957069397e-07, 7.934868335723877e-07, 1.4221295714378357e-06, 2.0507723093032837e-06, 2.6794150471687317e-06, 3.3080577850341797e-06, 3.936700522899628e-06, 4.565343260765076e-06, 5.193985998630524e-06, 5.822628736495972e-06, 6.45127147436142e-06, 7.079914212226868e-06, 7.708556950092316e-06, 8.337199687957764e-06, 8.965842425823212e-06, 9.59448516368866e-06, 1.0223127901554108e-05, 1.0851770639419556e-05, 1.1480413377285004e-05, 1.2109056115150452e-05, 1.27376988530159e-05, 1.3366341590881348e-05, 1.3994984328746796e-05, 1.4623627066612244e-05, 1.5252269804477692e-05, 1.588091254234314e-05, 1.6509555280208588e-05, 1.7138198018074036e-05, 1.7766840755939484e-05, 1.839548349380493e-05, 1.902412623167038e-05, 1.9652768969535828e-05, 2.0281411707401276e-05, 2.0910054445266724e-05, 2.153869718313217e-05, 2.216733992099762e-05, 2.2795982658863068e-05, 2.3424625396728516e-05]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 6.0, 8.0, 11.0, 6.0, 11.0, 27.0, 44.0, 58.0, 84.0, 124.0, 141.0, 235.0, 298.0, 463.0, 594.0, 941.0, 1273.0, 1999.0, 2897.0, 4102.0, 6314.0, 8932.0, 14241.0, 20735.0, 34774.0, 55723.0, 111344.0, 305653.0, 242546.0, 95481.0, 49544.0, 31505.0, 18921.0, 13074.0, 8345.0, 5759.0, 3738.0, 2721.0, 1769.0, 1271.0, 842.0, 587.0, 408.0, 288.0, 204.0, 159.0, 102.0, 74.0, 51.0, 35.0, 32.0, 23.0, 10.0, 15.0, 2.0, 5.0, 5.0, 0.0, 4.0, 0.0, 1.0], "bins": [-3.600120544433594e-05, -3.4836120903491974e-05, -3.367103636264801e-05, -3.250595182180405e-05, -3.134086728096008e-05, -3.017578274011612e-05, -2.9010698199272156e-05, -2.7845613658428192e-05, -2.668052911758423e-05, -2.5515444576740265e-05, -2.43503600358963e-05, -2.3185275495052338e-05, -2.2020190954208374e-05, -2.085510641336441e-05, -1.9690021872520447e-05, -1.8524937331676483e-05, -1.735985279083252e-05, -1.6194768249988556e-05, -1.5029683709144592e-05, -1.3864599168300629e-05, -1.2699514627456665e-05, -1.1534430086612701e-05, -1.0369345545768738e-05, -9.204261004924774e-06, -8.03917646408081e-06, -6.874091923236847e-06, -5.709007382392883e-06, -4.54392284154892e-06, -3.378838300704956e-06, -2.2137537598609924e-06, -1.0486692190170288e-06, 1.1641532182693481e-07, 1.2814998626708984e-06, 2.446584403514862e-06, 3.6116689443588257e-06, 4.776753485202789e-06, 5.941838026046753e-06, 7.1069225668907166e-06, 8.27200710773468e-06, 9.437091648578644e-06, 1.0602176189422607e-05, 1.1767260730266571e-05, 1.2932345271110535e-05, 1.4097429811954498e-05, 1.5262514352798462e-05, 1.6427598893642426e-05, 1.759268343448639e-05, 1.8757767975330353e-05, 1.9922852516174316e-05, 2.108793705701828e-05, 2.2253021597862244e-05, 2.3418106138706207e-05, 2.458319067955017e-05, 2.5748275220394135e-05, 2.6913359761238098e-05, 2.8078444302082062e-05, 2.9243528842926025e-05, 3.040861338376999e-05, 3.157369792461395e-05, 3.2738782465457916e-05, 3.390386700630188e-05, 3.5068951547145844e-05, 3.623403608798981e-05, 3.739912062883377e-05, 3.8564205169677734e-05]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 8.0, 12.0, 9.0, 13.0, 13.0, 22.0, 16.0, 21.0, 22.0, 24.0, 34.0, 27.0, 37.0, 39.0, 50.0, 38.0, 64.0, 39.0, 54.0, 52.0, 51.0, 54.0, 39.0, 35.0, 31.0, 25.0, 21.0, 20.0, 22.0, 22.0, 9.0, 11.0, 14.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.510713577270508e-05, -3.4047290682792664e-05, -3.298744559288025e-05, -3.1927600502967834e-05, -3.086775541305542e-05, -2.9807910323143005e-05, -2.874806523323059e-05, -2.7688220143318176e-05, -2.6628375053405762e-05, -2.5568529963493347e-05, -2.4508684873580933e-05, -2.3448839783668518e-05, -2.2388994693756104e-05, -2.132914960384369e-05, -2.0269304513931274e-05, -1.920945942401886e-05, -1.8149614334106445e-05, -1.708976924419403e-05, -1.6029924154281616e-05, -1.4970079064369202e-05, -1.3910233974456787e-05, -1.2850388884544373e-05, -1.1790543794631958e-05, -1.0730698704719543e-05, -9.670853614807129e-06, -8.611008524894714e-06, -7.5511634349823e-06, -6.491318345069885e-06, -5.431473255157471e-06, -4.371628165245056e-06, -3.3117830753326416e-06, -2.251937985420227e-06, -1.1920928955078125e-06, -1.3224780559539795e-07, 9.275972843170166e-07, 1.987442374229431e-06, 3.0472874641418457e-06, 4.10713255405426e-06, 5.166977643966675e-06, 6.226822733879089e-06, 7.286667823791504e-06, 8.346512913703918e-06, 9.406358003616333e-06, 1.0466203093528748e-05, 1.1526048183441162e-05, 1.2585893273353577e-05, 1.3645738363265991e-05, 1.4705583453178406e-05, 1.576542854309082e-05, 1.6825273633003235e-05, 1.788511872291565e-05, 1.8944963812828064e-05, 2.000480890274048e-05, 2.1064653992652893e-05, 2.2124499082565308e-05, 2.3184344172477722e-05, 2.4244189262390137e-05, 2.530403435230255e-05, 2.6363879442214966e-05, 2.742372453212738e-05, 2.8483569622039795e-05, 2.954341471195221e-05, 3.0603259801864624e-05, 3.166310489177704e-05, 3.272294998168945e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 6.0, 9.0, 13.0, 18.0, 17.0, 34.0, 54.0, 75.0, 112.0, 192.0, 299.0, 575.0, 1108.0, 2129.0, 4442.0, 10563.0, 28327.0, 95258.0, 523417.0, 285543.0, 61522.0, 19757.0, 7867.0, 3412.0, 1687.0, 916.0, 469.0, 295.0, 145.0, 97.0, 65.0, 35.0, 36.0, 16.0, 13.0, 14.0, 7.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.662441253662109e-06, -5.4836273193359375e-06, -5.304813385009766e-06, -5.125999450683594e-06, -4.947185516357422e-06, -4.76837158203125e-06, -4.589557647705078e-06, -4.410743713378906e-06, -4.231929779052734e-06, -4.0531158447265625e-06, -3.874301910400391e-06, -3.6954879760742188e-06, -3.516674041748047e-06, -3.337860107421875e-06, -3.159046173095703e-06, -2.9802322387695312e-06, -2.8014183044433594e-06, -2.6226043701171875e-06, -2.4437904357910156e-06, -2.2649765014648438e-06, -2.086162567138672e-06, -1.9073486328125e-06, -1.7285346984863281e-06, -1.5497207641601562e-06, -1.3709068298339844e-06, -1.1920928955078125e-06, -1.0132789611816406e-06, -8.344650268554688e-07, -6.556510925292969e-07, -4.76837158203125e-07, -2.980232238769531e-07, -1.1920928955078125e-07, 5.960464477539063e-08, 2.384185791015625e-07, 4.172325134277344e-07, 5.960464477539062e-07, 7.748603820800781e-07, 9.5367431640625e-07, 1.1324882507324219e-06, 1.3113021850585938e-06, 1.4901161193847656e-06, 1.6689300537109375e-06, 1.8477439880371094e-06, 2.0265579223632812e-06, 2.205371856689453e-06, 2.384185791015625e-06, 2.562999725341797e-06, 2.7418136596679688e-06, 2.9206275939941406e-06, 3.0994415283203125e-06, 3.2782554626464844e-06, 3.4570693969726562e-06, 3.635883331298828e-06, 3.814697265625e-06, 3.993511199951172e-06, 4.172325134277344e-06, 4.351139068603516e-06, 4.5299530029296875e-06, 4.708766937255859e-06, 4.887580871582031e-06, 5.066394805908203e-06, 5.245208740234375e-06, 5.424022674560547e-06, 5.602836608886719e-06, 5.781650543212891e-06]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 12.0, 10.0, 20.0, 16.0, 0.0, 28.0, 18.0, 31.0, 33.0, 0.0, 45.0, 57.0, 78.0, 96.0, 0.0, 87.0, 102.0, 78.0, 56.0, 50.0, 0.0, 45.0, 25.0, 26.0, 30.0, 0.0, 15.0, 12.0, 6.0, 9.0, 0.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5012919902801514e-06, -1.4528632164001465e-06, -1.4044344425201416e-06, -1.3560056686401367e-06, -1.3075768947601318e-06, -1.259148120880127e-06, -1.210719347000122e-06, -1.1622905731201172e-06, -1.1138617992401123e-06, -1.0654330253601074e-06, -1.0170042514801025e-06, -9.685754776000977e-07, -9.201467037200928e-07, -8.717179298400879e-07, -8.23289155960083e-07, -7.748603820800781e-07, -7.264316082000732e-07, -6.780028343200684e-07, -6.295740604400635e-07, -5.811452865600586e-07, -5.327165126800537e-07, -4.842877388000488e-07, -4.3585896492004395e-07, -3.8743019104003906e-07, -3.390014171600342e-07, -2.905726432800293e-07, -2.421438694000244e-07, -1.9371509552001953e-07, -1.4528632164001465e-07, -9.685754776000977e-08, -4.842877388000488e-08, 0.0, 4.842877388000488e-08, 9.685754776000977e-08, 1.4528632164001465e-07, 1.9371509552001953e-07, 2.421438694000244e-07, 2.905726432800293e-07, 3.390014171600342e-07, 3.8743019104003906e-07, 4.3585896492004395e-07, 4.842877388000488e-07, 5.327165126800537e-07, 5.811452865600586e-07, 6.295740604400635e-07, 6.780028343200684e-07, 7.264316082000732e-07, 7.748603820800781e-07, 8.23289155960083e-07, 8.717179298400879e-07, 9.201467037200928e-07, 9.685754776000977e-07, 1.0170042514801025e-06, 1.0654330253601074e-06, 1.1138617992401123e-06, 1.1622905731201172e-06, 1.210719347000122e-06, 1.259148120880127e-06, 1.3075768947601318e-06, 1.3560056686401367e-06, 1.4044344425201416e-06, 1.4528632164001465e-06, 1.5012919902801514e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 7.0, 3.0, 5.0, 6.0, 3.0, 20.0, 13.0, 30.0, 14.0, 60.0, 43.0, 53.0, 167.0, 129.0, 324.0, 218.0, 675.0, 569.0, 1635.0, 1302.0, 1769.0, 6010.0, 5274.0, 20363.0, 20204.0, 103829.0, 168560.0, 385988.0, 236861.0, 35471.0, 32673.0, 7806.0, 8887.0, 2527.0, 3097.0, 925.0, 687.0, 957.0, 309.0, 429.0, 148.0, 173.0, 62.0, 65.0, 78.0, 28.0, 38.0, 12.0, 23.0, 10.0, 11.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.596527338027954e-06, -2.51084566116333e-06, -2.425163984298706e-06, -2.339482307434082e-06, -2.253800630569458e-06, -2.168118953704834e-06, -2.08243727684021e-06, -1.996755599975586e-06, -1.911073923110962e-06, -1.8253922462463379e-06, -1.7397105693817139e-06, -1.6540288925170898e-06, -1.5683472156524658e-06, -1.4826655387878418e-06, -1.3969838619232178e-06, -1.3113021850585938e-06, -1.2256205081939697e-06, -1.1399388313293457e-06, -1.0542571544647217e-06, -9.685754776000977e-07, -8.828938007354736e-07, -7.972121238708496e-07, -7.115304470062256e-07, -6.258487701416016e-07, -5.401670932769775e-07, -4.544854164123535e-07, -3.688037395477295e-07, -2.8312206268310547e-07, -1.9744038581848145e-07, -1.1175870895385742e-07, -2.60770320892334e-08, 5.960464477539063e-08, 1.4528632164001465e-07, 2.3096799850463867e-07, 3.166496753692627e-07, 4.023313522338867e-07, 4.880130290985107e-07, 5.736947059631348e-07, 6.593763828277588e-07, 7.450580596923828e-07, 8.307397365570068e-07, 9.164214134216309e-07, 1.0021030902862549e-06, 1.087784767150879e-06, 1.173466444015503e-06, 1.259148120880127e-06, 1.344829797744751e-06, 1.430511474609375e-06, 1.516193151473999e-06, 1.601874828338623e-06, 1.687556505203247e-06, 1.773238182067871e-06, 1.8589198589324951e-06, 1.944601535797119e-06, 2.030283212661743e-06, 2.115964889526367e-06, 2.201646566390991e-06, 2.2873282432556152e-06, 2.3730099201202393e-06, 2.4586915969848633e-06, 2.5443732738494873e-06, 2.6300549507141113e-06, 2.7157366275787354e-06, 2.8014183044433594e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 7.0, 3.0, 3.0, 5.0, 5.0, 11.0, 12.0, 25.0, 22.0, 20.0, 19.0, 31.0, 45.0, 42.0, 120.0, 81.0, 95.0, 83.0, 68.0, 48.0, 47.0, 77.0, 23.0, 24.0, 15.0, 18.0, 10.0, 5.0, 12.0, 8.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.562999725341797e-06, -2.495013177394867e-06, -2.427026629447937e-06, -2.359040081501007e-06, -2.291053533554077e-06, -2.2230669856071472e-06, -2.1550804376602173e-06, -2.0870938897132874e-06, -2.0191073417663574e-06, -1.9511207938194275e-06, -1.8831342458724976e-06, -1.8151476979255676e-06, -1.7471611499786377e-06, -1.6791746020317078e-06, -1.6111880540847778e-06, -1.543201506137848e-06, -1.475214958190918e-06, -1.407228410243988e-06, -1.339241862297058e-06, -1.2712553143501282e-06, -1.2032687664031982e-06, -1.1352822184562683e-06, -1.0672956705093384e-06, -9.993091225624084e-07, -9.313225746154785e-07, -8.633360266685486e-07, -7.953494787216187e-07, -7.273629307746887e-07, -6.593763828277588e-07, -5.913898348808289e-07, -5.234032869338989e-07, -4.55416738986969e-07, -3.8743019104003906e-07, -3.1944364309310913e-07, -2.514570951461792e-07, -1.8347054719924927e-07, -1.1548399925231934e-07, -4.7497451305389404e-08, 2.0489096641540527e-08, 8.847564458847046e-08, 1.564621925354004e-07, 2.2444874048233032e-07, 2.9243528842926025e-07, 3.604218363761902e-07, 4.284083843231201e-07, 4.9639493227005e-07, 5.6438148021698e-07, 6.323680281639099e-07, 7.003545761108398e-07, 7.683411240577698e-07, 8.363276720046997e-07, 9.043142199516296e-07, 9.723007678985596e-07, 1.0402873158454895e-06, 1.1082738637924194e-06, 1.1762604117393494e-06, 1.2442469596862793e-06, 1.3122335076332092e-06, 1.3802200555801392e-06, 1.448206603527069e-06, 1.516193151473999e-06, 1.584179699420929e-06, 1.6521662473678589e-06, 1.7201527953147888e-06, 1.7881393432617188e-06]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 5.0, 5.0, 18.0, 14.0, 23.0, 38.0, 45.0, 62.0, 117.0, 258.0, 126.0, 76.0, 58.0, 31.0, 35.0, 20.0, 12.0, 16.0, 9.0, 7.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001925597171066329, -0.00018602219643071294, -0.00017948469030670822, -0.00017294716963078827, -0.00016640964895486832, -0.00015987212827894837, -0.00015333460760302842, -0.0001467971014790237, -0.00014025958080310374, -0.0001337220601271838, -0.00012718455400317907, -0.00012064703332725912, -0.00011410951265133917, -0.00010757199197541922, -0.00010103447857545689, -9.449696517549455e-05, -8.79594444995746e-05, -8.142192382365465e-05, -7.488441042369232e-05, -6.834689702372998e-05, -6.180937634781003e-05, -5.527185930986889e-05, -4.8734342271927744e-05, -4.21968252339866e-05, -3.565930819604546e-05, -2.9121791158104315e-05, -2.2584274120163172e-05, -1.604675708222203e-05, -9.509240044280887e-06, -2.9717230063397437e-06, 3.565794031601399e-06, 1.0103311069542542e-05, 1.6640813555568457e-05, 2.31783305935096e-05, 2.9715847631450742e-05, 3.6253364669391885e-05, 4.279088170733303e-05, 4.932839874527417e-05, 5.5865915783215314e-05, 6.240342918317765e-05, 6.89409498590976e-05, 7.547847053501755e-05, 8.201598393497989e-05, 8.855349733494222e-05, 9.509101801086217e-05, 0.00010162853868678212, 0.00010816605208674446, 0.0001147035654867068, 0.00012124108616262674, 0.0001277786068385467, 0.00013431612751446664, 0.00014085363363847136, 0.00014739115431439131, 0.00015392867499031126, 0.000160466181114316, 0.00016700370179023594, 0.0001735412224661559, 0.00018007874314207584, 0.0001866162638179958, 0.0001931537699420005, 0.00019969129061792046, 0.0002062288112938404, 0.00021276631741784513, 0.00021930383809376508, 0.00022584135876968503]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 7.0, 10.0, 11.0, 11.0, 13.0, 23.0, 19.0, 25.0, 36.0, 18.0, 32.0, 36.0, 26.0, 39.0, 30.0, 27.0, 41.0, 33.0, 44.0, 46.0, 35.0, 35.0, 31.0, 28.0, 29.0, 32.0, 27.0, 30.0, 27.0, 19.0, 20.0, 31.0, 14.0, 13.0, 11.0, 13.0, 6.0, 4.0, 19.0, 7.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.171796798706055e-05, -7.910747081041336e-05, -7.649697363376617e-05, -7.388647645711899e-05, -7.12759792804718e-05, -6.866548210382462e-05, -6.605498492717743e-05, -6.344448775053024e-05, -6.083399057388306e-05, -5.822349339723587e-05, -5.5612996220588684e-05, -5.30024990439415e-05, -5.039200186729431e-05, -4.7781504690647125e-05, -4.517100751399994e-05, -4.256051033735275e-05, -3.9950013160705566e-05, -3.733951598405838e-05, -3.4729018807411194e-05, -3.211852163076401e-05, -2.950802445411682e-05, -2.6897527277469635e-05, -2.428703010082245e-05, -2.1676532924175262e-05, -1.9066035747528076e-05, -1.645553857088089e-05, -1.3845041394233704e-05, -1.1234544217586517e-05, -8.624047040939331e-06, -6.013549864292145e-06, -3.4030526876449585e-06, -7.925555109977722e-07, 1.817941665649414e-06, 4.4284388422966e-06, 7.038936018943787e-06, 9.649433195590973e-06, 1.225993037223816e-05, 1.4870427548885345e-05, 1.7480924725532532e-05, 2.0091421902179718e-05, 2.2701919078826904e-05, 2.531241625547409e-05, 2.7922913432121277e-05, 3.053341060876846e-05, 3.314390778541565e-05, 3.5754404962062836e-05, 3.836490213871002e-05, 4.097539931535721e-05, 4.3585896492004395e-05, 4.619639366865158e-05, 4.880689084529877e-05, 5.141738802194595e-05, 5.402788519859314e-05, 5.6638382375240326e-05, 5.924887955188751e-05, 6.18593767285347e-05, 6.446987390518188e-05, 6.708037108182907e-05, 6.969086825847626e-05, 7.230136543512344e-05, 7.491186261177063e-05, 7.752235978841782e-05, 8.0132856965065e-05, 8.274335414171219e-05, 8.535385131835938e-05]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 18.0, 24.0, 30.0, 53.0, 84.0, 163.0, 253.0, 452.0, 822.0, 1605.0, 3218.0, 7115.0, 17248.0, 50920.0, 223287.0, 3658534.0, 161485.0, 41069.0, 15176.0, 6167.0, 2855.0, 1455.0, 804.0, 415.0, 280.0, 158.0, 118.0, 66.0, 67.0, 49.0, 36.0, 23.0, 31.0, 23.0, 30.0, 29.0, 14.0, 18.0, 14.0, 8.0, 11.0, 12.0, 9.0, 11.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.02414321899414e-05, -8.603185415267944e-05, -8.182227611541748e-05, -7.761269807815552e-05, -7.340312004089355e-05, -6.919354200363159e-05, -6.498396396636963e-05, -6.0774385929107666e-05, -5.65648078918457e-05, -5.235522985458374e-05, -4.814565181732178e-05, -4.3936073780059814e-05, -3.972649574279785e-05, -3.551691770553589e-05, -3.1307339668273926e-05, -2.7097761631011963e-05, -2.288818359375e-05, -1.8678605556488037e-05, -1.4469027519226074e-05, -1.0259449481964111e-05, -6.0498714447021484e-06, -1.8402934074401855e-06, 2.3692846298217773e-06, 6.57886266708374e-06, 1.0788440704345703e-05, 1.4998018741607666e-05, 1.920759677886963e-05, 2.3417174816131592e-05, 2.7626752853393555e-05, 3.183633089065552e-05, 3.604590892791748e-05, 4.025548696517944e-05, 4.4465065002441406e-05, 4.867464303970337e-05, 5.288422107696533e-05, 5.7093799114227295e-05, 6.130337715148926e-05, 6.551295518875122e-05, 6.972253322601318e-05, 7.393211126327515e-05, 7.814168930053711e-05, 8.235126733779907e-05, 8.656084537506104e-05, 9.0770423412323e-05, 9.498000144958496e-05, 9.918957948684692e-05, 0.00010339915752410889, 0.00010760873556137085, 0.00011181831359863281, 0.00011602789163589478, 0.00012023746967315674, 0.0001244470477104187, 0.00012865662574768066, 0.00013286620378494263, 0.0001370757818222046, 0.00014128535985946655, 0.00014549493789672852, 0.00014970451593399048, 0.00015391409397125244, 0.0001581236720085144, 0.00016233325004577637, 0.00016654282808303833, 0.0001707524061203003, 0.00017496198415756226, 0.00017917156219482422]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 10.0, 16.0, 14.0, 24.0, 45.0, 59.0, 83.0, 132.0, 150.0, 132.0, 101.0, 85.0, 44.0, 30.0, 39.0, 11.0, 8.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.627206802368164e-05, -1.5494413673877716e-05, -1.4716759324073792e-05, -1.3939104974269867e-05, -1.3161450624465942e-05, -1.2383796274662018e-05, -1.1606141924858093e-05, -1.0828487575054169e-05, -1.0050833225250244e-05, -9.27317887544632e-06, -8.495524525642395e-06, -7.71787017583847e-06, -6.940215826034546e-06, -6.162561476230621e-06, -5.384907126426697e-06, -4.607252776622772e-06, -3.829598426818848e-06, -3.051944077014923e-06, -2.2742897272109985e-06, -1.496635377407074e-06, -7.189810276031494e-07, 5.8673322200775146e-08, 8.363276720046997e-07, 1.6139820218086243e-06, 2.391636371612549e-06, 3.1692907214164734e-06, 3.946945071220398e-06, 4.7245994210243225e-06, 5.502253770828247e-06, 6.279908120632172e-06, 7.057562470436096e-06, 7.83521682024002e-06, 8.612871170043945e-06, 9.39052551984787e-06, 1.0168179869651794e-05, 1.0945834219455719e-05, 1.1723488569259644e-05, 1.2501142919063568e-05, 1.3278797268867493e-05, 1.4056451618671417e-05, 1.4834105968475342e-05, 1.5611760318279266e-05, 1.638941466808319e-05, 1.7167069017887115e-05, 1.794472336769104e-05, 1.8722377717494965e-05, 1.950003206729889e-05, 2.0277686417102814e-05, 2.1055340766906738e-05, 2.1832995116710663e-05, 2.2610649466514587e-05, 2.3388303816318512e-05, 2.4165958166122437e-05, 2.494361251592636e-05, 2.5721266865730286e-05, 2.649892121553421e-05, 2.7276575565338135e-05, 2.805422991514206e-05, 2.8831884264945984e-05, 2.960953861474991e-05, 3.0387192964553833e-05, 3.116484731435776e-05, 3.194250166416168e-05, 3.272015601396561e-05, 3.349781036376953e-05]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 14.0, 10.0, 21.0, 25.0, 50.0, 82.0, 109.0, 164.0, 262.0, 384.0, 615.0, 909.0, 1437.0, 2233.0, 3456.0, 5922.0, 10393.0, 17933.0, 32822.0, 68310.0, 144936.0, 481124.0, 2891974.0, 298437.0, 113150.0, 54449.0, 27151.0, 15039.0, 9137.0, 4970.0, 3110.0, 1996.0, 1306.0, 810.0, 566.0, 310.0, 228.0, 148.0, 85.0, 68.0, 53.0, 32.0, 16.0, 11.0, 7.0, 4.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.233287811279297e-05, -5.076359957456589e-05, -4.9194321036338806e-05, -4.7625042498111725e-05, -4.6055763959884644e-05, -4.448648542165756e-05, -4.291720688343048e-05, -4.13479283452034e-05, -3.977864980697632e-05, -3.820937126874924e-05, -3.6640092730522156e-05, -3.5070814192295074e-05, -3.350153565406799e-05, -3.193225711584091e-05, -3.036297857761383e-05, -2.879370003938675e-05, -2.7224421501159668e-05, -2.5655142962932587e-05, -2.4085864424705505e-05, -2.2516585886478424e-05, -2.0947307348251343e-05, -1.937802881002426e-05, -1.780875027179718e-05, -1.62394717335701e-05, -1.4670193195343018e-05, -1.3100914657115936e-05, -1.1531636118888855e-05, -9.962357580661774e-06, -8.393079042434692e-06, -6.823800504207611e-06, -5.25452196598053e-06, -3.6852434277534485e-06, -2.115964889526367e-06, -5.466863512992859e-07, 1.0225921869277954e-06, 2.5918707251548767e-06, 4.161149263381958e-06, 5.730427801609039e-06, 7.299706339836121e-06, 8.868984878063202e-06, 1.0438263416290283e-05, 1.2007541954517365e-05, 1.3576820492744446e-05, 1.5146099030971527e-05, 1.671537756919861e-05, 1.828465610742569e-05, 1.985393464565277e-05, 2.1423213183879852e-05, 2.2992491722106934e-05, 2.4561770260334015e-05, 2.6131048798561096e-05, 2.7700327336788177e-05, 2.926960587501526e-05, 3.083888441324234e-05, 3.240816295146942e-05, 3.39774414896965e-05, 3.5546720027923584e-05, 3.7115998566150665e-05, 3.8685277104377747e-05, 4.025455564260483e-05, 4.182383418083191e-05, 4.339311271905899e-05, 4.496239125728607e-05, 4.653166979551315e-05, 4.8100948333740234e-05]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 8.0, 6.0, 7.0, 5.0, 4.0, 11.0, 11.0, 19.0, 41.0, 41.0, 40.0, 53.0, 70.0, 69.0, 100.0, 133.0, 267.0, 726.0, 1206.0, 380.0, 181.0, 112.0, 90.0, 88.0, 72.0, 61.0, 50.0, 40.0, 52.0, 28.0, 18.0, 15.0, 16.0, 11.0, 14.0, 10.0, 7.0, 6.0, 5.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.707408905029297e-05, -3.584660589694977e-05, -3.461912274360657e-05, -3.339163959026337e-05, -3.2164156436920166e-05, -3.0936673283576965e-05, -2.9709190130233765e-05, -2.8481706976890564e-05, -2.7254223823547363e-05, -2.6026740670204163e-05, -2.4799257516860962e-05, -2.357177436351776e-05, -2.234429121017456e-05, -2.111680805683136e-05, -1.988932490348816e-05, -1.866184175014496e-05, -1.7434358596801758e-05, -1.6206875443458557e-05, -1.4979392290115356e-05, -1.3751909136772156e-05, -1.2524425983428955e-05, -1.1296942830085754e-05, -1.0069459676742554e-05, -8.841976523399353e-06, -7.614493370056152e-06, -6.387010216712952e-06, -5.159527063369751e-06, -3.93204391002655e-06, -2.7045607566833496e-06, -1.477077603340149e-06, -2.4959444999694824e-07, 9.778887033462524e-07, 2.205371856689453e-06, 3.432855010032654e-06, 4.6603381633758545e-06, 5.887821316719055e-06, 7.115304470062256e-06, 8.342787623405457e-06, 9.570270776748657e-06, 1.0797753930091858e-05, 1.2025237083435059e-05, 1.325272023677826e-05, 1.448020339012146e-05, 1.570768654346466e-05, 1.693516969680786e-05, 1.8162652850151062e-05, 1.9390136003494263e-05, 2.0617619156837463e-05, 2.1845102310180664e-05, 2.3072585463523865e-05, 2.4300068616867065e-05, 2.5527551770210266e-05, 2.6755034923553467e-05, 2.7982518076896667e-05, 2.9210001230239868e-05, 3.043748438358307e-05, 3.166496753692627e-05, 3.289245069026947e-05, 3.411993384361267e-05, 3.534741699695587e-05, 3.657490015029907e-05, 3.780238330364227e-05, 3.9029866456985474e-05, 4.0257349610328674e-05, 4.1484832763671875e-05]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 18.0, 19.0, 33.0, 67.0, 74.0, 105.0, 127.0, 100.0, 110.0, 57.0, 38.0, 46.0, 34.0, 23.0, 30.0, 18.0, 20.0, 7.0, 8.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026325476937927306, -0.00025325894239358604, -0.00024326311540789902, -0.000233267288422212, -0.00022327144688460976, -0.00021327561989892274, -0.00020327979291323572, -0.00019328395137563348, -0.00018328812438994646, -0.00017329229740425944, -0.00016329647041857243, -0.0001533006434328854, -0.00014330480189528316, -0.00013330897490959615, -0.00012331314792390913, -0.0001133173136622645, -0.00010332149395253509, -9.332566696684808e-05, -8.332983270520344e-05, -7.333400571951643e-05, -6.33381714578718e-05, -5.334234447218478e-05, -4.334651748649776e-05, -3.335068322485313e-05, -2.335485623916611e-05, -1.3359026524994988e-05, -3.3631968108238652e-06, 6.632631993852556e-06, 1.662846261751838e-05, 2.6624293241184205e-05, 3.662012022687122e-05, 4.6615954488515854e-05, 5.661178147420287e-05, 6.660760845988989e-05, 7.660344272153452e-05, 8.659926970722154e-05, 9.659510396886617e-05, 0.00010659093095455319, 0.0001165867579402402, 0.00012658259947784245, 0.00013657842646352947, 0.00014657425344921649, 0.0001565700804349035, 0.00016656590742059052, 0.00017656174895819277, 0.00018655757594387978, 0.0001965534029295668, 0.00020654924446716905, 0.00021654505690094084, 0.00022654088388662785, 0.00023653671087231487, 0.0002465325524099171, 0.00025652837939560413, 0.00026652420638129115, 0.00027652003336697817, 0.0002865158603526652, 0.0002965116873383522, 0.0003065075143240392, 0.00031650334130972624, 0.00032649916829541326, 0.0003364949952811003, 0.0003464908222667873, 0.0003564866492524743, 0.0003664825053419918, 0.0003764783323276788]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 12.0, 6.0, 9.0, 12.0, 17.0, 15.0, 20.0, 15.0, 15.0, 19.0, 26.0, 29.0, 28.0, 33.0, 30.0, 40.0, 27.0, 42.0, 33.0, 33.0, 32.0, 38.0, 30.0, 46.0, 41.0, 43.0, 38.0, 37.0, 24.0, 20.0, 17.0, 27.0, 17.0, 16.0, 15.0, 20.0, 13.0, 10.0, 11.0, 7.0, 1.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.0001723766326904297, -0.00016716867685317993, -0.00016196072101593018, -0.00015675276517868042, -0.00015154480934143066, -0.0001463368535041809, -0.00014112889766693115, -0.0001359209418296814, -0.00013071298599243164, -0.00012550503015518188, -0.00012029707431793213, -0.00011508911848068237, -0.00010988116264343262, -0.00010467320680618286, -9.94652509689331e-05, -9.425729513168335e-05, -8.90493392944336e-05, -8.384138345718384e-05, -7.863342761993408e-05, -7.342547178268433e-05, -6.821751594543457e-05, -6.300956010818481e-05, -5.780160427093506e-05, -5.25936484336853e-05, -4.738569259643555e-05, -4.217773675918579e-05, -3.6969780921936035e-05, -3.176182508468628e-05, -2.6553869247436523e-05, -2.1345913410186768e-05, -1.6137957572937012e-05, -1.0930001735687256e-05, -5.7220458984375e-06, -5.140900611877441e-07, 4.693865776062012e-06, 9.901821613311768e-06, 1.5109777450561523e-05, 2.031773328781128e-05, 2.5525689125061035e-05, 3.073364496231079e-05, 3.594160079956055e-05, 4.11495566368103e-05, 4.635751247406006e-05, 5.1565468311309814e-05, 5.677342414855957e-05, 6.198137998580933e-05, 6.718933582305908e-05, 7.239729166030884e-05, 7.76052474975586e-05, 8.281320333480835e-05, 8.80211591720581e-05, 9.322911500930786e-05, 9.843707084655762e-05, 0.00010364502668380737, 0.00010885298252105713, 0.00011406093835830688, 0.00011926889419555664, 0.0001244768500328064, 0.00012968480587005615, 0.0001348927617073059, 0.00014010071754455566, 0.00014530867338180542, 0.00015051662921905518, 0.00015572458505630493, 0.0001609325408935547]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 9.0, 8.0, 9.0, 13.0, 20.0, 20.0, 28.0, 37.0, 43.0, 67.0, 106.0, 170.0, 309.0, 628.0, 1332.0, 3004.0, 6806.0, 17774.0, 57033.0, 344210.0, 514623.0, 68560.0, 19871.0, 7592.0, 3221.0, 1470.0, 639.0, 370.0, 177.0, 123.0, 68.0, 43.0, 37.0, 31.0, 24.0, 13.0, 13.0, 9.0, 8.0, 10.0, 7.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00013375282287597656, -0.0001294463872909546, -0.00012513995170593262, -0.00012083351612091064, -0.00011652708053588867, -0.0001122206449508667, -0.00010791420936584473, -0.00010360777378082275, -9.930133819580078e-05, -9.499490261077881e-05, -9.068846702575684e-05, -8.638203144073486e-05, -8.207559585571289e-05, -7.776916027069092e-05, -7.346272468566895e-05, -6.915628910064697e-05, -6.4849853515625e-05, -6.054341793060303e-05, -5.6236982345581055e-05, -5.193054676055908e-05, -4.762411117553711e-05, -4.331767559051514e-05, -3.9011240005493164e-05, -3.470480442047119e-05, -3.039836883544922e-05, -2.6091933250427246e-05, -2.1785497665405273e-05, -1.74790620803833e-05, -1.3172626495361328e-05, -8.866190910339355e-06, -4.559755325317383e-06, -2.5331974029541016e-07, 4.0531158447265625e-06, 8.359551429748535e-06, 1.2665987014770508e-05, 1.697242259979248e-05, 2.1278858184814453e-05, 2.5585293769836426e-05, 2.98917293548584e-05, 3.419816493988037e-05, 3.8504600524902344e-05, 4.2811036109924316e-05, 4.711747169494629e-05, 5.142390727996826e-05, 5.5730342864990234e-05, 6.003677845001221e-05, 6.434321403503418e-05, 6.864964962005615e-05, 7.295608520507812e-05, 7.72625207901001e-05, 8.156895637512207e-05, 8.587539196014404e-05, 9.018182754516602e-05, 9.448826313018799e-05, 9.879469871520996e-05, 0.00010310113430023193, 0.0001074075698852539, 0.00011171400547027588, 0.00011602044105529785, 0.00012032687664031982, 0.0001246333122253418, 0.00012893974781036377, 0.00013324618339538574, 0.00013755261898040771, 0.0001418590545654297]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 10.0, 9.0, 17.0, 24.0, 22.0, 38.0, 51.0, 98.0, 123.0, 121.0, 113.0, 102.0, 101.0, 60.0, 31.0, 23.0, 18.0, 8.0, 11.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.627206802368164e-05, -1.5565194189548492e-05, -1.4858320355415344e-05, -1.4151446521282196e-05, -1.3444572687149048e-05, -1.27376988530159e-05, -1.2030825018882751e-05, -1.1323951184749603e-05, -1.0617077350616455e-05, -9.910203516483307e-06, -9.203329682350159e-06, -8.49645584821701e-06, -7.789582014083862e-06, -7.082708179950714e-06, -6.375834345817566e-06, -5.668960511684418e-06, -4.9620866775512695e-06, -4.255212843418121e-06, -3.548339009284973e-06, -2.841465175151825e-06, -2.1345913410186768e-06, -1.4277175068855286e-06, -7.208436727523804e-07, -1.3969838619232178e-08, 6.92903995513916e-07, 1.3997778296470642e-06, 2.1066516637802124e-06, 2.8135254979133606e-06, 3.520399332046509e-06, 4.227273166179657e-06, 4.934147000312805e-06, 5.641020834445953e-06, 6.3478946685791016e-06, 7.05476850271225e-06, 7.761642336845398e-06, 8.468516170978546e-06, 9.175390005111694e-06, 9.882263839244843e-06, 1.058913767337799e-05, 1.1296011507511139e-05, 1.2002885341644287e-05, 1.2709759175777435e-05, 1.3416633009910583e-05, 1.4123506844043732e-05, 1.483038067817688e-05, 1.5537254512310028e-05, 1.6244128346443176e-05, 1.6951002180576324e-05, 1.7657876014709473e-05, 1.836474984884262e-05, 1.907162368297577e-05, 1.9778497517108917e-05, 2.0485371351242065e-05, 2.1192245185375214e-05, 2.1899119019508362e-05, 2.260599285364151e-05, 2.3312866687774658e-05, 2.4019740521907806e-05, 2.4726614356040955e-05, 2.5433488190174103e-05, 2.614036202430725e-05, 2.68472358584404e-05, 2.7554109692573547e-05, 2.8260983526706696e-05, 2.8967857360839844e-05]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 3.0, 7.0, 16.0, 12.0, 27.0, 41.0, 38.0, 76.0, 86.0, 141.0, 185.0, 259.0, 392.0, 561.0, 740.0, 1118.0, 1541.0, 2147.0, 3195.0, 4523.0, 6636.0, 9727.0, 14397.0, 22468.0, 34935.0, 57363.0, 102052.0, 244321.0, 270709.0, 105863.0, 59065.0, 35782.0, 22871.0, 15113.0, 9941.0, 6802.0, 4694.0, 3204.0, 2202.0, 1522.0, 1131.0, 766.0, 564.0, 375.0, 308.0, 173.0, 134.0, 99.0, 69.0, 59.0, 36.0, 17.0, 20.0, 13.0, 10.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.141164779663086e-05, -3.039836883544922e-05, -2.9385089874267578e-05, -2.8371810913085938e-05, -2.7358531951904297e-05, -2.6345252990722656e-05, -2.5331974029541016e-05, -2.4318695068359375e-05, -2.3305416107177734e-05, -2.2292137145996094e-05, -2.1278858184814453e-05, -2.0265579223632812e-05, -1.9252300262451172e-05, -1.823902130126953e-05, -1.722574234008789e-05, -1.621246337890625e-05, -1.519918441772461e-05, -1.4185905456542969e-05, -1.3172626495361328e-05, -1.2159347534179688e-05, -1.1146068572998047e-05, -1.0132789611816406e-05, -9.119510650634766e-06, -8.106231689453125e-06, -7.092952728271484e-06, -6.079673767089844e-06, -5.066394805908203e-06, -4.0531158447265625e-06, -3.039836883544922e-06, -2.0265579223632812e-06, -1.0132789611816406e-06, 0.0, 1.0132789611816406e-06, 2.0265579223632812e-06, 3.039836883544922e-06, 4.0531158447265625e-06, 5.066394805908203e-06, 6.079673767089844e-06, 7.092952728271484e-06, 8.106231689453125e-06, 9.119510650634766e-06, 1.0132789611816406e-05, 1.1146068572998047e-05, 1.2159347534179688e-05, 1.3172626495361328e-05, 1.4185905456542969e-05, 1.519918441772461e-05, 1.621246337890625e-05, 1.722574234008789e-05, 1.823902130126953e-05, 1.9252300262451172e-05, 2.0265579223632812e-05, 2.1278858184814453e-05, 2.2292137145996094e-05, 2.3305416107177734e-05, 2.4318695068359375e-05, 2.5331974029541016e-05, 2.6345252990722656e-05, 2.7358531951904297e-05, 2.8371810913085938e-05, 2.9385089874267578e-05, 3.039836883544922e-05, 3.141164779663086e-05, 3.24249267578125e-05, 3.343820571899414e-05]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 0.0, 6.0, 3.0, 5.0, 11.0, 7.0, 12.0, 13.0, 13.0, 15.0, 18.0, 10.0, 16.0, 25.0, 24.0, 31.0, 37.0, 36.0, 33.0, 41.0, 41.0, 40.0, 52.0, 50.0, 33.0, 38.0, 53.0, 44.0, 32.0, 36.0, 33.0, 25.0, 22.0, 24.0, 24.0, 14.0, 13.0, 18.0, 10.0, 11.0, 8.0, 6.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6881694793701172e-05, -2.599228173494339e-05, -2.5102868676185608e-05, -2.4213455617427826e-05, -2.3324042558670044e-05, -2.2434629499912262e-05, -2.154521644115448e-05, -2.0655803382396698e-05, -1.9766390323638916e-05, -1.8876977264881134e-05, -1.7987564206123352e-05, -1.709815114736557e-05, -1.6208738088607788e-05, -1.5319325029850006e-05, -1.4429911971092224e-05, -1.3540498912334442e-05, -1.265108585357666e-05, -1.1761672794818878e-05, -1.0872259736061096e-05, -9.982846677303314e-06, -9.093433618545532e-06, -8.20402055978775e-06, -7.314607501029968e-06, -6.425194442272186e-06, -5.535781383514404e-06, -4.646368324756622e-06, -3.7569552659988403e-06, -2.8675422072410583e-06, -1.9781291484832764e-06, -1.0887160897254944e-06, -1.993030309677124e-07, 6.901100277900696e-07, 1.5795230865478516e-06, 2.4689361453056335e-06, 3.3583492040634155e-06, 4.2477622628211975e-06, 5.1371753215789795e-06, 6.0265883803367615e-06, 6.9160014390945435e-06, 7.805414497852325e-06, 8.694827556610107e-06, 9.58424061536789e-06, 1.0473653674125671e-05, 1.1363066732883453e-05, 1.2252479791641235e-05, 1.3141892850399017e-05, 1.40313059091568e-05, 1.4920718967914581e-05, 1.5810132026672363e-05, 1.6699545085430145e-05, 1.7588958144187927e-05, 1.847837120294571e-05, 1.936778426170349e-05, 2.0257197320461273e-05, 2.1146610379219055e-05, 2.2036023437976837e-05, 2.292543649673462e-05, 2.38148495554924e-05, 2.4704262614250183e-05, 2.5593675673007965e-05, 2.6483088731765747e-05, 2.737250179052353e-05, 2.826191484928131e-05, 2.9151327908039093e-05, 3.0040740966796875e-05]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 15.0, 16.0, 34.0, 42.0, 52.0, 78.0, 144.0, 148.0, 221.0, 483.0, 467.0, 678.0, 1641.0, 1675.0, 2585.0, 6776.0, 8496.0, 15251.0, 59704.0, 129090.0, 435076.0, 240837.0, 93374.0, 21426.0, 11404.0, 8789.0, 3212.0, 2069.0, 1896.0, 826.0, 573.0, 594.0, 257.0, 180.0, 187.0, 70.0, 58.0, 26.0, 30.0, 14.0, 16.0, 8.0, 10.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.231929779052734e-06, -4.0940940380096436e-06, -3.956258296966553e-06, -3.818422555923462e-06, -3.680586814880371e-06, -3.5427510738372803e-06, -3.4049153327941895e-06, -3.2670795917510986e-06, -3.129243850708008e-06, -2.991408109664917e-06, -2.853572368621826e-06, -2.7157366275787354e-06, -2.5779008865356445e-06, -2.4400651454925537e-06, -2.302229404449463e-06, -2.164393663406372e-06, -2.0265579223632812e-06, -1.8887221813201904e-06, -1.7508864402770996e-06, -1.6130506992340088e-06, -1.475214958190918e-06, -1.3373792171478271e-06, -1.1995434761047363e-06, -1.0617077350616455e-06, -9.238719940185547e-07, -7.860362529754639e-07, -6.48200511932373e-07, -5.103647708892822e-07, -3.725290298461914e-07, -2.3469328880310059e-07, -9.685754776000977e-08, 4.0978193283081055e-08, 1.7881393432617188e-07, 3.166496753692627e-07, 4.544854164123535e-07, 5.923211574554443e-07, 7.301568984985352e-07, 8.67992639541626e-07, 1.0058283805847168e-06, 1.1436641216278076e-06, 1.2814998626708984e-06, 1.4193356037139893e-06, 1.55717134475708e-06, 1.695007085800171e-06, 1.8328428268432617e-06, 1.9706785678863525e-06, 2.1085143089294434e-06, 2.246350049972534e-06, 2.384185791015625e-06, 2.522021532058716e-06, 2.6598572731018066e-06, 2.7976930141448975e-06, 2.9355287551879883e-06, 3.073364496231079e-06, 3.21120023727417e-06, 3.3490359783172607e-06, 3.4868717193603516e-06, 3.6247074604034424e-06, 3.762543201446533e-06, 3.900378942489624e-06, 4.038214683532715e-06, 4.176050424575806e-06, 4.3138861656188965e-06, 4.451721906661987e-06, 4.589557647705078e-06]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 15.0, 15.0, 41.0, 24.0, 32.0, 42.0, 66.0, 70.0, 69.0, 74.0, 81.0, 70.0, 76.0, 44.0, 53.0, 72.0, 30.0, 33.0, 22.0, 18.0, 10.0, 13.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0815059542655945e-06, -2.0172446966171265e-06, -1.9529834389686584e-06, -1.8887221813201904e-06, -1.8244609236717224e-06, -1.7601996660232544e-06, -1.6959384083747864e-06, -1.6316771507263184e-06, -1.5674158930778503e-06, -1.5031546354293823e-06, -1.4388933777809143e-06, -1.3746321201324463e-06, -1.3103708624839783e-06, -1.2461096048355103e-06, -1.1818483471870422e-06, -1.1175870895385742e-06, -1.0533258318901062e-06, -9.890645742416382e-07, -9.248033165931702e-07, -8.605420589447021e-07, -7.962808012962341e-07, -7.320195436477661e-07, -6.677582859992981e-07, -6.034970283508301e-07, -5.392357707023621e-07, -4.7497451305389404e-07, -4.10713255405426e-07, -3.46451997756958e-07, -2.8219074010849e-07, -2.1792948246002197e-07, -1.5366822481155396e-07, -8.940696716308594e-08, -2.514570951461792e-08, 3.91155481338501e-08, 1.0337680578231812e-07, 1.6763806343078613e-07, 2.3189932107925415e-07, 2.9616057872772217e-07, 3.604218363761902e-07, 4.246830940246582e-07, 4.889443516731262e-07, 5.532056093215942e-07, 6.174668669700623e-07, 6.817281246185303e-07, 7.459893822669983e-07, 8.102506399154663e-07, 8.745118975639343e-07, 9.387731552124023e-07, 1.0030344128608704e-06, 1.0672956705093384e-06, 1.1315569281578064e-06, 1.1958181858062744e-06, 1.2600794434547424e-06, 1.3243407011032104e-06, 1.3886019587516785e-06, 1.4528632164001465e-06, 1.5171244740486145e-06, 1.5813857316970825e-06, 1.6456469893455505e-06, 1.7099082469940186e-06, 1.7741695046424866e-06, 1.8384307622909546e-06, 1.9026920199394226e-06, 1.9669532775878906e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 15.0, 7.0, 13.0, 19.0, 21.0, 23.0, 31.0, 58.0, 108.0, 117.0, 155.0, 197.0, 303.0, 484.0, 655.0, 1011.0, 2773.0, 3509.0, 6418.0, 12539.0, 30308.0, 102041.0, 556650.0, 238439.0, 63884.0, 12797.0, 6344.0, 3575.0, 2097.0, 1326.0, 825.0, 551.0, 484.0, 203.0, 152.0, 121.0, 67.0, 51.0, 40.0, 27.0, 36.0, 23.0, 9.0, 14.0, 7.0, 5.0, 2.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.874301910400391e-06, -3.7476420402526855e-06, -3.6209821701049805e-06, -3.4943222999572754e-06, -3.3676624298095703e-06, -3.2410025596618652e-06, -3.11434268951416e-06, -2.987682819366455e-06, -2.86102294921875e-06, -2.734363079071045e-06, -2.60770320892334e-06, -2.4810433387756348e-06, -2.3543834686279297e-06, -2.2277235984802246e-06, -2.1010637283325195e-06, -1.9744038581848145e-06, -1.8477439880371094e-06, -1.7210841178894043e-06, -1.5944242477416992e-06, -1.4677643775939941e-06, -1.341104507446289e-06, -1.214444637298584e-06, -1.087784767150879e-06, -9.611248970031738e-07, -8.344650268554688e-07, -7.078051567077637e-07, -5.811452865600586e-07, -4.544854164123535e-07, -3.2782554626464844e-07, -2.0116567611694336e-07, -7.450580596923828e-08, 5.21540641784668e-08, 1.7881393432617188e-07, 3.0547380447387695e-07, 4.3213367462158203e-07, 5.587935447692871e-07, 6.854534149169922e-07, 8.121132850646973e-07, 9.387731552124023e-07, 1.0654330253601074e-06, 1.1920928955078125e-06, 1.3187527656555176e-06, 1.4454126358032227e-06, 1.5720725059509277e-06, 1.6987323760986328e-06, 1.8253922462463379e-06, 1.952052116394043e-06, 2.078711986541748e-06, 2.205371856689453e-06, 2.332031726837158e-06, 2.4586915969848633e-06, 2.5853514671325684e-06, 2.7120113372802734e-06, 2.8386712074279785e-06, 2.9653310775756836e-06, 3.0919909477233887e-06, 3.2186508178710938e-06, 3.345310688018799e-06, 3.471970558166504e-06, 3.598630428314209e-06, 3.725290298461914e-06, 3.851950168609619e-06, 3.978610038757324e-06, 4.105269908905029e-06, 4.231929779052734e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 6.0, 11.0, 7.0, 5.0, 19.0, 19.0, 14.0, 42.0, 91.0, 71.0, 155.0, 176.0, 60.0, 116.0, 78.0, 24.0, 34.0, 21.0, 12.0, 4.0, 8.0, 9.0, 2.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7418136596679688e-06, -2.641230821609497e-06, -2.5406479835510254e-06, -2.4400651454925537e-06, -2.339482307434082e-06, -2.2388994693756104e-06, -2.1383166313171387e-06, -2.037733793258667e-06, -1.9371509552001953e-06, -1.8365681171417236e-06, -1.735985279083252e-06, -1.6354024410247803e-06, -1.5348196029663086e-06, -1.434236764907837e-06, -1.3336539268493652e-06, -1.2330710887908936e-06, -1.1324882507324219e-06, -1.0319054126739502e-06, -9.313225746154785e-07, -8.307397365570068e-07, -7.301568984985352e-07, -6.295740604400635e-07, -5.289912223815918e-07, -4.284083843231201e-07, -3.2782554626464844e-07, -2.2724270820617676e-07, -1.2665987014770508e-07, -2.60770320892334e-08, 7.450580596923828e-08, 1.7508864402770996e-07, 2.7567148208618164e-07, 3.762543201446533e-07, 4.76837158203125e-07, 5.774199962615967e-07, 6.780028343200684e-07, 7.7858567237854e-07, 8.791685104370117e-07, 9.797513484954834e-07, 1.080334186553955e-06, 1.1809170246124268e-06, 1.2814998626708984e-06, 1.3820827007293701e-06, 1.4826655387878418e-06, 1.5832483768463135e-06, 1.6838312149047852e-06, 1.7844140529632568e-06, 1.8849968910217285e-06, 1.9855797290802e-06, 2.086162567138672e-06, 2.1867454051971436e-06, 2.2873282432556152e-06, 2.387911081314087e-06, 2.4884939193725586e-06, 2.5890767574310303e-06, 2.689659595489502e-06, 2.7902424335479736e-06, 2.8908252716064453e-06, 2.991408109664917e-06, 3.0919909477233887e-06, 3.1925737857818604e-06, 3.293156623840332e-06, 3.3937394618988037e-06, 3.4943222999572754e-06, 3.594905138015747e-06, 3.6954879760742188e-06]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 6.0, 9.0, 10.0, 21.0, 19.0, 25.0, 35.0, 55.0, 75.0, 161.0, 193.0, 77.0, 72.0, 49.0, 47.0, 29.0, 28.0, 18.0, 15.0, 15.0, 10.0, 7.0, 7.0, 0.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017697080329526216, -0.00017161769210360944, -0.00016626458091195673, -0.000160911469720304, -0.00015555837308056653, -0.0001502052618889138, -0.0001448521506972611, -0.00013949903950560838, -0.00013414592831395566, -0.00012879281712230295, -0.00012343970593065023, -0.00011808660201495513, -0.00011273349082330242, -0.00010738038690760732, -0.0001020272757159546, -9.667416452430189e-05, -9.132106060860679e-05, -8.596794941695407e-05, -8.061484550125897e-05, -7.526173430960625e-05, -6.990862311795354e-05, -6.455551192630082e-05, -5.920240801060572e-05, -5.384929681895301e-05, -4.84961892652791e-05, -4.314308171160519e-05, -3.7789970519952476e-05, -3.243686296627857e-05, -2.7083753593615256e-05, -2.1730644220951945e-05, -1.6377536667278036e-05, -1.1024425475625321e-05, -5.671317921951413e-06, -3.182090040354524e-07, 5.034899913880508e-06, 1.0388008377049118e-05, 1.574111774971243e-05, 2.109422712237574e-05, 2.644733467604965e-05, 3.1800445867702365e-05, 3.715355342137627e-05, 4.250666097505018e-05, 4.7859772166702896e-05, 5.3212879720376804e-05, 5.856598727405071e-05, 6.391909846570343e-05, 6.927220965735614e-05, 7.462532084900886e-05, 7.997842476470396e-05, 8.533153595635667e-05, 9.068463987205178e-05, 9.603775106370449e-05, 0.0001013908622553572, 0.00010674397344700992, 0.00011209707736270502, 0.00011745018855435774, 0.00012280329247005284, 0.00012815640366170555, 0.00013350951485335827, 0.00013886261149309576, 0.00014421572268474847, 0.00014956883387640119, 0.0001549219450680539, 0.00016027505625970662, 0.00016562816745135933]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 11.0, 11.0, 16.0, 13.0, 28.0, 32.0, 24.0, 31.0, 30.0, 29.0, 34.0, 40.0, 38.0, 42.0, 39.0, 40.0, 52.0, 43.0, 43.0, 36.0, 42.0, 28.0, 31.0, 35.0, 29.0, 30.0, 20.0, 18.0, 18.0, 21.0, 20.0, 19.0, 10.0, 10.0, 9.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.679794311523438e-05, -9.383261203765869e-05, -9.086728096008301e-05, -8.790194988250732e-05, -8.493661880493164e-05, -8.197128772735596e-05, -7.900595664978027e-05, -7.604062557220459e-05, -7.30752944946289e-05, -7.010996341705322e-05, -6.714463233947754e-05, -6.417930126190186e-05, -6.121397018432617e-05, -5.824863910675049e-05, -5.5283308029174805e-05, -5.231797695159912e-05, -4.935264587402344e-05, -4.6387314796447754e-05, -4.342198371887207e-05, -4.045665264129639e-05, -3.74913215637207e-05, -3.452599048614502e-05, -3.1560659408569336e-05, -2.8595328330993652e-05, -2.562999725341797e-05, -2.2664666175842285e-05, -1.96993350982666e-05, -1.6734004020690918e-05, -1.3768672943115234e-05, -1.080334186553955e-05, -7.838010787963867e-06, -4.872679710388184e-06, -1.9073486328125e-06, 1.0579824447631836e-06, 4.023313522338867e-06, 6.988644599914551e-06, 9.953975677490234e-06, 1.2919306755065918e-05, 1.58846378326416e-05, 1.8849968910217285e-05, 2.181529998779297e-05, 2.4780631065368652e-05, 2.7745962142944336e-05, 3.071129322052002e-05, 3.36766242980957e-05, 3.664195537567139e-05, 3.960728645324707e-05, 4.2572617530822754e-05, 4.553794860839844e-05, 4.850327968597412e-05, 5.1468610763549805e-05, 5.443394184112549e-05, 5.739927291870117e-05, 6.0364603996276855e-05, 6.332993507385254e-05, 6.629526615142822e-05, 6.92605972290039e-05, 7.222592830657959e-05, 7.519125938415527e-05, 7.815659046173096e-05, 8.112192153930664e-05, 8.408725261688232e-05, 8.705258369445801e-05, 9.001791477203369e-05, 9.298324584960938e-05]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 10.0, 14.0, 35.0, 45.0, 79.0, 145.0, 275.0, 426.0, 714.0, 1316.0, 2122.0, 3704.0, 6350.0, 11429.0, 22846.0, 52474.0, 167087.0, 3636127.0, 185635.0, 53460.0, 23027.0, 11320.0, 5987.0, 3425.0, 2127.0, 1345.0, 871.0, 593.0, 377.0, 255.0, 137.0, 148.0, 77.0, 56.0, 37.0, 33.0, 31.0, 22.0, 18.0, 19.0, 11.0, 12.0, 17.0, 11.0, 10.0, 8.0, 1.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.29425048828125e-05, -6.002187728881836e-05, -5.710124969482422e-05, -5.418062210083008e-05, -5.125999450683594e-05, -4.83393669128418e-05, -4.5418739318847656e-05, -4.2498111724853516e-05, -3.9577484130859375e-05, -3.6656856536865234e-05, -3.3736228942871094e-05, -3.081560134887695e-05, -2.7894973754882812e-05, -2.4974346160888672e-05, -2.205371856689453e-05, -1.913309097290039e-05, -1.621246337890625e-05, -1.329183578491211e-05, -1.0371208190917969e-05, -7.450580596923828e-06, -4.5299530029296875e-06, -1.6093254089355469e-06, 1.3113021850585938e-06, 4.231929779052734e-06, 7.152557373046875e-06, 1.0073184967041016e-05, 1.2993812561035156e-05, 1.5914440155029297e-05, 1.8835067749023438e-05, 2.1755695343017578e-05, 2.467632293701172e-05, 2.759695053100586e-05, 3.0517578125e-05, 3.343820571899414e-05, 3.635883331298828e-05, 3.927946090698242e-05, 4.220008850097656e-05, 4.51207160949707e-05, 4.8041343688964844e-05, 5.0961971282958984e-05, 5.3882598876953125e-05, 5.6803226470947266e-05, 5.9723854064941406e-05, 6.264448165893555e-05, 6.556510925292969e-05, 6.848573684692383e-05, 7.140636444091797e-05, 7.432699203491211e-05, 7.724761962890625e-05, 8.016824722290039e-05, 8.308887481689453e-05, 8.600950241088867e-05, 8.893013000488281e-05, 9.185075759887695e-05, 9.47713851928711e-05, 9.769201278686523e-05, 0.00010061264038085938, 0.00010353326797485352, 0.00010645389556884766, 0.0001093745231628418, 0.00011229515075683594, 0.00011521577835083008, 0.00011813640594482422, 0.00012105703353881836, 0.0001239776611328125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 15.0, 12.0, 16.0, 24.0, 31.0, 48.0, 48.0, 70.0, 98.0, 83.0, 115.0, 74.0, 83.0, 67.0, 45.0, 38.0, 38.0, 18.0, 15.0, 12.0, 6.0, 8.0, 6.0, 1.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099742889404297e-05, -1.1538155376911163e-05, -1.097656786441803e-05, -1.0414980351924896e-05, -9.853392839431763e-06, -9.291805326938629e-06, -8.730217814445496e-06, -8.168630301952362e-06, -7.6070427894592285e-06, -7.045455276966095e-06, -6.4838677644729614e-06, -5.922280251979828e-06, -5.360692739486694e-06, -4.799105226993561e-06, -4.237517714500427e-06, -3.6759302020072937e-06, -3.11434268951416e-06, -2.5527551770210266e-06, -1.991167664527893e-06, -1.4295801520347595e-06, -8.67992639541626e-07, -3.0640512704849243e-07, 2.551823854446411e-07, 8.167698979377747e-07, 1.3783574104309082e-06, 1.9399449229240417e-06, 2.5015324354171753e-06, 3.063119947910309e-06, 3.6247074604034424e-06, 4.186294972896576e-06, 4.7478824853897095e-06, 5.309469997882843e-06, 5.8710575103759766e-06, 6.43264502286911e-06, 6.994232535362244e-06, 7.555820047855377e-06, 8.11740756034851e-06, 8.678995072841644e-06, 9.240582585334778e-06, 9.802170097827911e-06, 1.0363757610321045e-05, 1.0925345122814178e-05, 1.1486932635307312e-05, 1.2048520147800446e-05, 1.2610107660293579e-05, 1.3171695172786713e-05, 1.3733282685279846e-05, 1.429487019777298e-05, 1.4856457710266113e-05, 1.5418045222759247e-05, 1.597963273525238e-05, 1.6541220247745514e-05, 1.7102807760238647e-05, 1.766439527273178e-05, 1.8225982785224915e-05, 1.8787570297718048e-05, 1.934915781021118e-05, 1.9910745322704315e-05, 2.047233283519745e-05, 2.1033920347690582e-05, 2.1595507860183716e-05, 2.215709537267685e-05, 2.2718682885169983e-05, 2.3280270397663116e-05, 2.384185791015625e-05]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 7.0, 16.0, 31.0, 43.0, 64.0, 77.0, 124.0, 171.0, 271.0, 399.0, 628.0, 926.0, 1586.0, 2417.0, 4027.0, 6688.0, 10650.0, 19855.0, 36825.0, 73688.0, 162938.0, 1428395.0, 2109077.0, 175973.0, 72154.0, 37851.0, 20203.0, 11394.0, 6520.0, 4197.0, 2536.0, 1596.0, 960.0, 657.0, 423.0, 278.0, 196.0, 132.0, 88.0, 64.0, 33.0, 36.0, 23.0, 19.0, 13.0, 7.0, 5.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0], "bins": [-4.869699478149414e-05, -4.722177982330322e-05, -4.5746564865112305e-05, -4.427134990692139e-05, -4.279613494873047e-05, -4.132091999053955e-05, -3.984570503234863e-05, -3.8370490074157715e-05, -3.68952751159668e-05, -3.542006015777588e-05, -3.394484519958496e-05, -3.246963024139404e-05, -3.0994415283203125e-05, -2.9519200325012207e-05, -2.804398536682129e-05, -2.656877040863037e-05, -2.5093555450439453e-05, -2.3618340492248535e-05, -2.2143125534057617e-05, -2.06679105758667e-05, -1.919269561767578e-05, -1.7717480659484863e-05, -1.6242265701293945e-05, -1.4767050743103027e-05, -1.329183578491211e-05, -1.1816620826721191e-05, -1.0341405868530273e-05, -8.866190910339355e-06, -7.3909759521484375e-06, -5.9157609939575195e-06, -4.4405460357666016e-06, -2.9653310775756836e-06, -1.4901161193847656e-06, -1.4901161193847656e-08, 1.4603137969970703e-06, 2.9355287551879883e-06, 4.410743713378906e-06, 5.885958671569824e-06, 7.361173629760742e-06, 8.83638858795166e-06, 1.0311603546142578e-05, 1.1786818504333496e-05, 1.3262033462524414e-05, 1.4737248420715332e-05, 1.621246337890625e-05, 1.7687678337097168e-05, 1.9162893295288086e-05, 2.0638108253479004e-05, 2.2113323211669922e-05, 2.358853816986084e-05, 2.5063753128051758e-05, 2.6538968086242676e-05, 2.8014183044433594e-05, 2.9489398002624512e-05, 3.096461296081543e-05, 3.243982791900635e-05, 3.3915042877197266e-05, 3.5390257835388184e-05, 3.68654727935791e-05, 3.834068775177002e-05, 3.981590270996094e-05, 4.1291117668151855e-05, 4.2766332626342773e-05, 4.424154758453369e-05, 4.571676254272461e-05]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 4.0, 6.0, 12.0, 14.0, 23.0, 21.0, 25.0, 33.0, 42.0, 53.0, 64.0, 93.0, 85.0, 156.0, 465.0, 1433.0, 679.0, 229.0, 109.0, 73.0, 72.0, 52.0, 53.0, 36.0, 35.0, 31.0, 30.0, 25.0, 24.0, 19.0, 19.0, 11.0, 6.0, 8.0, 9.0, 7.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-05, -2.520531415939331e-05, -2.4184584617614746e-05, -2.316385507583618e-05, -2.2143125534057617e-05, -2.1122395992279053e-05, -2.0101666450500488e-05, -1.9080936908721924e-05, -1.806020736694336e-05, -1.7039477825164795e-05, -1.601874828338623e-05, -1.4998018741607666e-05, -1.3977289199829102e-05, -1.2956559658050537e-05, -1.1935830116271973e-05, -1.0915100574493408e-05, -9.894371032714844e-06, -8.87364149093628e-06, -7.852911949157715e-06, -6.83218240737915e-06, -5.811452865600586e-06, -4.7907233238220215e-06, -3.769993782043457e-06, -2.7492642402648926e-06, -1.7285346984863281e-06, -7.078051567077637e-07, 3.129243850708008e-07, 1.3336539268493652e-06, 2.3543834686279297e-06, 3.375113010406494e-06, 4.395842552185059e-06, 5.416572093963623e-06, 6.4373016357421875e-06, 7.458031177520752e-06, 8.478760719299316e-06, 9.499490261077881e-06, 1.0520219802856445e-05, 1.154094934463501e-05, 1.2561678886413574e-05, 1.3582408428192139e-05, 1.4603137969970703e-05, 1.5623867511749268e-05, 1.6644597053527832e-05, 1.7665326595306396e-05, 1.868605613708496e-05, 1.9706785678863525e-05, 2.072751522064209e-05, 2.1748244762420654e-05, 2.276897430419922e-05, 2.3789703845977783e-05, 2.4810433387756348e-05, 2.5831162929534912e-05, 2.6851892471313477e-05, 2.787262201309204e-05, 2.8893351554870605e-05, 2.991408109664917e-05, 3.0934810638427734e-05, 3.19555401802063e-05, 3.297626972198486e-05, 3.399699926376343e-05, 3.501772880554199e-05, 3.603845834732056e-05, 3.705918788909912e-05, 3.8079917430877686e-05, 3.910064697265625e-05]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 16.0, 16.0, 26.0, 42.0, 68.0, 108.0, 171.0, 128.0, 96.0, 82.0, 44.0, 39.0, 29.0, 18.0, 19.0, 21.0, 17.0, 10.0, 9.0, 5.0, 6.0, 7.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003635537577793002, -0.00035331619437783957, -0.00034307860187254846, -0.00033284100936725736, -0.0003226034459657967, -0.00031236588256433606, -0.00030212829005904496, -0.00029189069755375385, -0.0002816531341522932, -0.00027141557075083256, -0.00026117797824554145, -0.00025094038574025035, -0.0002407028223387897, -0.00023046524438541383, -0.00022022766643203795, -0.00020999008847866207, -0.0001997525105252862, -0.00018951493257191032, -0.00017927735461853445, -0.00016903977666515857, -0.0001588021987117827, -0.00014856462075840682, -0.00013832704280503094, -0.00012808946485165507, -0.00011785188689827919, -0.00010761430894490331, -9.737673099152744e-05, -8.713915303815156e-05, -7.690157508477569e-05, -6.666399713139981e-05, -5.6426419178023934e-05, -4.618884122464806e-05, -3.595126327127218e-05, -2.5713685317896307e-05, -1.547610736452043e-05, -5.238529411144555e-06, 4.999048542231321e-06, 1.5236626495607197e-05, 2.5474204448983073e-05, 3.571178240235895e-05, 4.5949360355734825e-05, 5.61869383091107e-05, 6.642451626248658e-05, 7.666209421586245e-05, 8.689967216923833e-05, 9.71372501226142e-05, 0.00010737482807599008, 0.00011761240602936596, 0.00012784998398274183, 0.0001380875619361177, 0.00014832513988949358, 0.00015856271784286946, 0.00016880029579624534, 0.0001790378737496212, 0.0001892754517029971, 0.00019951302965637296, 0.00020975060760974884, 0.00021998818556312472, 0.0002302257635165006, 0.00024046334146987647, 0.00025070091942325234, 0.000260938482824713, 0.0002711760753300041, 0.0002814136678352952, 0.00029165123123675585]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 3.0, 8.0, 12.0, 9.0, 7.0, 15.0, 14.0, 14.0, 11.0, 16.0, 20.0, 27.0, 27.0, 27.0, 27.0, 39.0, 39.0, 36.0, 33.0, 34.0, 36.0, 29.0, 39.0, 56.0, 30.0, 37.0, 30.0, 36.0, 28.0, 19.0, 27.0, 27.0, 29.0, 22.0, 17.0, 19.0, 16.0, 11.0, 16.0, 10.0, 5.0, 7.0, 3.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0001481175422668457, -0.0001436648890376091, -0.0001392122358083725, -0.0001347595825791359, -0.0001303069293498993, -0.0001258542761206627, -0.00012140162289142609, -0.00011694896966218948, -0.00011249631643295288, -0.00010804366320371628, -0.00010359100997447968, -9.913835674524307e-05, -9.468570351600647e-05, -9.023305028676987e-05, -8.578039705753326e-05, -8.132774382829666e-05, -7.687509059906006e-05, -7.242243736982346e-05, -6.796978414058685e-05, -6.351713091135025e-05, -5.906447768211365e-05, -5.4611824452877045e-05, -5.015917122364044e-05, -4.570651799440384e-05, -4.1253864765167236e-05, -3.6801211535930634e-05, -3.234855830669403e-05, -2.7895905077457428e-05, -2.3443251848220825e-05, -1.8990598618984222e-05, -1.453794538974762e-05, -1.0085292160511017e-05, -5.632638931274414e-06, -1.1799857020378113e-06, 3.2726675271987915e-06, 7.725320756435394e-06, 1.2177973985671997e-05, 1.66306272149086e-05, 2.1083280444145203e-05, 2.5535933673381805e-05, 2.9988586902618408e-05, 3.444124013185501e-05, 3.8893893361091614e-05, 4.3346546590328217e-05, 4.779919981956482e-05, 5.225185304880142e-05, 5.6704506278038025e-05, 6.115715950727463e-05, 6.560981273651123e-05, 7.006246596574783e-05, 7.451511919498444e-05, 7.896777242422104e-05, 8.342042565345764e-05, 8.787307888269424e-05, 9.232573211193085e-05, 9.677838534116745e-05, 0.00010123103857040405, 0.00010568369179964066, 0.00011013634502887726, 0.00011458899825811386, 0.00011904165148735046, 0.00012349430471658707, 0.00012794695794582367, 0.00013239961117506027, 0.00013685226440429688]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 13.0, 16.0, 16.0, 28.0, 34.0, 47.0, 73.0, 142.0, 202.0, 417.0, 765.0, 1555.0, 3318.0, 7780.0, 22208.0, 88186.0, 659185.0, 203788.0, 39730.0, 12183.0, 4673.0, 2029.0, 971.0, 490.0, 274.0, 161.0, 99.0, 49.0, 29.0, 14.0, 28.0, 11.0, 11.0, 5.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001646280288696289, -0.00015974603593349457, -0.00015486404299736023, -0.0001499820500612259, -0.00014510005712509155, -0.00014021806418895721, -0.00013533607125282288, -0.00013045407831668854, -0.0001255720853805542, -0.00012069009244441986, -0.00011580809950828552, -0.00011092610657215118, -0.00010604411363601685, -0.00010116212069988251, -9.628012776374817e-05, -9.139813482761383e-05, -8.651614189147949e-05, -8.163414895534515e-05, -7.675215601921082e-05, -7.187016308307648e-05, -6.698817014694214e-05, -6.21061772108078e-05, -5.722418427467346e-05, -5.2342191338539124e-05, -4.7460198402404785e-05, -4.257820546627045e-05, -3.769621253013611e-05, -3.281421959400177e-05, -2.793222665786743e-05, -2.3050233721733093e-05, -1.8168240785598755e-05, -1.3286247849464417e-05, -8.404254913330078e-06, -3.5222619771957397e-06, 1.3597309589385986e-06, 6.241723895072937e-06, 1.1123716831207275e-05, 1.6005709767341614e-05, 2.0887702703475952e-05, 2.576969563961029e-05, 3.065168857574463e-05, 3.553368151187897e-05, 4.0415674448013306e-05, 4.5297667384147644e-05, 5.017966032028198e-05, 5.506165325641632e-05, 5.994364619255066e-05, 6.4825639128685e-05, 6.970763206481934e-05, 7.458962500095367e-05, 7.947161793708801e-05, 8.435361087322235e-05, 8.923560380935669e-05, 9.411759674549103e-05, 9.899958968162537e-05, 0.0001038815826177597, 0.00010876357555389404, 0.00011364556849002838, 0.00011852756142616272, 0.00012340955436229706, 0.0001282915472984314, 0.00013317354023456573, 0.00013805553317070007, 0.0001429375261068344, 0.00014781951904296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 14.0, 10.0, 25.0, 37.0, 61.0, 77.0, 97.0, 129.0, 108.0, 115.0, 97.0, 54.0, 40.0, 37.0, 23.0, 17.0, 7.0, 7.0, 8.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6808509826660156e-05, -1.611746847629547e-05, -1.5426427125930786e-05, -1.4735385775566101e-05, -1.4044344425201416e-05, -1.3353303074836731e-05, -1.2662261724472046e-05, -1.197122037410736e-05, -1.1280179023742676e-05, -1.058913767337799e-05, -9.898096323013306e-06, -9.20705497264862e-06, -8.516013622283936e-06, -7.82497227191925e-06, -7.1339309215545654e-06, -6.44288957118988e-06, -5.751848220825195e-06, -5.06080687046051e-06, -4.369765520095825e-06, -3.67872416973114e-06, -2.987682819366455e-06, -2.29664146900177e-06, -1.605600118637085e-06, -9.145587682723999e-07, -2.2351741790771484e-07, 4.675239324569702e-07, 1.1585652828216553e-06, 1.8496066331863403e-06, 2.5406479835510254e-06, 3.2316893339157104e-06, 3.9227306842803955e-06, 4.6137720346450806e-06, 5.304813385009766e-06, 5.995854735374451e-06, 6.686896085739136e-06, 7.377937436103821e-06, 8.068978786468506e-06, 8.760020136833191e-06, 9.451061487197876e-06, 1.0142102837562561e-05, 1.0833144187927246e-05, 1.1524185538291931e-05, 1.2215226888656616e-05, 1.2906268239021301e-05, 1.3597309589385986e-05, 1.4288350939750671e-05, 1.4979392290115356e-05, 1.567043364048004e-05, 1.6361474990844727e-05, 1.705251634120941e-05, 1.7743557691574097e-05, 1.8434599041938782e-05, 1.9125640392303467e-05, 1.9816681742668152e-05, 2.0507723093032837e-05, 2.1198764443397522e-05, 2.1889805793762207e-05, 2.2580847144126892e-05, 2.3271888494491577e-05, 2.3962929844856262e-05, 2.4653971195220947e-05, 2.5345012545585632e-05, 2.6036053895950317e-05, 2.6727095246315002e-05, 2.7418136596679688e-05]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 17.0, 19.0, 28.0, 52.0, 55.0, 92.0, 136.0, 186.0, 291.0, 427.0, 647.0, 973.0, 1564.0, 2632.0, 4009.0, 6551.0, 10532.0, 17689.0, 30062.0, 53857.0, 100642.0, 248020.0, 317895.0, 111712.0, 60279.0, 32280.0, 18481.0, 10949.0, 6689.0, 4291.0, 2634.0, 1651.0, 1104.0, 694.0, 506.0, 306.0, 198.0, 140.0, 88.0, 59.0, 27.0, 34.0, 11.0, 16.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.7789344787597656e-05, -3.653205931186676e-05, -3.5274773836135864e-05, -3.401748836040497e-05, -3.276020288467407e-05, -3.1502917408943176e-05, -3.024563193321228e-05, -2.8988346457481384e-05, -2.7731060981750488e-05, -2.6473775506019592e-05, -2.5216490030288696e-05, -2.39592045545578e-05, -2.2701919078826904e-05, -2.1444633603096008e-05, -2.0187348127365112e-05, -1.8930062651634216e-05, -1.767277717590332e-05, -1.6415491700172424e-05, -1.5158206224441528e-05, -1.3900920748710632e-05, -1.2643635272979736e-05, -1.138634979724884e-05, -1.0129064321517944e-05, -8.871778845787048e-06, -7.614493370056152e-06, -6.357207894325256e-06, -5.09992241859436e-06, -3.842636942863464e-06, -2.5853514671325684e-06, -1.3280659914016724e-06, -7.078051567077637e-08, 1.1865049600601196e-06, 2.4437904357910156e-06, 3.7010759115219116e-06, 4.958361387252808e-06, 6.215646862983704e-06, 7.4729323387146e-06, 8.730217814445496e-06, 9.987503290176392e-06, 1.1244788765907288e-05, 1.2502074241638184e-05, 1.375935971736908e-05, 1.5016645193099976e-05, 1.627393066883087e-05, 1.7531216144561768e-05, 1.8788501620292664e-05, 2.004578709602356e-05, 2.1303072571754456e-05, 2.256035804748535e-05, 2.3817643523216248e-05, 2.5074928998947144e-05, 2.633221447467804e-05, 2.7589499950408936e-05, 2.884678542613983e-05, 3.0104070901870728e-05, 3.1361356377601624e-05, 3.261864185333252e-05, 3.3875927329063416e-05, 3.513321280479431e-05, 3.639049828052521e-05, 3.7647783756256104e-05, 3.8905069231987e-05, 4.0162354707717896e-05, 4.141964018344879e-05, 4.267692565917969e-05]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 6.0, 6.0, 10.0, 14.0, 13.0, 19.0, 17.0, 25.0, 33.0, 35.0, 37.0, 30.0, 26.0, 43.0, 39.0, 41.0, 44.0, 41.0, 44.0, 45.0, 44.0, 37.0, 30.0, 43.0, 29.0, 38.0, 30.0, 21.0, 31.0, 20.0, 14.0, 11.0, 14.0, 11.0, 11.0, 3.0, 11.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.504753112792969e-05, -3.41217964887619e-05, -3.3196061849594116e-05, -3.227032721042633e-05, -3.1344592571258545e-05, -3.041885793209076e-05, -2.9493123292922974e-05, -2.8567388653755188e-05, -2.7641654014587402e-05, -2.6715919375419617e-05, -2.579018473625183e-05, -2.4864450097084045e-05, -2.393871545791626e-05, -2.3012980818748474e-05, -2.208724617958069e-05, -2.1161511540412903e-05, -2.0235776901245117e-05, -1.931004226207733e-05, -1.8384307622909546e-05, -1.745857298374176e-05, -1.6532838344573975e-05, -1.560710370540619e-05, -1.4681369066238403e-05, -1.3755634427070618e-05, -1.2829899787902832e-05, -1.1904165148735046e-05, -1.097843050956726e-05, -1.0052695870399475e-05, -9.12696123123169e-06, -8.201226592063904e-06, -7.275491952896118e-06, -6.3497573137283325e-06, -5.424022674560547e-06, -4.498288035392761e-06, -3.5725533962249756e-06, -2.64681875705719e-06, -1.7210841178894043e-06, -7.953494787216187e-07, 1.30385160446167e-07, 1.0561197996139526e-06, 1.9818544387817383e-06, 2.907589077949524e-06, 3.8333237171173096e-06, 4.759058356285095e-06, 5.684792995452881e-06, 6.6105276346206665e-06, 7.536262273788452e-06, 8.461996912956238e-06, 9.387731552124023e-06, 1.0313466191291809e-05, 1.1239200830459595e-05, 1.216493546962738e-05, 1.3090670108795166e-05, 1.4016404747962952e-05, 1.4942139387130737e-05, 1.5867874026298523e-05, 1.679360866546631e-05, 1.7719343304634094e-05, 1.864507794380188e-05, 1.9570812582969666e-05, 2.049654722213745e-05, 2.1422281861305237e-05, 2.2348016500473022e-05, 2.3273751139640808e-05, 2.4199485778808594e-05]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 5.0, 2.0, 4.0, 8.0, 9.0, 19.0, 9.0, 8.0, 30.0, 38.0, 73.0, 64.0, 70.0, 206.0, 180.0, 507.0, 328.0, 556.0, 1688.0, 1327.0, 4521.0, 3843.0, 5674.0, 21266.0, 19938.0, 82324.0, 88155.0, 162090.0, 425491.0, 87774.0, 82275.0, 19769.0, 21154.0, 5719.0, 3789.0, 4467.0, 1347.0, 1629.0, 539.0, 373.0, 556.0, 175.0, 206.0, 91.0, 49.0, 92.0, 29.0, 42.0, 14.0, 11.0, 5.0, 5.0, 9.0, 2.0, 5.0, 7.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.682209014892578e-06, -2.598389983177185e-06, -2.514570951461792e-06, -2.430751919746399e-06, -2.346932888031006e-06, -2.263113856315613e-06, -2.1792948246002197e-06, -2.0954757928848267e-06, -2.0116567611694336e-06, -1.9278377294540405e-06, -1.8440186977386475e-06, -1.7601996660232544e-06, -1.6763806343078613e-06, -1.5925616025924683e-06, -1.5087425708770752e-06, -1.4249235391616821e-06, -1.341104507446289e-06, -1.257285475730896e-06, -1.173466444015503e-06, -1.0896474123001099e-06, -1.0058283805847168e-06, -9.220093488693237e-07, -8.381903171539307e-07, -7.543712854385376e-07, -6.705522537231445e-07, -5.867332220077515e-07, -5.029141902923584e-07, -4.1909515857696533e-07, -3.3527612686157227e-07, -2.514570951461792e-07, -1.6763806343078613e-07, -8.381903171539307e-08, 0.0, 8.381903171539307e-08, 1.6763806343078613e-07, 2.514570951461792e-07, 3.3527612686157227e-07, 4.1909515857696533e-07, 5.029141902923584e-07, 5.867332220077515e-07, 6.705522537231445e-07, 7.543712854385376e-07, 8.381903171539307e-07, 9.220093488693237e-07, 1.0058283805847168e-06, 1.0896474123001099e-06, 1.173466444015503e-06, 1.257285475730896e-06, 1.341104507446289e-06, 1.4249235391616821e-06, 1.5087425708770752e-06, 1.5925616025924683e-06, 1.6763806343078613e-06, 1.7601996660232544e-06, 1.8440186977386475e-06, 1.9278377294540405e-06, 2.0116567611694336e-06, 2.0954757928848267e-06, 2.1792948246002197e-06, 2.263113856315613e-06, 2.346932888031006e-06, 2.430751919746399e-06, 2.514570951461792e-06, 2.598389983177185e-06, 2.682209014892578e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 7.0, 6.0, 14.0, 16.0, 19.0, 0.0, 25.0, 41.0, 33.0, 41.0, 0.0, 44.0, 51.0, 66.0, 93.0, 0.0, 72.0, 60.0, 64.0, 68.0, 51.0, 0.0, 45.0, 38.0, 38.0, 31.0, 0.0, 25.0, 18.0, 11.0, 10.0, 0.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5012919902801514e-06, -1.4528632164001465e-06, -1.4044344425201416e-06, -1.3560056686401367e-06, -1.3075768947601318e-06, -1.259148120880127e-06, -1.210719347000122e-06, -1.1622905731201172e-06, -1.1138617992401123e-06, -1.0654330253601074e-06, -1.0170042514801025e-06, -9.685754776000977e-07, -9.201467037200928e-07, -8.717179298400879e-07, -8.23289155960083e-07, -7.748603820800781e-07, -7.264316082000732e-07, -6.780028343200684e-07, -6.295740604400635e-07, -5.811452865600586e-07, -5.327165126800537e-07, -4.842877388000488e-07, -4.3585896492004395e-07, -3.8743019104003906e-07, -3.390014171600342e-07, -2.905726432800293e-07, -2.421438694000244e-07, -1.9371509552001953e-07, -1.4528632164001465e-07, -9.685754776000977e-08, -4.842877388000488e-08, 0.0, 4.842877388000488e-08, 9.685754776000977e-08, 1.4528632164001465e-07, 1.9371509552001953e-07, 2.421438694000244e-07, 2.905726432800293e-07, 3.390014171600342e-07, 3.8743019104003906e-07, 4.3585896492004395e-07, 4.842877388000488e-07, 5.327165126800537e-07, 5.811452865600586e-07, 6.295740604400635e-07, 6.780028343200684e-07, 7.264316082000732e-07, 7.748603820800781e-07, 8.23289155960083e-07, 8.717179298400879e-07, 9.201467037200928e-07, 9.685754776000977e-07, 1.0170042514801025e-06, 1.0654330253601074e-06, 1.1138617992401123e-06, 1.1622905731201172e-06, 1.210719347000122e-06, 1.259148120880127e-06, 1.3075768947601318e-06, 1.3560056686401367e-06, 1.4044344425201416e-06, 1.4528632164001465e-06, 1.5012919902801514e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 10.0, 11.0, 16.0, 28.0, 36.0, 34.0, 59.0, 77.0, 119.0, 161.0, 217.0, 311.0, 482.0, 742.0, 1104.0, 1661.0, 2510.0, 4045.0, 6836.0, 11404.0, 19992.0, 37207.0, 75391.0, 177610.0, 368661.0, 177323.0, 75559.0, 37202.0, 20069.0, 11401.0, 6548.0, 4120.0, 2561.0, 1654.0, 1032.0, 745.0, 474.0, 358.0, 241.0, 136.0, 116.0, 73.0, 66.0, 42.0, 32.0, 22.0, 16.0, 15.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0], "bins": [-2.0265579223632812e-06, -1.967884600162506e-06, -1.909211277961731e-06, -1.8505379557609558e-06, -1.7918646335601807e-06, -1.7331913113594055e-06, -1.6745179891586304e-06, -1.6158446669578552e-06, -1.55717134475708e-06, -1.498498022556305e-06, -1.4398247003555298e-06, -1.3811513781547546e-06, -1.3224780559539795e-06, -1.2638047337532043e-06, -1.2051314115524292e-06, -1.146458089351654e-06, -1.087784767150879e-06, -1.0291114449501038e-06, -9.704381227493286e-07, -9.117648005485535e-07, -8.530914783477783e-07, -7.944181561470032e-07, -7.35744833946228e-07, -6.770715117454529e-07, -6.183981895446777e-07, -5.597248673439026e-07, -5.010515451431274e-07, -4.423782229423523e-07, -3.8370490074157715e-07, -3.25031578540802e-07, -2.6635825634002686e-07, -2.076849341392517e-07, -1.4901161193847656e-07, -9.033828973770142e-08, -3.166496753692627e-08, 2.7008354663848877e-08, 8.568167686462402e-08, 1.4435499906539917e-07, 2.0302832126617432e-07, 2.6170164346694946e-07, 3.203749656677246e-07, 3.7904828786849976e-07, 4.377216100692749e-07, 4.9639493227005e-07, 5.550682544708252e-07, 6.137415766716003e-07, 6.724148988723755e-07, 7.310882210731506e-07, 7.897615432739258e-07, 8.484348654747009e-07, 9.071081876754761e-07, 9.657815098762512e-07, 1.0244548320770264e-06, 1.0831281542778015e-06, 1.1418014764785767e-06, 1.2004747986793518e-06, 1.259148120880127e-06, 1.317821443080902e-06, 1.3764947652816772e-06, 1.4351680874824524e-06, 1.4938414096832275e-06, 1.5525147318840027e-06, 1.6111880540847778e-06, 1.669861376285553e-06, 1.7285346984863281e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 6.0, 9.0, 0.0, 13.0, 13.0, 20.0, 22.0, 0.0, 36.0, 39.0, 47.0, 49.0, 0.0, 56.0, 72.0, 72.0, 66.0, 0.0, 68.0, 81.0, 76.0, 44.0, 0.0, 55.0, 31.0, 24.0, 25.0, 0.0, 18.0, 16.0, 11.0, 8.0, 0.0, 12.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.323409378528595e-06, -1.2759119272232056e-06, -1.2284144759178162e-06, -1.1809170246124268e-06, -1.1334195733070374e-06, -1.085922122001648e-06, -1.0384246706962585e-06, -9.909272193908691e-07, -9.434297680854797e-07, -8.959323167800903e-07, -8.484348654747009e-07, -8.009374141693115e-07, -7.534399628639221e-07, -7.059425115585327e-07, -6.584450602531433e-07, -6.109476089477539e-07, -5.634501576423645e-07, -5.159527063369751e-07, -4.684552550315857e-07, -4.209578037261963e-07, -3.734603524208069e-07, -3.259629011154175e-07, -2.784654498100281e-07, -2.3096799850463867e-07, -1.8347054719924927e-07, -1.3597309589385986e-07, -8.847564458847046e-08, -4.0978193283081055e-08, 6.51925802230835e-09, 5.4016709327697754e-08, 1.0151416063308716e-07, 1.4901161193847656e-07, 1.9650906324386597e-07, 2.4400651454925537e-07, 2.915039658546448e-07, 3.390014171600342e-07, 3.864988684654236e-07, 4.33996319770813e-07, 4.814937710762024e-07, 5.289912223815918e-07, 5.764886736869812e-07, 6.239861249923706e-07, 6.7148357629776e-07, 7.189810276031494e-07, 7.664784789085388e-07, 8.139759302139282e-07, 8.614733815193176e-07, 9.08970832824707e-07, 9.564682841300964e-07, 1.0039657354354858e-06, 1.0514631867408752e-06, 1.0989606380462646e-06, 1.146458089351654e-06, 1.1939555406570435e-06, 1.2414529919624329e-06, 1.2889504432678223e-06, 1.3364478945732117e-06, 1.383945345878601e-06, 1.4314427971839905e-06, 1.4789402484893799e-06, 1.5264376997947693e-06, 1.5739351511001587e-06, 1.621432602405548e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 8.0, 7.0, 8.0, 16.0, 25.0, 23.0, 36.0, 43.0, 89.0, 176.0, 123.0, 88.0, 59.0, 56.0, 39.0, 29.0, 27.0, 22.0, 27.0, 15.0, 15.0, 8.0, 13.0, 3.0, 3.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.557600813219324e-05, -8.14294908195734e-05, -7.728297350695357e-05, -7.313645619433373e-05, -6.898994615767151e-05, -6.484342884505168e-05, -6.069691153243184e-05, -5.6550394219812006e-05, -5.240388054517098e-05, -4.825736323255114e-05, -4.4110849557910115e-05, -3.996433224529028e-05, -3.5817814932670444e-05, -3.1671301258029416e-05, -2.752478394540958e-05, -2.337826845177915e-05, -1.9231752958148718e-05, -1.5085237464518286e-05, -1.0938721061393153e-05, -6.7922046582680196e-06, -2.645689164637588e-06, 1.5008263289928436e-06, 5.647343641612679e-06, 9.79385913524311e-06, 1.3940374628873542e-05, 1.8086890122503974e-05, 2.2233405616134405e-05, 2.637992292875424e-05, 3.0526440241374075e-05, 3.4672953916015103e-05, 3.881947122863494e-05, 4.296598490327597e-05, 4.711249493993819e-05, 5.125901225255802e-05, 5.540552592719905e-05, 5.9552043239818886e-05, 6.369855691445991e-05, 6.784507422707975e-05, 7.199159153969958e-05, 7.613810885231942e-05, 8.028461888898164e-05, 8.443113620160148e-05, 8.857765351422131e-05, 9.272416355088353e-05, 9.687068086350337e-05, 0.0001010171981761232, 0.00010516371548874304, 0.00010931023280136287, 0.00011345675011398271, 0.00011760326742660254, 0.00012174978473922238, 0.0001258963020518422, 0.00013004281208850443, 0.00013418932212516665, 0.0001383358467137441, 0.00014248235675040632, 0.00014662888133898377, 0.000150775391375646, 0.00015492191596422344, 0.00015906842600088567, 0.00016321495058946311, 0.00016736146062612534, 0.00017150797066278756, 0.000175654495251365, 0.00017980100528802723]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 6.0, 4.0, 4.0, 10.0, 14.0, 23.0, 19.0, 19.0, 19.0, 24.0, 29.0, 39.0, 43.0, 30.0, 37.0, 41.0, 40.0, 43.0, 47.0, 47.0, 52.0, 37.0, 45.0, 32.0, 31.0, 35.0, 21.0, 25.0, 35.0, 26.0, 20.0, 17.0, 16.0, 11.0, 11.0, 14.0, 6.0, 8.0, 8.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001023411750793457, -9.934324771165848e-05, -9.634532034397125e-05, -9.334739297628403e-05, -9.03494656085968e-05, -8.735153824090958e-05, -8.435361087322235e-05, -8.135568350553513e-05, -7.83577561378479e-05, -7.535982877016068e-05, -7.236190140247345e-05, -6.936397403478622e-05, -6.6366046667099e-05, -6.336811929941177e-05, -6.037019193172455e-05, -5.737226456403732e-05, -5.43743371963501e-05, -5.137640982866287e-05, -4.837848246097565e-05, -4.538055509328842e-05, -4.2382627725601196e-05, -3.938470035791397e-05, -3.6386772990226746e-05, -3.338884562253952e-05, -3.0390918254852295e-05, -2.739299088716507e-05, -2.4395063519477844e-05, -2.139713615179062e-05, -1.8399208784103394e-05, -1.5401281416416168e-05, -1.2403354048728943e-05, -9.405426681041718e-06, -6.407499313354492e-06, -3.409571945667267e-06, -4.116445779800415e-07, 2.586282789707184e-06, 5.584210157394409e-06, 8.582137525081635e-06, 1.158006489276886e-05, 1.4577992260456085e-05, 1.757591962814331e-05, 2.0573846995830536e-05, 2.357177436351776e-05, 2.6569701731204987e-05, 2.9567629098892212e-05, 3.256555646657944e-05, 3.556348383426666e-05, 3.856141120195389e-05, 4.155933856964111e-05, 4.455726593732834e-05, 4.7555193305015564e-05, 5.055312067270279e-05, 5.3551048040390015e-05, 5.654897540807724e-05, 5.9546902775764465e-05, 6.254483014345169e-05, 6.554275751113892e-05, 6.854068487882614e-05, 7.153861224651337e-05, 7.453653961420059e-05, 7.753446698188782e-05, 8.053239434957504e-05, 8.353032171726227e-05, 8.65282490849495e-05, 8.952617645263672e-05]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 11.0, 8.0, 15.0, 18.0, 33.0, 49.0, 83.0, 100.0, 144.0, 211.0, 277.0, 416.0, 633.0, 852.0, 1263.0, 1839.0, 2800.0, 4458.0, 7690.0, 14302.0, 29779.0, 78541.0, 3634638.0, 305342.0, 54172.0, 23819.0, 12041.0, 6901.0, 4348.0, 2969.0, 1876.0, 1326.0, 980.0, 628.0, 464.0, 335.0, 245.0, 175.0, 136.0, 109.0, 68.0, 44.0, 30.0, 35.0, 16.0, 24.0, 7.0, 12.0, 6.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.356571197509766e-05, -8.033029735088348e-05, -7.709488272666931e-05, -7.385946810245514e-05, -7.062405347824097e-05, -6.73886388540268e-05, -6.415322422981262e-05, -6.091780960559845e-05, -5.768239498138428e-05, -5.4446980357170105e-05, -5.121156573295593e-05, -4.797615110874176e-05, -4.474073648452759e-05, -4.1505321860313416e-05, -3.826990723609924e-05, -3.503449261188507e-05, -3.17990779876709e-05, -2.8563663363456726e-05, -2.5328248739242554e-05, -2.209283411502838e-05, -1.885741949081421e-05, -1.5622004866600037e-05, -1.2386590242385864e-05, -9.151175618171692e-06, -5.9157609939575195e-06, -2.680346369743347e-06, 5.550682544708252e-07, 3.7904828786849976e-06, 7.02589750289917e-06, 1.0261312127113342e-05, 1.3496726751327515e-05, 1.6732141375541687e-05, 1.996755599975586e-05, 2.3202970623970032e-05, 2.6438385248184204e-05, 2.9673799872398376e-05, 3.290921449661255e-05, 3.614462912082672e-05, 3.9380043745040894e-05, 4.2615458369255066e-05, 4.585087299346924e-05, 4.908628761768341e-05, 5.232170224189758e-05, 5.5557116866111755e-05, 5.879253149032593e-05, 6.20279461145401e-05, 6.526336073875427e-05, 6.849877536296844e-05, 7.173418998718262e-05, 7.496960461139679e-05, 7.820501923561096e-05, 8.144043385982513e-05, 8.46758484840393e-05, 8.791126310825348e-05, 9.114667773246765e-05, 9.438209235668182e-05, 9.7617506980896e-05, 0.00010085292160511017, 0.00010408833622932434, 0.00010732375085353851, 0.00011055916547775269, 0.00011379458010196686, 0.00011702999472618103, 0.0001202654093503952, 0.00012350082397460938]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 3.0, 5.0, 8.0, 13.0, 17.0, 29.0, 26.0, 40.0, 48.0, 68.0, 83.0, 79.0, 97.0, 82.0, 84.0, 61.0, 53.0, 32.0, 33.0, 23.0, 21.0, 19.0, 5.0, 8.0, 7.0, 2.0, 7.0, 7.0, 1.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.245737075805664e-05, -1.194886863231659e-05, -1.1440366506576538e-05, -1.0931864380836487e-05, -1.0423362255096436e-05, -9.914860129356384e-06, -9.406358003616333e-06, -8.897855877876282e-06, -8.38935375213623e-06, -7.88085162639618e-06, -7.372349500656128e-06, -6.863847374916077e-06, -6.355345249176025e-06, -5.846843123435974e-06, -5.338340997695923e-06, -4.829838871955872e-06, -4.32133674621582e-06, -3.812834620475769e-06, -3.3043324947357178e-06, -2.7958303689956665e-06, -2.2873282432556152e-06, -1.778826117515564e-06, -1.2703239917755127e-06, -7.618218660354614e-07, -2.5331974029541016e-07, 2.551823854446411e-07, 7.636845111846924e-07, 1.2721866369247437e-06, 1.780688762664795e-06, 2.289190888404846e-06, 2.7976930141448975e-06, 3.3061951398849487e-06, 3.814697265625e-06, 4.323199391365051e-06, 4.8317015171051025e-06, 5.340203642845154e-06, 5.848705768585205e-06, 6.357207894325256e-06, 6.865710020065308e-06, 7.374212145805359e-06, 7.88271427154541e-06, 8.391216397285461e-06, 8.899718523025513e-06, 9.408220648765564e-06, 9.916722774505615e-06, 1.0425224900245667e-05, 1.0933727025985718e-05, 1.1442229151725769e-05, 1.195073127746582e-05, 1.2459233403205872e-05, 1.2967735528945923e-05, 1.3476237654685974e-05, 1.3984739780426025e-05, 1.4493241906166077e-05, 1.5001744031906128e-05, 1.551024615764618e-05, 1.601874828338623e-05, 1.6527250409126282e-05, 1.7035752534866333e-05, 1.7544254660606384e-05, 1.8052756786346436e-05, 1.8561258912086487e-05, 1.9069761037826538e-05, 1.957826316356659e-05, 2.008676528930664e-05]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 15.0, 28.0, 30.0, 34.0, 73.0, 101.0, 151.0, 218.0, 310.0, 523.0, 854.0, 1153.0, 2030.0, 3269.0, 5439.0, 9608.0, 17281.0, 33941.0, 72774.0, 222589.0, 3416437.0, 247546.0, 79843.0, 36499.0, 18729.0, 10027.0, 5584.0, 3465.0, 2027.0, 1300.0, 819.0, 529.0, 321.0, 223.0, 156.0, 102.0, 76.0, 58.0, 33.0, 23.0, 18.0, 13.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.157159805297852e-05, -5.973596125841141e-05, -5.79003244638443e-05, -5.606468766927719e-05, -5.422905087471008e-05, -5.2393414080142975e-05, -5.055777728557587e-05, -4.872214049100876e-05, -4.688650369644165e-05, -4.505086690187454e-05, -4.3215230107307434e-05, -4.1379593312740326e-05, -3.954395651817322e-05, -3.770831972360611e-05, -3.5872682929039e-05, -3.403704613447189e-05, -3.2201409339904785e-05, -3.0365772545337677e-05, -2.853013575077057e-05, -2.669449895620346e-05, -2.4858862161636353e-05, -2.3023225367069244e-05, -2.1187588572502136e-05, -1.9351951777935028e-05, -1.751631498336792e-05, -1.5680678188800812e-05, -1.3845041394233704e-05, -1.2009404599666595e-05, -1.0173767805099487e-05, -8.338131010532379e-06, -6.502494215965271e-06, -4.666857421398163e-06, -2.8312206268310547e-06, -9.955838322639465e-07, 8.400529623031616e-07, 2.6756897568702698e-06, 4.511326551437378e-06, 6.346963346004486e-06, 8.182600140571594e-06, 1.0018236935138702e-05, 1.185387372970581e-05, 1.3689510524272919e-05, 1.5525147318840027e-05, 1.7360784113407135e-05, 1.9196420907974243e-05, 2.103205770254135e-05, 2.286769449710846e-05, 2.4703331291675568e-05, 2.6538968086242676e-05, 2.8374604880809784e-05, 3.0210241675376892e-05, 3.2045878469944e-05, 3.388151526451111e-05, 3.5717152059078217e-05, 3.7552788853645325e-05, 3.938842564821243e-05, 4.122406244277954e-05, 4.305969923734665e-05, 4.489533603191376e-05, 4.6730972826480865e-05, 4.8566609621047974e-05, 5.040224641561508e-05, 5.223788321018219e-05, 5.40735200047493e-05, 5.5909156799316406e-05]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 7.0, 3.0, 6.0, 8.0, 16.0, 15.0, 19.0, 24.0, 27.0, 31.0, 43.0, 50.0, 73.0, 107.0, 281.0, 1676.0, 980.0, 229.0, 96.0, 56.0, 52.0, 45.0, 40.0, 26.0, 36.0, 24.0, 26.0, 8.0, 16.0, 10.0, 10.0, 5.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4928321838378906e-05, -3.3834949135780334e-05, -3.274157643318176e-05, -3.164820373058319e-05, -3.055483102798462e-05, -2.9461458325386047e-05, -2.8368085622787476e-05, -2.7274712920188904e-05, -2.6181340217590332e-05, -2.508796751499176e-05, -2.399459481239319e-05, -2.2901222109794617e-05, -2.1807849407196045e-05, -2.0714476704597473e-05, -1.96211040019989e-05, -1.852773129940033e-05, -1.7434358596801758e-05, -1.6340985894203186e-05, -1.5247613191604614e-05, -1.4154240489006042e-05, -1.306086778640747e-05, -1.1967495083808899e-05, -1.0874122381210327e-05, -9.780749678611755e-06, -8.687376976013184e-06, -7.594004273414612e-06, -6.50063157081604e-06, -5.407258868217468e-06, -4.3138861656188965e-06, -3.2205134630203247e-06, -2.127140760421753e-06, -1.0337680578231812e-06, 5.960464477539063e-08, 1.1529773473739624e-06, 2.246350049972534e-06, 3.339722752571106e-06, 4.433095455169678e-06, 5.5264681577682495e-06, 6.619840860366821e-06, 7.713213562965393e-06, 8.806586265563965e-06, 9.899958968162537e-06, 1.0993331670761108e-05, 1.208670437335968e-05, 1.3180077075958252e-05, 1.4273449778556824e-05, 1.5366822481155396e-05, 1.6460195183753967e-05, 1.755356788635254e-05, 1.864694058895111e-05, 1.9740313291549683e-05, 2.0833685994148254e-05, 2.1927058696746826e-05, 2.3020431399345398e-05, 2.411380410194397e-05, 2.520717680454254e-05, 2.6300549507141113e-05, 2.7393922209739685e-05, 2.8487294912338257e-05, 2.958066761493683e-05, 3.06740403175354e-05, 3.176741302013397e-05, 3.2860785722732544e-05, 3.3954158425331116e-05, 3.504753112792969e-05]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 9.0, 17.0, 20.0, 37.0, 57.0, 73.0, 105.0, 163.0, 114.0, 93.0, 67.0, 48.0, 31.0, 33.0, 18.0, 19.0, 16.0, 15.0, 7.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021992232359480113, -0.0002124725142493844, -0.00020502270490396768, -0.00019757289555855095, -0.00019012308621313423, -0.0001826732768677175, -0.00017522346752230078, -0.00016777365817688406, -0.00016032384883146733, -0.0001528740394860506, -0.00014542423014063388, -0.00013797442079521716, -0.00013052461144980043, -0.0001230748021043837, -0.00011562499275896698, -0.00010817518341355026, -0.00010072537406813353, -9.327556472271681e-05, -8.582575537730008e-05, -7.837594603188336e-05, -7.092613668646663e-05, -6.347632734104991e-05, -5.6026517995633185e-05, -4.857670865021646e-05, -4.1126899304799736e-05, -3.367708995938301e-05, -2.6227280613966286e-05, -1.877747126854956e-05, -1.1327661923132837e-05, -3.877852577716112e-06, 3.5719567677006125e-06, 1.1021766113117337e-05, 1.847159001044929e-05, 2.5921399355866015e-05, 3.337120870128274e-05, 4.0821018046699464e-05, 4.827082739211619e-05, 5.5720636737532914e-05, 6.317044608294964e-05, 7.062025542836636e-05, 7.807006477378309e-05, 8.551987411919981e-05, 9.296968346461654e-05, 0.00010041949281003326, 0.00010786930215544999, 0.00011531911150086671, 0.00012276892084628344, 0.00013021873019170016, 0.00013766853953711689, 0.0001451183488825336, 0.00015256815822795033, 0.00016001796757336706, 0.00016746777691878378, 0.0001749175862642005, 0.00018236739560961723, 0.00018981720495503396, 0.00019726701430045068, 0.0002047168236458674, 0.00021216663299128413, 0.00021961644233670086, 0.00022706625168211758, 0.0002345160610275343, 0.00024196587037295103, 0.000249415694270283, 0.0002568654890637845]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 8.0, 13.0, 11.0, 13.0, 13.0, 13.0, 25.0, 27.0, 26.0, 24.0, 34.0, 33.0, 26.0, 43.0, 37.0, 46.0, 41.0, 41.0, 39.0, 38.0, 45.0, 39.0, 35.0, 44.0, 26.0, 28.0, 28.0, 24.0, 24.0, 22.0, 22.0, 23.0, 14.0, 14.0, 12.0, 10.0, 10.0, 3.0, 2.0, 3.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010186433792114258, -9.807292371988297e-05, -9.428150951862335e-05, -9.049009531736374e-05, -8.669868111610413e-05, -8.290726691484451e-05, -7.91158527135849e-05, -7.532443851232529e-05, -7.153302431106567e-05, -6.774161010980606e-05, -6.395019590854645e-05, -6.0158781707286835e-05, -5.636736750602722e-05, -5.257595330476761e-05, -4.8784539103507996e-05, -4.499312490224838e-05, -4.120171070098877e-05, -3.7410296499729156e-05, -3.3618882298469543e-05, -2.982746809720993e-05, -2.6036053895950317e-05, -2.2244639694690704e-05, -1.845322549343109e-05, -1.4661811292171478e-05, -1.0870397090911865e-05, -7.078982889652252e-06, -3.287568688392639e-06, 5.038455128669739e-07, 4.295259714126587e-06, 8.0866739153862e-06, 1.1878088116645813e-05, 1.5669502317905426e-05, 1.946091651916504e-05, 2.3252330720424652e-05, 2.7043744921684265e-05, 3.083515912294388e-05, 3.462657332420349e-05, 3.8417987525463104e-05, 4.220940172672272e-05, 4.600081592798233e-05, 4.979223012924194e-05, 5.3583644330501556e-05, 5.737505853176117e-05, 6.116647273302078e-05, 6.49578869342804e-05, 6.874930113554001e-05, 7.254071533679962e-05, 7.633212953805923e-05, 8.012354373931885e-05, 8.391495794057846e-05, 8.770637214183807e-05, 9.149778634309769e-05, 9.52892005443573e-05, 9.908061474561691e-05, 0.00010287202894687653, 0.00010666344314813614, 0.00011045485734939575, 0.00011424627155065536, 0.00011803768575191498, 0.00012182909995317459, 0.0001256205141544342, 0.00012941192835569382, 0.00013320334255695343, 0.00013699475675821304, 0.00014078617095947266]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 7.0, 12.0, 9.0, 9.0, 14.0, 22.0, 22.0, 30.0, 41.0, 67.0, 104.0, 168.0, 327.0, 611.0, 1302.0, 2914.0, 7236.0, 21165.0, 86960.0, 686834.0, 187307.0, 35185.0, 10591.0, 3959.0, 1769.0, 817.0, 414.0, 239.0, 123.0, 104.0, 52.0, 28.0, 26.0, 12.0, 14.0, 9.0, 9.0, 12.0, 7.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001552104949951172, -0.0001498013734817505, -0.0001443922519683838, -0.0001389831304550171, -0.0001335740089416504, -0.0001281648874282837, -0.000122755765914917, -0.00011734664440155029, -0.0001119375228881836, -0.0001065284013748169, -0.0001011192798614502, -9.57101583480835e-05, -9.03010368347168e-05, -8.48919153213501e-05, -7.94827938079834e-05, -7.40736722946167e-05, -6.866455078125e-05, -6.32554292678833e-05, -5.78463077545166e-05, -5.24371862411499e-05, -4.70280647277832e-05, -4.1618943214416504e-05, -3.6209821701049805e-05, -3.0800700187683105e-05, -2.5391578674316406e-05, -1.9982457160949707e-05, -1.4573335647583008e-05, -9.164214134216309e-06, -3.7550926208496094e-06, 1.6540288925170898e-06, 7.063150405883789e-06, 1.2472271919250488e-05, 1.7881393432617188e-05, 2.3290514945983887e-05, 2.8699636459350586e-05, 3.4108757972717285e-05, 3.9517879486083984e-05, 4.4927000999450684e-05, 5.033612251281738e-05, 5.574524402618408e-05, 6.115436553955078e-05, 6.656348705291748e-05, 7.197260856628418e-05, 7.738173007965088e-05, 8.279085159301758e-05, 8.819997310638428e-05, 9.360909461975098e-05, 9.901821613311768e-05, 0.00010442733764648438, 0.00010983645915985107, 0.00011524558067321777, 0.00012065470218658447, 0.00012606382369995117, 0.00013147294521331787, 0.00013688206672668457, 0.00014229118824005127, 0.00014770030975341797, 0.00015310943126678467, 0.00015851855278015137, 0.00016392767429351807, 0.00016933679580688477, 0.00017474591732025146, 0.00018015503883361816, 0.00018556416034698486, 0.00019097328186035156]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 11.0, 17.0, 16.0, 31.0, 55.0, 64.0, 93.0, 143.0, 123.0, 120.0, 110.0, 68.0, 36.0, 33.0, 19.0, 13.0, 12.0, 12.0, 6.0, 6.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52587890625e-05, -1.4477409422397614e-05, -1.3696029782295227e-05, -1.291465014219284e-05, -1.2133270502090454e-05, -1.1351890861988068e-05, -1.0570511221885681e-05, -9.789131581783295e-06, -9.007751941680908e-06, -8.226372301578522e-06, -7.444992661476135e-06, -6.663613021373749e-06, -5.882233381271362e-06, -5.100853741168976e-06, -4.319474101066589e-06, -3.538094460964203e-06, -2.7567148208618164e-06, -1.97533518075943e-06, -1.1939555406570435e-06, -4.12575900554657e-07, 3.688037395477295e-07, 1.150183379650116e-06, 1.9315630197525024e-06, 2.712942659854889e-06, 3.4943222999572754e-06, 4.275701940059662e-06, 5.057081580162048e-06, 5.838461220264435e-06, 6.619840860366821e-06, 7.401220500469208e-06, 8.182600140571594e-06, 8.96397978067398e-06, 9.745359420776367e-06, 1.0526739060878754e-05, 1.130811870098114e-05, 1.2089498341083527e-05, 1.2870877981185913e-05, 1.36522576212883e-05, 1.4433637261390686e-05, 1.5215016901493073e-05, 1.599639654159546e-05, 1.6777776181697845e-05, 1.7559155821800232e-05, 1.834053546190262e-05, 1.9121915102005005e-05, 1.990329474210739e-05, 2.0684674382209778e-05, 2.1466054022312164e-05, 2.224743366241455e-05, 2.3028813302516937e-05, 2.3810192942619324e-05, 2.459157258272171e-05, 2.5372952222824097e-05, 2.6154331862926483e-05, 2.693571150302887e-05, 2.7717091143131256e-05, 2.8498470783233643e-05, 2.927985042333603e-05, 3.0061230063438416e-05, 3.08426097035408e-05, 3.162398934364319e-05, 3.2405368983745575e-05, 3.318674862384796e-05, 3.396812826395035e-05, 3.4749507904052734e-05]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 17.0, 14.0, 19.0, 33.0, 50.0, 55.0, 81.0, 104.0, 179.0, 294.0, 445.0, 646.0, 938.0, 1429.0, 2002.0, 3243.0, 4941.0, 7395.0, 11381.0, 17534.0, 28340.0, 47338.0, 86039.0, 200530.0, 358081.0, 119322.0, 60860.0, 35477.0, 21564.0, 13915.0, 8855.0, 5956.0, 3748.0, 2608.0, 1751.0, 1033.0, 773.0, 479.0, 329.0, 255.0, 160.0, 129.0, 72.0, 47.0, 25.0, 25.0, 8.0, 13.0, 9.0, 5.0, 1.0, 3.0, 7.0, 1.0, 1.0], "bins": [-3.9577484130859375e-05, -3.838632255792618e-05, -3.719516098499298e-05, -3.6003999412059784e-05, -3.481283783912659e-05, -3.362167626619339e-05, -3.243051469326019e-05, -3.1239353120326996e-05, -3.00481915473938e-05, -2.8857029974460602e-05, -2.7665868401527405e-05, -2.6474706828594208e-05, -2.528354525566101e-05, -2.4092383682727814e-05, -2.2901222109794617e-05, -2.171006053686142e-05, -2.0518898963928223e-05, -1.9327737390995026e-05, -1.813657581806183e-05, -1.694541424512863e-05, -1.5754252672195435e-05, -1.4563091099262238e-05, -1.337192952632904e-05, -1.2180767953395844e-05, -1.0989606380462646e-05, -9.79844480752945e-06, -8.607283234596252e-06, -7.416121661663055e-06, -6.224960088729858e-06, -5.033798515796661e-06, -3.842636942863464e-06, -2.6514753699302673e-06, -1.4603137969970703e-06, -2.691522240638733e-07, 9.220093488693237e-07, 2.1131709218025208e-06, 3.3043324947357178e-06, 4.495494067668915e-06, 5.686655640602112e-06, 6.877817213535309e-06, 8.068978786468506e-06, 9.260140359401703e-06, 1.04513019323349e-05, 1.1642463505268097e-05, 1.2833625078201294e-05, 1.4024786651134491e-05, 1.5215948224067688e-05, 1.6407109797000885e-05, 1.7598271369934082e-05, 1.878943294286728e-05, 1.9980594515800476e-05, 2.1171756088733673e-05, 2.236291766166687e-05, 2.3554079234600067e-05, 2.4745240807533264e-05, 2.593640238046646e-05, 2.7127563953399658e-05, 2.8318725526332855e-05, 2.9509887099266052e-05, 3.070104867219925e-05, 3.1892210245132446e-05, 3.308337181806564e-05, 3.427453339099884e-05, 3.546569496393204e-05, 3.6656856536865234e-05]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 10.0, 7.0, 11.0, 10.0, 8.0, 7.0, 20.0, 8.0, 24.0, 18.0, 18.0, 29.0, 29.0, 29.0, 42.0, 29.0, 32.0, 48.0, 46.0, 50.0, 53.0, 47.0, 54.0, 48.0, 42.0, 48.0, 23.0, 29.0, 26.0, 20.0, 22.0, 14.0, 16.0, 17.0, 15.0, 12.0, 10.0, 10.0, 4.0, 2.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.319978713989258e-05, -3.219861537218094e-05, -3.11974436044693e-05, -3.019627183675766e-05, -2.919510006904602e-05, -2.819392830133438e-05, -2.7192756533622742e-05, -2.6191584765911102e-05, -2.5190412998199463e-05, -2.4189241230487823e-05, -2.3188069462776184e-05, -2.2186897695064545e-05, -2.1185725927352905e-05, -2.0184554159641266e-05, -1.9183382391929626e-05, -1.8182210624217987e-05, -1.7181038856506348e-05, -1.6179867088794708e-05, -1.5178695321083069e-05, -1.417752355337143e-05, -1.317635178565979e-05, -1.217518001794815e-05, -1.1174008250236511e-05, -1.0172836482524872e-05, -9.171664714813232e-06, -8.170492947101593e-06, -7.169321179389954e-06, -6.168149411678314e-06, -5.166977643966675e-06, -4.165805876255035e-06, -3.164634108543396e-06, -2.1634623408317566e-06, -1.1622905731201172e-06, -1.6111880540847778e-07, 8.400529623031616e-07, 1.841224730014801e-06, 2.8423964977264404e-06, 3.84356826543808e-06, 4.844740033149719e-06, 5.845911800861359e-06, 6.847083568572998e-06, 7.848255336284637e-06, 8.849427103996277e-06, 9.850598871707916e-06, 1.0851770639419556e-05, 1.1852942407131195e-05, 1.2854114174842834e-05, 1.3855285942554474e-05, 1.4856457710266113e-05, 1.5857629477977753e-05, 1.6858801245689392e-05, 1.785997301340103e-05, 1.886114478111267e-05, 1.986231654882431e-05, 2.086348831653595e-05, 2.186466008424759e-05, 2.286583185195923e-05, 2.3867003619670868e-05, 2.4868175387382507e-05, 2.5869347155094147e-05, 2.6870518922805786e-05, 2.7871690690517426e-05, 2.8872862458229065e-05, 2.9874034225940704e-05, 3.0875205993652344e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 5.0, 13.0, 10.0, 18.0, 31.0, 43.0, 60.0, 70.0, 107.0, 156.0, 251.0, 220.0, 491.0, 708.0, 1183.0, 1177.0, 2680.0, 4970.0, 9470.0, 11602.0, 36678.0, 102394.0, 476251.0, 276276.0, 53929.0, 36140.0, 15625.0, 7756.0, 3079.0, 2718.0, 1591.0, 943.0, 422.0, 472.0, 312.0, 222.0, 106.0, 128.0, 80.0, 49.0, 34.0, 19.0, 17.0, 12.0, 12.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.424022674560547e-06, -5.259178578853607e-06, -5.0943344831466675e-06, -4.929490387439728e-06, -4.764646291732788e-06, -4.599802196025848e-06, -4.434958100318909e-06, -4.270114004611969e-06, -4.105269908905029e-06, -3.94042581319809e-06, -3.77558171749115e-06, -3.61073762178421e-06, -3.4458935260772705e-06, -3.281049430370331e-06, -3.116205334663391e-06, -2.9513612389564514e-06, -2.7865171432495117e-06, -2.621673047542572e-06, -2.4568289518356323e-06, -2.2919848561286926e-06, -2.127140760421753e-06, -1.9622966647148132e-06, -1.7974525690078735e-06, -1.6326084733009338e-06, -1.4677643775939941e-06, -1.3029202818870544e-06, -1.1380761861801147e-06, -9.73232090473175e-07, -8.083879947662354e-07, -6.435438990592957e-07, -4.78699803352356e-07, -3.1385570764541626e-07, -1.4901161193847656e-07, 1.5832483768463135e-08, 1.8067657947540283e-07, 3.4552067518234253e-07, 5.103647708892822e-07, 6.752088665962219e-07, 8.400529623031616e-07, 1.0048970580101013e-06, 1.169741153717041e-06, 1.3345852494239807e-06, 1.4994293451309204e-06, 1.6642734408378601e-06, 1.8291175365447998e-06, 1.9939616322517395e-06, 2.158805727958679e-06, 2.323649823665619e-06, 2.4884939193725586e-06, 2.6533380150794983e-06, 2.818182110786438e-06, 2.9830262064933777e-06, 3.1478703022003174e-06, 3.312714397907257e-06, 3.4775584936141968e-06, 3.6424025893211365e-06, 3.807246685028076e-06, 3.972090780735016e-06, 4.1369348764419556e-06, 4.301778972148895e-06, 4.466623067855835e-06, 4.631467163562775e-06, 4.796311259269714e-06, 4.961155354976654e-06, 5.125999450683594e-06]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 8.0, 9.0, 0.0, 11.0, 14.0, 0.0, 18.0, 35.0, 0.0, 33.0, 39.0, 0.0, 63.0, 65.0, 0.0, 90.0, 94.0, 82.0, 0.0, 89.0, 81.0, 0.0, 57.0, 60.0, 0.0, 37.0, 31.0, 0.0, 24.0, 14.0, 0.0, 24.0, 13.0, 6.0, 0.0, 5.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.430511474609375e-06, -1.389533281326294e-06, -1.3485550880432129e-06, -1.3075768947601318e-06, -1.2665987014770508e-06, -1.2256205081939697e-06, -1.1846423149108887e-06, -1.1436641216278076e-06, -1.1026859283447266e-06, -1.0617077350616455e-06, -1.0207295417785645e-06, -9.797513484954834e-07, -9.387731552124023e-07, -8.977949619293213e-07, -8.568167686462402e-07, -8.158385753631592e-07, -7.748603820800781e-07, -7.338821887969971e-07, -6.92903995513916e-07, -6.51925802230835e-07, -6.109476089477539e-07, -5.699694156646729e-07, -5.289912223815918e-07, -4.880130290985107e-07, -4.470348358154297e-07, -4.0605664253234863e-07, -3.650784492492676e-07, -3.241002559661865e-07, -2.8312206268310547e-07, -2.421438694000244e-07, -2.0116567611694336e-07, -1.601874828338623e-07, -1.1920928955078125e-07, -7.82310962677002e-08, -3.725290298461914e-08, 3.725290298461914e-09, 4.470348358154297e-08, 8.568167686462402e-08, 1.2665987014770508e-07, 1.6763806343078613e-07, 2.086162567138672e-07, 2.4959444999694824e-07, 2.905726432800293e-07, 3.3155083656311035e-07, 3.725290298461914e-07, 4.1350722312927246e-07, 4.544854164123535e-07, 4.954636096954346e-07, 5.364418029785156e-07, 5.774199962615967e-07, 6.183981895446777e-07, 6.593763828277588e-07, 7.003545761108398e-07, 7.413327693939209e-07, 7.82310962677002e-07, 8.23289155960083e-07, 8.642673492431641e-07, 9.052455425262451e-07, 9.462237358093262e-07, 9.872019290924072e-07, 1.0281801223754883e-06, 1.0691583156585693e-06, 1.1101365089416504e-06, 1.1511147022247314e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 11.0, 26.0, 14.0, 20.0, 79.0, 40.0, 100.0, 85.0, 223.0, 135.0, 413.0, 279.0, 776.0, 548.0, 668.0, 1961.0, 1381.0, 4178.0, 3037.0, 9840.0, 7896.0, 27215.0, 25381.0, 117019.0, 163378.0, 318859.0, 238963.0, 41757.0, 41559.0, 11192.0, 13313.0, 4133.0, 5441.0, 1832.0, 2426.0, 897.0, 721.0, 997.0, 334.0, 465.0, 201.0, 255.0, 92.0, 151.0, 60.0, 87.0, 19.0, 23.0, 30.0, 8.0, 15.0, 7.0, 8.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.8014183044433594e-06, -2.71480530500412e-06, -2.6281923055648804e-06, -2.541579306125641e-06, -2.4549663066864014e-06, -2.368353307247162e-06, -2.2817403078079224e-06, -2.195127308368683e-06, -2.1085143089294434e-06, -2.021901309490204e-06, -1.9352883100509644e-06, -1.8486753106117249e-06, -1.7620623111724854e-06, -1.6754493117332458e-06, -1.5888363122940063e-06, -1.5022233128547668e-06, -1.4156103134155273e-06, -1.3289973139762878e-06, -1.2423843145370483e-06, -1.1557713150978088e-06, -1.0691583156585693e-06, -9.825453162193298e-07, -8.959323167800903e-07, -8.093193173408508e-07, -7.227063179016113e-07, -6.360933184623718e-07, -5.494803190231323e-07, -4.628673195838928e-07, -3.762543201446533e-07, -2.896413207054138e-07, -2.0302832126617432e-07, -1.1641532182693481e-07, -2.9802322387695312e-08, 5.681067705154419e-08, 1.434236764907837e-07, 2.300366759300232e-07, 3.166496753692627e-07, 4.032626748085022e-07, 4.898756742477417e-07, 5.764886736869812e-07, 6.631016731262207e-07, 7.497146725654602e-07, 8.363276720046997e-07, 9.229406714439392e-07, 1.0095536708831787e-06, 1.0961666703224182e-06, 1.1827796697616577e-06, 1.2693926692008972e-06, 1.3560056686401367e-06, 1.4426186680793762e-06, 1.5292316675186157e-06, 1.6158446669578552e-06, 1.7024576663970947e-06, 1.7890706658363342e-06, 1.8756836652755737e-06, 1.9622966647148132e-06, 2.0489096641540527e-06, 2.1355226635932922e-06, 2.2221356630325317e-06, 2.3087486624717712e-06, 2.3953616619110107e-06, 2.4819746613502502e-06, 2.5685876607894897e-06, 2.6552006602287292e-06, 2.7418136596679688e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 7.0, 4.0, 6.0, 4.0, 7.0, 20.0, 15.0, 12.0, 15.0, 24.0, 54.0, 30.0, 38.0, 47.0, 45.0, 68.0, 132.0, 56.0, 62.0, 46.0, 45.0, 71.0, 26.0, 26.0, 17.0, 9.0, 28.0, 10.0, 11.0, 8.0, 2.0, 4.0, 17.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.3245811462402344e-06, -2.253800630569458e-06, -2.1830201148986816e-06, -2.1122395992279053e-06, -2.041459083557129e-06, -1.9706785678863525e-06, -1.8998980522155762e-06, -1.8291175365447998e-06, -1.7583370208740234e-06, -1.687556505203247e-06, -1.6167759895324707e-06, -1.5459954738616943e-06, -1.475214958190918e-06, -1.4044344425201416e-06, -1.3336539268493652e-06, -1.2628734111785889e-06, -1.1920928955078125e-06, -1.1213123798370361e-06, -1.0505318641662598e-06, -9.797513484954834e-07, -9.08970832824707e-07, -8.381903171539307e-07, -7.674098014831543e-07, -6.966292858123779e-07, -6.258487701416016e-07, -5.550682544708252e-07, -4.842877388000488e-07, -4.1350722312927246e-07, -3.427267074584961e-07, -2.7194619178771973e-07, -2.0116567611694336e-07, -1.30385160446167e-07, -5.960464477539063e-08, 1.1175870895385742e-08, 8.195638656616211e-08, 1.5273690223693848e-07, 2.2351741790771484e-07, 2.942979335784912e-07, 3.650784492492676e-07, 4.3585896492004395e-07, 5.066394805908203e-07, 5.774199962615967e-07, 6.48200511932373e-07, 7.189810276031494e-07, 7.897615432739258e-07, 8.605420589447021e-07, 9.313225746154785e-07, 1.0021030902862549e-06, 1.0728836059570312e-06, 1.1436641216278076e-06, 1.214444637298584e-06, 1.2852251529693604e-06, 1.3560056686401367e-06, 1.426786184310913e-06, 1.4975666999816895e-06, 1.5683472156524658e-06, 1.6391277313232422e-06, 1.7099082469940186e-06, 1.780688762664795e-06, 1.8514692783355713e-06, 1.9222497940063477e-06, 1.993030309677124e-06, 2.0638108253479004e-06, 2.1345913410186768e-06, 2.205371856689453e-06]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 9.0, 21.0, 29.0, 30.0, 48.0, 82.0, 146.0, 189.0, 107.0, 74.0, 36.0, 33.0, 24.0, 24.0, 30.0, 11.0, 15.0, 7.0, 12.0, 10.0, 8.0, 10.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012616651656571776, -0.00012093228724552318, -0.00011569806520128623, -0.00011046383588109165, -0.0001052296138368547, -9.999538451666012e-05, -9.476115519646555e-05, -8.95269331522286e-05, -8.429270383203402e-05, -7.905847451183945e-05, -7.382425246760249e-05, -6.859002314740792e-05, -6.335579382721335e-05, -5.812157178297639e-05, -5.288734246278182e-05, -4.765311678056605e-05, -4.2418891098350286e-05, -3.718466541613452e-05, -3.1950439733918756e-05, -2.6716210413724184e-05, -2.148198473150842e-05, -1.6247759049292654e-05, -1.1013529729098082e-05, -5.7793040468823165e-06, -5.450783646665514e-07, 4.6891482270439155e-06, 9.923374818754382e-06, 1.5157602319959551e-05, 2.0391828002175316e-05, 2.562605368439108e-05, 3.0860283004585654e-05, 3.609450868680142e-05, 4.1328719817101955e-05, 4.656294549931772e-05, 5.1797171181533486e-05, 5.703140050172806e-05, 6.226562254596502e-05, 6.749985186615959e-05, 7.273408118635416e-05, 7.796830323059112e-05, 8.320253255078569e-05, 8.843676187098026e-05, 9.367098391521722e-05, 9.890521323541179e-05, 0.00010413944255560637, 0.00010937366459984332, 0.0001146078939200379, 0.00011984212324023247, 0.00012507634528446943, 0.00013031056732870638, 0.00013554480392485857, 0.00014077902596909553, 0.00014601324801333249, 0.00015124748460948467, 0.00015648170665372163, 0.0001617159286979586, 0.00016695016529411077, 0.00017218438733834773, 0.00017741862393449992, 0.00018265284597873688, 0.00018788706802297384, 0.0001931212900672108, 0.00019835552666336298, 0.00020358974870759994, 0.0002088239707518369]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 8.0, 4.0, 3.0, 7.0, 7.0, 9.0, 15.0, 10.0, 10.0, 11.0, 11.0, 17.0, 18.0, 19.0, 23.0, 27.0, 30.0, 33.0, 28.0, 32.0, 39.0, 49.0, 39.0, 47.0, 47.0, 36.0, 30.0, 41.0, 31.0, 38.0, 34.0, 32.0, 29.0, 28.0, 18.0, 28.0, 17.0, 16.0, 16.0, 13.0, 7.0, 13.0, 3.0, 5.0, 8.0, 3.0, 2.0, 5.0, 3.0, 8.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.620189666748047e-05, -9.331479668617249e-05, -9.04276967048645e-05, -8.754059672355652e-05, -8.465349674224854e-05, -8.176639676094055e-05, -7.887929677963257e-05, -7.599219679832458e-05, -7.31050968170166e-05, -7.021799683570862e-05, -6.733089685440063e-05, -6.444379687309265e-05, -6.155669689178467e-05, -5.8669596910476685e-05, -5.57824969291687e-05, -5.289539694786072e-05, -5.0008296966552734e-05, -4.712119698524475e-05, -4.423409700393677e-05, -4.1346997022628784e-05, -3.84598970413208e-05, -3.557279706001282e-05, -3.2685697078704834e-05, -2.979859709739685e-05, -2.6911497116088867e-05, -2.4024397134780884e-05, -2.11372971534729e-05, -1.8250197172164917e-05, -1.5363097190856934e-05, -1.247599720954895e-05, -9.588897228240967e-06, -6.701797246932983e-06, -3.814697265625e-06, -9.275972843170166e-07, 1.959502696990967e-06, 4.84660267829895e-06, 7.733702659606934e-06, 1.0620802640914917e-05, 1.35079026222229e-05, 1.6395002603530884e-05, 1.9282102584838867e-05, 2.216920256614685e-05, 2.5056302547454834e-05, 2.7943402528762817e-05, 3.08305025100708e-05, 3.3717602491378784e-05, 3.660470247268677e-05, 3.949180245399475e-05, 4.2378902435302734e-05, 4.526600241661072e-05, 4.81531023979187e-05, 5.1040202379226685e-05, 5.392730236053467e-05, 5.681440234184265e-05, 5.9701502323150635e-05, 6.258860230445862e-05, 6.54757022857666e-05, 6.836280226707458e-05, 7.124990224838257e-05, 7.413700222969055e-05, 7.702410221099854e-05, 7.991120219230652e-05, 8.27983021736145e-05, 8.568540215492249e-05, 8.857250213623047e-05]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 16.0, 24.0, 27.0, 38.0, 54.0, 89.0, 136.0, 203.0, 306.0, 519.0, 723.0, 1211.0, 1926.0, 3053.0, 4964.0, 8100.0, 14325.0, 29887.0, 72523.0, 3698165.0, 258589.0, 50415.0, 22557.0, 10891.0, 6020.0, 3236.0, 2048.0, 1288.0, 777.0, 654.0, 418.0, 262.0, 217.0, 161.0, 120.0, 79.0, 53.0, 54.0, 43.0, 32.0, 16.0, 9.0, 11.0, 8.0, 7.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.374452590942383e-05, -8.050259202718735e-05, -7.726065814495087e-05, -7.401872426271439e-05, -7.07767903804779e-05, -6.753485649824142e-05, -6.429292261600494e-05, -6.105098873376846e-05, -5.780905485153198e-05, -5.45671209692955e-05, -5.132518708705902e-05, -4.808325320482254e-05, -4.484131932258606e-05, -4.159938544034958e-05, -3.83574515581131e-05, -3.511551767587662e-05, -3.187358379364014e-05, -2.8631649911403656e-05, -2.5389716029167175e-05, -2.2147782146930695e-05, -1.8905848264694214e-05, -1.5663914382457733e-05, -1.2421980500221252e-05, -9.180046617984772e-06, -5.938112735748291e-06, -2.6961788535118103e-06, 5.457550287246704e-07, 3.787688910961151e-06, 7.029622793197632e-06, 1.0271556675434113e-05, 1.3513490557670593e-05, 1.6755424439907074e-05, 1.9997358322143555e-05, 2.3239292204380035e-05, 2.6481226086616516e-05, 2.9723159968852997e-05, 3.296509385108948e-05, 3.620702773332596e-05, 3.944896161556244e-05, 4.269089549779892e-05, 4.59328293800354e-05, 4.917476326227188e-05, 5.241669714450836e-05, 5.565863102674484e-05, 5.890056490898132e-05, 6.21424987912178e-05, 6.538443267345428e-05, 6.862636655569077e-05, 7.186830043792725e-05, 7.511023432016373e-05, 7.835216820240021e-05, 8.159410208463669e-05, 8.483603596687317e-05, 8.807796984910965e-05, 9.131990373134613e-05, 9.456183761358261e-05, 9.780377149581909e-05, 0.00010104570537805557, 0.00010428763926029205, 0.00010752957314252853, 0.00011077150702476501, 0.0001140134409070015, 0.00011725537478923798, 0.00012049730867147446, 0.00012373924255371094]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 10.0, 11.0, 15.0, 16.0, 20.0, 13.0, 35.0, 44.0, 48.0, 68.0, 82.0, 90.0, 94.0, 74.0, 80.0, 71.0, 50.0, 43.0, 29.0, 30.0, 15.0, 11.0, 9.0, 9.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3828277587890625e-05, -1.3285316526889801e-05, -1.2742355465888977e-05, -1.2199394404888153e-05, -1.1656433343887329e-05, -1.1113472282886505e-05, -1.0570511221885681e-05, -1.0027550160884857e-05, -9.484589099884033e-06, -8.94162803888321e-06, -8.398666977882385e-06, -7.855705916881561e-06, -7.312744855880737e-06, -6.769783794879913e-06, -6.226822733879089e-06, -5.683861672878265e-06, -5.140900611877441e-06, -4.5979395508766174e-06, -4.0549784898757935e-06, -3.5120174288749695e-06, -2.9690563678741455e-06, -2.4260953068733215e-06, -1.8831342458724976e-06, -1.3401731848716736e-06, -7.972121238708496e-07, -2.5425106287002563e-07, 2.8870999813079834e-07, 8.316710591316223e-07, 1.3746321201324463e-06, 1.9175931811332703e-06, 2.4605542421340942e-06, 3.0035153031349182e-06, 3.546476364135742e-06, 4.089437425136566e-06, 4.63239848613739e-06, 5.175359547138214e-06, 5.718320608139038e-06, 6.261281669139862e-06, 6.804242730140686e-06, 7.34720379114151e-06, 7.890164852142334e-06, 8.433125913143158e-06, 8.976086974143982e-06, 9.519048035144806e-06, 1.006200909614563e-05, 1.0604970157146454e-05, 1.1147931218147278e-05, 1.1690892279148102e-05, 1.2233853340148926e-05, 1.277681440114975e-05, 1.3319775462150574e-05, 1.3862736523151398e-05, 1.4405697584152222e-05, 1.4948658645153046e-05, 1.549161970615387e-05, 1.6034580767154694e-05, 1.6577541828155518e-05, 1.712050288915634e-05, 1.7663463950157166e-05, 1.820642501115799e-05, 1.8749386072158813e-05, 1.9292347133159637e-05, 1.983530819416046e-05, 2.0378269255161285e-05, 2.092123031616211e-05]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 6.0, 9.0, 11.0, 30.0, 22.0, 22.0, 47.0, 81.0, 87.0, 166.0, 238.0, 411.0, 607.0, 969.0, 1587.0, 2845.0, 5015.0, 9393.0, 19108.0, 43542.0, 124202.0, 3609708.0, 259033.0, 63221.0, 25931.0, 12340.0, 6682.0, 3509.0, 2070.0, 1269.0, 734.0, 525.0, 299.0, 171.0, 136.0, 82.0, 48.0, 41.0, 28.0, 20.0, 10.0, 8.0, 11.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.635354995727539e-05, -7.401779294013977e-05, -7.168203592300415e-05, -6.934627890586853e-05, -6.701052188873291e-05, -6.467476487159729e-05, -6.233900785446167e-05, -6.000325083732605e-05, -5.766749382019043e-05, -5.533173680305481e-05, -5.299597978591919e-05, -5.066022276878357e-05, -4.832446575164795e-05, -4.598870873451233e-05, -4.365295171737671e-05, -4.131719470024109e-05, -3.898143768310547e-05, -3.664568066596985e-05, -3.430992364883423e-05, -3.197416663169861e-05, -2.9638409614562988e-05, -2.7302652597427368e-05, -2.4966895580291748e-05, -2.2631138563156128e-05, -2.0295381546020508e-05, -1.7959624528884888e-05, -1.5623867511749268e-05, -1.3288110494613647e-05, -1.0952353477478027e-05, -8.616596460342407e-06, -6.280839443206787e-06, -3.945082426071167e-06, -1.6093254089355469e-06, 7.264316082000732e-07, 3.0621886253356934e-06, 5.3979456424713135e-06, 7.733702659606934e-06, 1.0069459676742554e-05, 1.2405216693878174e-05, 1.4740973711013794e-05, 1.7076730728149414e-05, 1.9412487745285034e-05, 2.1748244762420654e-05, 2.4084001779556274e-05, 2.6419758796691895e-05, 2.8755515813827515e-05, 3.1091272830963135e-05, 3.3427029848098755e-05, 3.5762786865234375e-05, 3.8098543882369995e-05, 4.0434300899505615e-05, 4.2770057916641235e-05, 4.5105814933776855e-05, 4.7441571950912476e-05, 4.9777328968048096e-05, 5.2113085985183716e-05, 5.4448843002319336e-05, 5.6784600019454956e-05, 5.9120357036590576e-05, 6.14561140537262e-05, 6.379187107086182e-05, 6.612762808799744e-05, 6.846338510513306e-05, 7.079914212226868e-05, 7.31348991394043e-05]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 21.0, 15.0, 23.0, 26.0, 38.0, 50.0, 76.0, 260.0, 2118.0, 872.0, 167.0, 65.0, 47.0, 45.0, 40.0, 33.0, 29.0, 14.0, 16.0, 21.0, 14.0, 9.0, 8.0, 9.0, 7.0, 5.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5391578674316406e-05, -2.4178065359592438e-05, -2.296455204486847e-05, -2.17510387301445e-05, -2.0537525415420532e-05, -1.9324012100696564e-05, -1.8110498785972595e-05, -1.6896985471248627e-05, -1.5683472156524658e-05, -1.446995884180069e-05, -1.3256445527076721e-05, -1.2042932212352753e-05, -1.0829418897628784e-05, -9.615905582904816e-06, -8.402392268180847e-06, -7.188878953456879e-06, -5.97536563873291e-06, -4.761852324008942e-06, -3.548339009284973e-06, -2.3348256945610046e-06, -1.1213123798370361e-06, 9.220093488693237e-08, 1.3057142496109009e-06, 2.5192275643348694e-06, 3.732740879058838e-06, 4.946254193782806e-06, 6.159767508506775e-06, 7.373280823230743e-06, 8.586794137954712e-06, 9.80030745267868e-06, 1.1013820767402649e-05, 1.2227334082126617e-05, 1.3440847396850586e-05, 1.4654360711574554e-05, 1.5867874026298523e-05, 1.708138734102249e-05, 1.829490065574646e-05, 1.950841397047043e-05, 2.0721927285194397e-05, 2.1935440599918365e-05, 2.3148953914642334e-05, 2.4362467229366302e-05, 2.557598054409027e-05, 2.678949385881424e-05, 2.8003007173538208e-05, 2.9216520488262177e-05, 3.0430033802986145e-05, 3.1643547117710114e-05, 3.285706043243408e-05, 3.407057374715805e-05, 3.528408706188202e-05, 3.649760037660599e-05, 3.7711113691329956e-05, 3.8924627006053925e-05, 4.013814032077789e-05, 4.135165363550186e-05, 4.256516695022583e-05, 4.37786802649498e-05, 4.499219357967377e-05, 4.6205706894397736e-05, 4.7419220209121704e-05, 4.863273352384567e-05, 4.984624683856964e-05, 5.105976015329361e-05, 5.227327346801758e-05]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 12.0, 17.0, 21.0, 36.0, 63.0, 102.0, 190.0, 124.0, 101.0, 81.0, 45.0, 40.0, 32.0, 32.0, 21.0, 18.0, 10.0, 5.0, 10.0, 7.0, 6.0, 4.0, 4.0, 9.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002415499766357243, -0.00023281027097254992, -0.00022407056530937552, -0.0002153308450942859, -0.00020659113943111151, -0.00019785143376793712, -0.0001891117135528475, -0.00018037200788967311, -0.00017163230222649872, -0.00016289259656332433, -0.00015415289090014994, -0.00014541317068506032, -0.00013667346502188593, -0.00012793375935871154, -0.00011919404641957954, -0.00011045433348044753, -0.00010171462781727314, -9.297492215409875e-05, -8.423520921496674e-05, -7.549549627583474e-05, -6.675579061266035e-05, -5.801608131150715e-05, -4.927637201035395e-05, -4.053665907122195e-05, -3.179695340804756e-05, -2.305724410689436e-05, -1.4317534805741161e-05, -5.577825504587963e-06, 3.1618837965652347e-06, 1.1901593097718433e-05, 2.064130239887163e-05, 2.9381015338003635e-05, 3.812069189734757e-05, 4.686040119850077e-05, 5.5600110499653965e-05, 6.433982343878597e-05, 7.307952910196036e-05, 8.181923476513475e-05, 9.055894770426676e-05, 9.929866064339876e-05, 0.00010803836630657315, 0.00011677807196974754, 0.00012551777763292193, 0.00013425749784801155, 0.00014299720351118594, 0.00015173690917436033, 0.00016047662938944995, 0.00016921633505262434, 0.00017795604071579874, 0.00018669574637897313, 0.00019543545204214752, 0.00020417517225723714, 0.00021291487792041153, 0.00022165458358358592, 0.00023039430379867554, 0.00023913400946184993, 0.0002478737151250243, 0.0002566134207881987, 0.0002653531264513731, 0.0002740928321145475, 0.0002828325377777219, 0.00029157227254472673, 0.0003003119782079011, 0.0003090516838710755, 0.0003177913895342499]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 9.0, 11.0, 8.0, 1.0, 12.0, 9.0, 16.0, 17.0, 17.0, 17.0, 25.0, 29.0, 32.0, 31.0, 34.0, 29.0, 30.0, 35.0, 43.0, 37.0, 42.0, 40.0, 38.0, 34.0, 42.0, 37.0, 37.0, 33.0, 21.0, 27.0, 23.0, 30.0, 29.0, 20.0, 11.0, 20.0, 8.0, 11.0, 9.0, 11.0, 7.0, 7.0, 3.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012010335922241211, -0.00011602137237787247, -0.00011193938553333282, -0.00010785739868879318, -0.00010377541184425354, -9.96934249997139e-05, -9.561143815517426e-05, -9.152945131063461e-05, -8.744746446609497e-05, -8.336547762155533e-05, -7.928349077701569e-05, -7.520150393247604e-05, -7.11195170879364e-05, -6.703753024339676e-05, -6.295554339885712e-05, -5.8873556554317474e-05, -5.479156970977783e-05, -5.070958286523819e-05, -4.662759602069855e-05, -4.2545609176158905e-05, -3.846362233161926e-05, -3.438163548707962e-05, -3.0299648642539978e-05, -2.6217661798000336e-05, -2.2135674953460693e-05, -1.805368810892105e-05, -1.3971701264381409e-05, -9.889714419841766e-06, -5.807727575302124e-06, -1.7257407307624817e-06, 2.3562461137771606e-06, 6.438232958316803e-06, 1.0520219802856445e-05, 1.4602206647396088e-05, 1.868419349193573e-05, 2.2766180336475372e-05, 2.6848167181015015e-05, 3.093015402555466e-05, 3.50121408700943e-05, 3.909412771463394e-05, 4.3176114559173584e-05, 4.7258101403713226e-05, 5.134008824825287e-05, 5.542207509279251e-05, 5.950406193733215e-05, 6.35860487818718e-05, 6.766803562641144e-05, 7.175002247095108e-05, 7.583200931549072e-05, 7.991399616003036e-05, 8.399598300457001e-05, 8.807796984910965e-05, 9.215995669364929e-05, 9.624194353818893e-05, 0.00010032393038272858, 0.00010440591722726822, 0.00010848790407180786, 0.0001125698909163475, 0.00011665187776088715, 0.00012073386460542679, 0.00012481585144996643, 0.00012889783829450607, 0.00013297982513904572, 0.00013706181198358536, 0.000141143798828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 8.0, 9.0, 10.0, 10.0, 17.0, 24.0, 20.0, 36.0, 46.0, 81.0, 147.0, 270.0, 510.0, 1092.0, 2400.0, 5455.0, 14590.0, 46087.0, 274879.0, 601559.0, 68835.0, 19574.0, 7089.0, 3013.0, 1337.0, 623.0, 308.0, 184.0, 114.0, 54.0, 36.0, 17.0, 23.0, 18.0, 10.0, 17.0, 5.0, 6.0, 4.0, 8.0, 4.0, 0.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001360177993774414, -0.0001315046101808548, -0.0001269914209842682, -0.00012247823178768158, -0.00011796504259109497, -0.00011345185339450836, -0.00010893866419792175, -0.00010442547500133514, -9.991228580474854e-05, -9.539909660816193e-05, -9.088590741157532e-05, -8.637271821498871e-05, -8.18595290184021e-05, -7.734633982181549e-05, -7.283315062522888e-05, -6.831996142864227e-05, -6.380677223205566e-05, -5.9293583035469055e-05, -5.4780393838882446e-05, -5.026720464229584e-05, -4.575401544570923e-05, -4.124082624912262e-05, -3.672763705253601e-05, -3.22144478559494e-05, -2.7701258659362793e-05, -2.3188069462776184e-05, -1.8674880266189575e-05, -1.4161691069602966e-05, -9.648501873016357e-06, -5.1353126764297485e-06, -6.221234798431396e-07, 3.891065716743469e-06, 8.404254913330078e-06, 1.2917444109916687e-05, 1.7430633306503296e-05, 2.1943822503089905e-05, 2.6457011699676514e-05, 3.097020089626312e-05, 3.548339009284973e-05, 3.999657928943634e-05, 4.450976848602295e-05, 4.902295768260956e-05, 5.353614687919617e-05, 5.8049336075782776e-05, 6.256252527236938e-05, 6.7075714468956e-05, 7.15889036655426e-05, 7.610209286212921e-05, 8.061528205871582e-05, 8.512847125530243e-05, 8.964166045188904e-05, 9.415484964847565e-05, 9.866803884506226e-05, 0.00010318122804164886, 0.00010769441723823547, 0.00011220760643482208, 0.00011672079563140869, 0.0001212339848279953, 0.0001257471740245819, 0.00013026036322116852, 0.00013477355241775513, 0.00013928674161434174, 0.00014379993081092834, 0.00014831312000751495, 0.00015282630920410156]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 9.0, 6.0, 19.0, 17.0, 23.0, 24.0, 49.0, 67.0, 106.0, 108.0, 144.0, 102.0, 109.0, 68.0, 40.0, 39.0, 21.0, 16.0, 12.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3887882232666016e-05, -1.3134442269802094e-05, -1.2381002306938171e-05, -1.162756234407425e-05, -1.0874122381210327e-05, -1.0120682418346405e-05, -9.367242455482483e-06, -8.61380249261856e-06, -7.860362529754639e-06, -7.1069225668907166e-06, -6.3534826040267944e-06, -5.600042641162872e-06, -4.84660267829895e-06, -4.093162715435028e-06, -3.339722752571106e-06, -2.586282789707184e-06, -1.8328428268432617e-06, -1.0794028639793396e-06, -3.259629011154175e-07, 4.2747706174850464e-07, 1.1809170246124268e-06, 1.934356987476349e-06, 2.687796950340271e-06, 3.441236913204193e-06, 4.194676876068115e-06, 4.948116838932037e-06, 5.7015568017959595e-06, 6.454996764659882e-06, 7.208436727523804e-06, 7.961876690387726e-06, 8.715316653251648e-06, 9.46875661611557e-06, 1.0222196578979492e-05, 1.0975636541843414e-05, 1.1729076504707336e-05, 1.2482516467571259e-05, 1.323595643043518e-05, 1.3989396393299103e-05, 1.4742836356163025e-05, 1.5496276319026947e-05, 1.624971628189087e-05, 1.700315624475479e-05, 1.7756596207618713e-05, 1.8510036170482635e-05, 1.9263476133346558e-05, 2.001691609621048e-05, 2.0770356059074402e-05, 2.1523796021938324e-05, 2.2277235984802246e-05, 2.3030675947666168e-05, 2.378411591053009e-05, 2.4537555873394012e-05, 2.5290995836257935e-05, 2.6044435799121857e-05, 2.679787576198578e-05, 2.75513157248497e-05, 2.8304755687713623e-05, 2.9058195650577545e-05, 2.9811635613441467e-05, 3.056507557630539e-05, 3.131851553916931e-05, 3.2071955502033234e-05, 3.2825395464897156e-05, 3.357883542776108e-05, 3.4332275390625e-05]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 7.0, 4.0, 17.0, 16.0, 24.0, 45.0, 30.0, 66.0, 110.0, 153.0, 211.0, 292.0, 418.0, 569.0, 871.0, 1235.0, 1756.0, 2427.0, 3737.0, 5476.0, 7541.0, 11767.0, 17538.0, 26251.0, 37691.0, 65783.0, 119860.0, 291836.0, 203143.0, 94555.0, 53923.0, 31865.0, 22540.0, 15040.0, 10113.0, 6433.0, 4742.0, 3320.0, 2051.0, 1594.0, 1064.0, 738.0, 494.0, 350.0, 270.0, 175.0, 119.0, 90.0, 60.0, 50.0, 35.0, 15.0, 19.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-2.9802322387695312e-05, -2.886541187763214e-05, -2.792850136756897e-05, -2.69915908575058e-05, -2.6054680347442627e-05, -2.5117769837379456e-05, -2.4180859327316284e-05, -2.3243948817253113e-05, -2.230703830718994e-05, -2.137012779712677e-05, -2.04332172870636e-05, -1.9496306777000427e-05, -1.8559396266937256e-05, -1.7622485756874084e-05, -1.6685575246810913e-05, -1.5748664736747742e-05, -1.481175422668457e-05, -1.3874843716621399e-05, -1.2937933206558228e-05, -1.2001022696495056e-05, -1.1064112186431885e-05, -1.0127201676368713e-05, -9.190291166305542e-06, -8.25338065624237e-06, -7.316470146179199e-06, -6.379559636116028e-06, -5.4426491260528564e-06, -4.505738615989685e-06, -3.5688281059265137e-06, -2.6319175958633423e-06, -1.695007085800171e-06, -7.580965757369995e-07, 1.7881393432617188e-07, 1.1157244443893433e-06, 2.0526349544525146e-06, 2.989545464515686e-06, 3.926455974578857e-06, 4.863366484642029e-06, 5.8002769947052e-06, 6.737187504768372e-06, 7.674098014831543e-06, 8.611008524894714e-06, 9.547919034957886e-06, 1.0484829545021057e-05, 1.1421740055084229e-05, 1.23586505651474e-05, 1.3295561075210571e-05, 1.4232471585273743e-05, 1.5169382095336914e-05, 1.6106292605400085e-05, 1.7043203115463257e-05, 1.7980113625526428e-05, 1.89170241355896e-05, 1.985393464565277e-05, 2.0790845155715942e-05, 2.1727755665779114e-05, 2.2664666175842285e-05, 2.3601576685905457e-05, 2.4538487195968628e-05, 2.54753977060318e-05, 2.641230821609497e-05, 2.7349218726158142e-05, 2.8286129236221313e-05, 2.9223039746284485e-05, 3.0159950256347656e-05]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 10.0, 8.0, 14.0, 14.0, 12.0, 18.0, 22.0, 12.0, 16.0, 31.0, 24.0, 33.0, 32.0, 35.0, 50.0, 40.0, 36.0, 35.0, 39.0, 45.0, 38.0, 33.0, 48.0, 38.0, 37.0, 28.0, 35.0, 19.0, 23.0, 22.0, 18.0, 20.0, 19.0, 10.0, 11.0, 13.0, 12.0, 10.0, 11.0, 5.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.855062484741211e-05, -2.766679972410202e-05, -2.678297460079193e-05, -2.5899149477481842e-05, -2.5015324354171753e-05, -2.4131499230861664e-05, -2.3247674107551575e-05, -2.2363848984241486e-05, -2.1480023860931396e-05, -2.0596198737621307e-05, -1.9712373614311218e-05, -1.882854849100113e-05, -1.794472336769104e-05, -1.706089824438095e-05, -1.6177073121070862e-05, -1.5293247997760773e-05, -1.4409422874450684e-05, -1.3525597751140594e-05, -1.2641772627830505e-05, -1.1757947504520416e-05, -1.0874122381210327e-05, -9.990297257900238e-06, -9.106472134590149e-06, -8.22264701128006e-06, -7.338821887969971e-06, -6.454996764659882e-06, -5.5711716413497925e-06, -4.687346518039703e-06, -3.8035213947296143e-06, -2.919696271419525e-06, -2.035871148109436e-06, -1.152046024799347e-06, -2.682209014892578e-07, 6.156042218208313e-07, 1.4994293451309204e-06, 2.3832544684410095e-06, 3.2670795917510986e-06, 4.150904715061188e-06, 5.034729838371277e-06, 5.918554961681366e-06, 6.802380084991455e-06, 7.686205208301544e-06, 8.570030331611633e-06, 9.453855454921722e-06, 1.0337680578231812e-05, 1.12215057015419e-05, 1.210533082485199e-05, 1.2989155948162079e-05, 1.3872981071472168e-05, 1.4756806194782257e-05, 1.5640631318092346e-05, 1.6524456441402435e-05, 1.7408281564712524e-05, 1.8292106688022614e-05, 1.9175931811332703e-05, 2.0059756934642792e-05, 2.094358205795288e-05, 2.182740718126297e-05, 2.271123230457306e-05, 2.3595057427883148e-05, 2.4478882551193237e-05, 2.5362707674503326e-05, 2.6246532797813416e-05, 2.7130357921123505e-05, 2.8014183044433594e-05]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 9.0, 10.0, 17.0, 28.0, 24.0, 46.0, 70.0, 75.0, 244.0, 254.0, 427.0, 637.0, 1114.0, 2074.0, 3677.0, 6974.0, 13834.0, 29260.0, 64215.0, 295868.0, 357860.0, 149274.0, 63889.0, 28891.0, 13942.0, 7028.0, 3682.0, 2064.0, 1183.0, 908.0, 321.0, 191.0, 152.0, 90.0, 59.0, 46.0, 21.0, 16.0, 15.0, 9.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-4.172325134277344e-06, -4.04752790927887e-06, -3.9227306842803955e-06, -3.7979334592819214e-06, -3.6731362342834473e-06, -3.548339009284973e-06, -3.423541784286499e-06, -3.298744559288025e-06, -3.1739473342895508e-06, -3.0491501092910767e-06, -2.9243528842926025e-06, -2.7995556592941284e-06, -2.6747584342956543e-06, -2.54996120929718e-06, -2.425163984298706e-06, -2.300366759300232e-06, -2.175569534301758e-06, -2.0507723093032837e-06, -1.9259750843048096e-06, -1.8011778593063354e-06, -1.6763806343078613e-06, -1.5515834093093872e-06, -1.426786184310913e-06, -1.301988959312439e-06, -1.1771917343139648e-06, -1.0523945093154907e-06, -9.275972843170166e-07, -8.028000593185425e-07, -6.780028343200684e-07, -5.532056093215942e-07, -4.284083843231201e-07, -3.03611159324646e-07, -1.7881393432617188e-07, -5.4016709327697754e-08, 7.078051567077637e-08, 1.955777406692505e-07, 3.203749656677246e-07, 4.4517219066619873e-07, 5.699694156646729e-07, 6.94766640663147e-07, 8.195638656616211e-07, 9.443610906600952e-07, 1.0691583156585693e-06, 1.1939555406570435e-06, 1.3187527656555176e-06, 1.4435499906539917e-06, 1.5683472156524658e-06, 1.69314444065094e-06, 1.817941665649414e-06, 1.942738890647888e-06, 2.0675361156463623e-06, 2.1923333406448364e-06, 2.3171305656433105e-06, 2.4419277906417847e-06, 2.566725015640259e-06, 2.691522240638733e-06, 2.816319465637207e-06, 2.941116690635681e-06, 3.0659139156341553e-06, 3.1907111406326294e-06, 3.3155083656311035e-06, 3.4403055906295776e-06, 3.5651028156280518e-06, 3.689900040626526e-06, 3.814697265625e-06]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 5.0, 2.0, 6.0, 19.0, 12.0, 15.0, 12.0, 21.0, 27.0, 24.0, 32.0, 38.0, 37.0, 38.0, 41.0, 41.0, 83.0, 54.0, 46.0, 53.0, 47.0, 36.0, 38.0, 48.0, 31.0, 41.0, 35.0, 22.0, 26.0, 27.0, 10.0, 7.0, 7.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6642734408378601e-06, -1.600012183189392e-06, -1.535750925540924e-06, -1.471489667892456e-06, -1.407228410243988e-06, -1.34296715259552e-06, -1.278705894947052e-06, -1.214444637298584e-06, -1.150183379650116e-06, -1.085922122001648e-06, -1.02166086435318e-06, -9.57399606704712e-07, -8.931383490562439e-07, -8.288770914077759e-07, -7.646158337593079e-07, -7.003545761108398e-07, -6.360933184623718e-07, -5.718320608139038e-07, -5.075708031654358e-07, -4.4330954551696777e-07, -3.7904828786849976e-07, -3.1478703022003174e-07, -2.505257725715637e-07, -1.862645149230957e-07, -1.2200325727462769e-07, -5.774199962615967e-08, 6.51925802230835e-09, 7.078051567077637e-08, 1.3504177331924438e-07, 1.993030309677124e-07, 2.635642886161804e-07, 3.2782554626464844e-07, 3.9208680391311646e-07, 4.5634806156158447e-07, 5.206093192100525e-07, 5.848705768585205e-07, 6.491318345069885e-07, 7.133930921554565e-07, 7.776543498039246e-07, 8.419156074523926e-07, 9.061768651008606e-07, 9.704381227493286e-07, 1.0346993803977966e-06, 1.0989606380462646e-06, 1.1632218956947327e-06, 1.2274831533432007e-06, 1.2917444109916687e-06, 1.3560056686401367e-06, 1.4202669262886047e-06, 1.4845281839370728e-06, 1.5487894415855408e-06, 1.6130506992340088e-06, 1.6773119568824768e-06, 1.7415732145309448e-06, 1.8058344721794128e-06, 1.8700957298278809e-06, 1.934356987476349e-06, 1.998618245124817e-06, 2.062879502773285e-06, 2.127140760421753e-06, 2.191402018070221e-06, 2.255663275718689e-06, 2.319924533367157e-06, 2.384185791015625e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 5.0, 7.0, 12.0, 10.0, 15.0, 15.0, 23.0, 37.0, 67.0, 143.0, 171.0, 282.0, 516.0, 985.0, 1987.0, 4192.0, 18334.0, 37673.0, 114963.0, 519485.0, 244665.0, 63743.0, 23293.0, 11921.0, 2844.0, 1398.0, 746.0, 394.0, 218.0, 126.0, 112.0, 43.0, 26.0, 28.0, 11.0, 14.0, 7.0, 19.0, 6.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0531158447265625e-06, -3.925524652004242e-06, -3.7979334592819214e-06, -3.670342266559601e-06, -3.5427510738372803e-06, -3.4151598811149597e-06, -3.287568688392639e-06, -3.1599774956703186e-06, -3.032386302947998e-06, -2.9047951102256775e-06, -2.777203917503357e-06, -2.6496127247810364e-06, -2.522021532058716e-06, -2.3944303393363953e-06, -2.2668391466140747e-06, -2.139247953891754e-06, -2.0116567611694336e-06, -1.884065568447113e-06, -1.7564743757247925e-06, -1.628883183002472e-06, -1.5012919902801514e-06, -1.3737007975578308e-06, -1.2461096048355103e-06, -1.1185184121131897e-06, -9.909272193908691e-07, -8.633360266685486e-07, -7.35744833946228e-07, -6.081536412239075e-07, -4.805624485015869e-07, -3.5297125577926636e-07, -2.253800630569458e-07, -9.778887033462524e-08, 2.9802322387695312e-08, 1.5739351511001587e-07, 2.849847078323364e-07, 4.12575900554657e-07, 5.401670932769775e-07, 6.677582859992981e-07, 7.953494787216187e-07, 9.229406714439392e-07, 1.0505318641662598e-06, 1.1781230568885803e-06, 1.3057142496109009e-06, 1.4333054423332214e-06, 1.560896635055542e-06, 1.6884878277778625e-06, 1.816079020500183e-06, 1.9436702132225037e-06, 2.0712614059448242e-06, 2.1988525986671448e-06, 2.3264437913894653e-06, 2.454034984111786e-06, 2.5816261768341064e-06, 2.709217369556427e-06, 2.8368085622787476e-06, 2.964399755001068e-06, 3.0919909477233887e-06, 3.2195821404457092e-06, 3.3471733331680298e-06, 3.4747645258903503e-06, 3.602355718612671e-06, 3.7299469113349915e-06, 3.857538104057312e-06, 3.9851292967796326e-06, 4.112720489501953e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 10.0, 14.0, 31.0, 17.0, 59.0, 26.0, 82.0, 26.0, 99.0, 65.0, 150.0, 61.0, 99.0, 47.0, 69.0, 19.0, 45.0, 15.0, 17.0, 7.0, 14.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.814697265625e-06, -3.7243589758872986e-06, -3.634020686149597e-06, -3.5436823964118958e-06, -3.4533441066741943e-06, -3.363005816936493e-06, -3.2726675271987915e-06, -3.18232923746109e-06, -3.0919909477233887e-06, -3.0016526579856873e-06, -2.911314368247986e-06, -2.8209760785102844e-06, -2.730637788772583e-06, -2.6402994990348816e-06, -2.54996120929718e-06, -2.4596229195594788e-06, -2.3692846298217773e-06, -2.278946340084076e-06, -2.1886080503463745e-06, -2.098269760608673e-06, -2.0079314708709717e-06, -1.9175931811332703e-06, -1.8272548913955688e-06, -1.7369166016578674e-06, -1.646578311920166e-06, -1.5562400221824646e-06, -1.4659017324447632e-06, -1.3755634427070618e-06, -1.2852251529693604e-06, -1.194886863231659e-06, -1.1045485734939575e-06, -1.014210283756256e-06, -9.238719940185547e-07, -8.335337042808533e-07, -7.431954145431519e-07, -6.528571248054504e-07, -5.62518835067749e-07, -4.721805453300476e-07, -3.818422555923462e-07, -2.915039658546448e-07, -2.0116567611694336e-07, -1.1082738637924194e-07, -2.0489096641540527e-08, 6.984919309616089e-08, 1.601874828338623e-07, 2.505257725715637e-07, 3.4086406230926514e-07, 4.3120235204696655e-07, 5.21540641784668e-07, 6.118789315223694e-07, 7.022172212600708e-07, 7.925555109977722e-07, 8.828938007354736e-07, 9.73232090473175e-07, 1.0635703802108765e-06, 1.1539086699485779e-06, 1.2442469596862793e-06, 1.3345852494239807e-06, 1.4249235391616821e-06, 1.5152618288993835e-06, 1.605600118637085e-06, 1.6959384083747864e-06, 1.7862766981124878e-06, 1.8766149878501892e-06, 1.9669532775878906e-06]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 13.0, 17.0, 42.0, 79.0, 164.0, 224.0, 115.0, 73.0, 55.0, 33.0, 35.0, 29.0, 24.0, 9.0, 16.0, 14.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 6.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.116457658819854e-05, -8.470849570585415e-05, -7.825241482350975e-05, -7.179633394116536e-05, -6.534025305882096e-05, -5.888417217647657e-05, -5.242809129413217e-05, -4.597201041178778e-05, -3.951592952944338e-05, -3.305984864709899e-05, -2.6603767764754593e-05, -2.01476868824102e-05, -1.3691606000065804e-05, -7.235525117721409e-06, -7.794442353770137e-07, 5.676636646967381e-06, 1.2132717529311776e-05, 1.858879841165617e-05, 2.5044879294000566e-05, 3.150096017634496e-05, 3.7957041058689356e-05, 4.441312194103375e-05, 5.0869202823378146e-05, 5.732528370572254e-05, 6.378136458806694e-05, 7.023744547041133e-05, 7.669352635275573e-05, 8.314960723510012e-05, 8.960568811744452e-05, 9.606176899978891e-05, 0.0001025178498821333, 0.0001089739307644777, 0.0001154300116468221, 0.00012188609252916649, 0.00012834217341151088, 0.0001347982615698129, 0.00014125433517619967, 0.00014771040878258646, 0.00015416649694088846, 0.00016062258509919047, 0.00016707865870557725, 0.00017353473231196404, 0.00017999082047026604, 0.00018644690862856805, 0.00019290298223495483, 0.00019935905584134161, 0.00020581514399964362, 0.00021227123215794563, 0.00021872730576433241, 0.0002251833793707192, 0.0002316394675290212, 0.0002380955556873232, 0.00024455162929371, 0.0002510077029000968, 0.00025746377650648355, 0.0002639198792167008, 0.0002703759528230876, 0.00027683202642947435, 0.0002832881291396916, 0.00028974420274607837, 0.00029620027635246515, 0.00030265634995885193, 0.0003091124235652387, 0.00031556852627545595, 0.00032202459988184273]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 5.0, 4.0, 10.0, 10.0, 10.0, 11.0, 17.0, 9.0, 24.0, 36.0, 32.0, 34.0, 41.0, 34.0, 39.0, 40.0, 50.0, 49.0, 45.0, 55.0, 50.0, 48.0, 32.0, 41.0, 34.0, 26.0, 40.0, 25.0, 27.0, 22.0, 14.0, 9.0, 16.0, 6.0, 15.0, 9.0, 7.0, 6.0, 4.0, 4.0, 3.0, 8.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.846687316894531e-05, -9.508151561021805e-05, -9.169615805149078e-05, -8.831080049276352e-05, -8.492544293403625e-05, -8.154008537530899e-05, -7.815472781658173e-05, -7.476937025785446e-05, -7.13840126991272e-05, -6.799865514039993e-05, -6.461329758167267e-05, -6.12279400229454e-05, -5.784258246421814e-05, -5.4457224905490875e-05, -5.107186734676361e-05, -4.7686509788036346e-05, -4.430115222930908e-05, -4.091579467058182e-05, -3.753043711185455e-05, -3.414507955312729e-05, -3.0759721994400024e-05, -2.737436443567276e-05, -2.3989006876945496e-05, -2.060364931821823e-05, -1.7218291759490967e-05, -1.3832934200763702e-05, -1.0447576642036438e-05, -7.062219083309174e-06, -3.676861524581909e-06, -2.915039658546448e-07, 3.0938535928726196e-06, 6.479211151599884e-06, 9.864568710327148e-06, 1.3249926269054413e-05, 1.6635283827781677e-05, 2.002064138650894e-05, 2.3405998945236206e-05, 2.679135650396347e-05, 3.0176714062690735e-05, 3.3562071621418e-05, 3.6947429180145264e-05, 4.033278673887253e-05, 4.371814429759979e-05, 4.710350185632706e-05, 5.048885941505432e-05, 5.3874216973781586e-05, 5.725957453250885e-05, 6.0644932091236115e-05, 6.403028964996338e-05, 6.741564720869064e-05, 7.080100476741791e-05, 7.418636232614517e-05, 7.757171988487244e-05, 8.09570774435997e-05, 8.434243500232697e-05, 8.772779256105423e-05, 9.11131501197815e-05, 9.449850767850876e-05, 9.788386523723602e-05, 0.00010126922279596329, 0.00010465458035469055, 0.00010803993791341782, 0.00011142529547214508, 0.00011481065303087234, 0.00011819601058959961]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 25.0, 63.0, 77.0, 122.0, 186.0, 319.0, 514.0, 825.0, 1540.0, 2796.0, 5558.0, 14029.0, 44694.0, 3834363.0, 237493.0, 29775.0, 10606.0, 4913.0, 2429.0, 1409.0, 875.0, 552.0, 328.0, 200.0, 126.0, 122.0, 81.0, 41.0, 24.0, 38.0, 22.0, 18.0, 18.0, 11.0, 9.0, 8.0, 7.0, 7.0, 3.0, 11.0, 8.0, 7.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.784366607666016e-05, -7.410906255245209e-05, -7.037445902824402e-05, -6.663985550403595e-05, -6.290525197982788e-05, -5.917064845561981e-05, -5.543604493141174e-05, -5.1701441407203674e-05, -4.7966837882995605e-05, -4.423223435878754e-05, -4.049763083457947e-05, -3.67630273103714e-05, -3.302842378616333e-05, -2.929382026195526e-05, -2.5559216737747192e-05, -2.1824613213539124e-05, -1.8090009689331055e-05, -1.4355406165122986e-05, -1.0620802640914917e-05, -6.886199116706848e-06, -3.1515955924987793e-06, 5.830079317092896e-07, 4.317611455917358e-06, 8.052214980125427e-06, 1.1786818504333496e-05, 1.5521422028541565e-05, 1.9256025552749634e-05, 2.2990629076957703e-05, 2.672523260116577e-05, 3.045983612537384e-05, 3.419443964958191e-05, 3.792904317378998e-05, 4.166364669799805e-05, 4.5398250222206116e-05, 4.9132853746414185e-05, 5.2867457270622253e-05, 5.660206079483032e-05, 6.033666431903839e-05, 6.407126784324646e-05, 6.780587136745453e-05, 7.15404748916626e-05, 7.527507841587067e-05, 7.900968194007874e-05, 8.27442854642868e-05, 8.647888898849487e-05, 9.021349251270294e-05, 9.394809603691101e-05, 9.768269956111908e-05, 0.00010141730308532715, 0.00010515190660953522, 0.00010888651013374329, 0.00011262111365795135, 0.00011635571718215942, 0.00012009032070636749, 0.00012382492423057556, 0.00012755952775478363, 0.0001312941312789917, 0.00013502873480319977, 0.00013876333832740784, 0.0001424979418516159, 0.00014623254537582397, 0.00014996714890003204, 0.0001537017524242401, 0.00015743635594844818, 0.00016117095947265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 5.0, 2.0, 15.0, 10.0, 15.0, 16.0, 29.0, 64.0, 75.0, 100.0, 133.0, 90.0, 113.0, 103.0, 74.0, 35.0, 41.0, 28.0, 11.0, 7.0, 8.0, 8.0, 5.0, 8.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4722347259521484e-05, -1.400243490934372e-05, -1.3282522559165955e-05, -1.256261020898819e-05, -1.1842697858810425e-05, -1.112278550863266e-05, -1.0402873158454895e-05, -9.68296080827713e-06, -8.963048458099365e-06, -8.2431361079216e-06, -7.5232237577438354e-06, -6.8033114075660706e-06, -6.083399057388306e-06, -5.363486707210541e-06, -4.643574357032776e-06, -3.923662006855011e-06, -3.203749656677246e-06, -2.483837306499481e-06, -1.7639249563217163e-06, -1.0440126061439514e-06, -3.241002559661865e-07, 3.9581209421157837e-07, 1.1157244443893433e-06, 1.8356367945671082e-06, 2.555549144744873e-06, 3.275461494922638e-06, 3.995373845100403e-06, 4.715286195278168e-06, 5.435198545455933e-06, 6.1551108956336975e-06, 6.875023245811462e-06, 7.594935595989227e-06, 8.314847946166992e-06, 9.034760296344757e-06, 9.754672646522522e-06, 1.0474584996700287e-05, 1.1194497346878052e-05, 1.1914409697055817e-05, 1.2634322047233582e-05, 1.3354234397411346e-05, 1.4074146747589111e-05, 1.4794059097766876e-05, 1.551397144794464e-05, 1.6233883798122406e-05, 1.695379614830017e-05, 1.7673708498477936e-05, 1.83936208486557e-05, 1.9113533198833466e-05, 1.983344554901123e-05, 2.0553357899188995e-05, 2.127327024936676e-05, 2.1993182599544525e-05, 2.271309494972229e-05, 2.3433007299900055e-05, 2.415291965007782e-05, 2.4872832000255585e-05, 2.559274435043335e-05, 2.6312656700611115e-05, 2.703256905078888e-05, 2.7752481400966644e-05, 2.847239375114441e-05, 2.9192306101322174e-05, 2.991221845149994e-05, 3.0632130801677704e-05, 3.135204315185547e-05]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 8.0, 14.0, 18.0, 31.0, 50.0, 66.0, 79.0, 162.0, 212.0, 344.0, 525.0, 848.0, 1451.0, 2507.0, 3948.0, 7377.0, 14006.0, 28249.0, 77208.0, 2706817.0, 1211510.0, 78179.0, 28934.0, 14019.0, 7116.0, 4353.0, 2409.0, 1402.0, 864.0, 552.0, 367.0, 203.0, 154.0, 95.0, 58.0, 37.0, 33.0, 17.0, 20.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1140785217285156e-05, -4.949048161506653e-05, -4.78401780128479e-05, -4.618987441062927e-05, -4.4539570808410645e-05, -4.2889267206192017e-05, -4.123896360397339e-05, -3.958866000175476e-05, -3.793835639953613e-05, -3.6288052797317505e-05, -3.463774919509888e-05, -3.298744559288025e-05, -3.133714199066162e-05, -2.9686838388442993e-05, -2.8036534786224365e-05, -2.6386231184005737e-05, -2.473592758178711e-05, -2.308562397956848e-05, -2.1435320377349854e-05, -1.9785016775131226e-05, -1.8134713172912598e-05, -1.648440957069397e-05, -1.4834105968475342e-05, -1.3183802366256714e-05, -1.1533498764038086e-05, -9.883195161819458e-06, -8.23289155960083e-06, -6.582587957382202e-06, -4.932284355163574e-06, -3.2819807529449463e-06, -1.6316771507263184e-06, 1.862645149230957e-08, 1.6689300537109375e-06, 3.3192336559295654e-06, 4.969537258148193e-06, 6.619840860366821e-06, 8.27014446258545e-06, 9.920448064804077e-06, 1.1570751667022705e-05, 1.3221055269241333e-05, 1.4871358871459961e-05, 1.652166247367859e-05, 1.8171966075897217e-05, 1.9822269678115845e-05, 2.1472573280334473e-05, 2.31228768825531e-05, 2.477318048477173e-05, 2.6423484086990356e-05, 2.8073787689208984e-05, 2.9724091291427612e-05, 3.137439489364624e-05, 3.302469849586487e-05, 3.4675002098083496e-05, 3.6325305700302124e-05, 3.797560930252075e-05, 3.962591290473938e-05, 4.127621650695801e-05, 4.2926520109176636e-05, 4.4576823711395264e-05, 4.622712731361389e-05, 4.787743091583252e-05, 4.952773451805115e-05, 5.1178038120269775e-05, 5.28283417224884e-05, 5.447864532470703e-05]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 5.0, 8.0, 5.0, 11.0, 20.0, 19.0, 27.0, 47.0, 67.0, 183.0, 634.0, 2274.0, 362.0, 104.0, 46.0, 47.0, 40.0, 19.0, 14.0, 15.0, 20.0, 18.0, 17.0, 12.0, 4.0, 7.0, 8.0, 9.0, 3.0, 9.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4080276489257812e-05, -2.3000873625278473e-05, -2.1921470761299133e-05, -2.0842067897319794e-05, -1.9762665033340454e-05, -1.8683262169361115e-05, -1.7603859305381775e-05, -1.6524456441402435e-05, -1.5445053577423096e-05, -1.4365650713443756e-05, -1.3286247849464417e-05, -1.2206844985485077e-05, -1.1127442121505737e-05, -1.0048039257526398e-05, -8.968636393547058e-06, -7.889233529567719e-06, -6.809830665588379e-06, -5.730427801609039e-06, -4.6510249376297e-06, -3.57162207365036e-06, -2.4922192096710205e-06, -1.412816345691681e-06, -3.334134817123413e-07, 7.459893822669983e-07, 1.8253922462463379e-06, 2.9047951102256775e-06, 3.984197974205017e-06, 5.063600838184357e-06, 6.143003702163696e-06, 7.222406566143036e-06, 8.301809430122375e-06, 9.381212294101715e-06, 1.0460615158081055e-05, 1.1540018022060394e-05, 1.2619420886039734e-05, 1.3698823750019073e-05, 1.4778226613998413e-05, 1.5857629477977753e-05, 1.6937032341957092e-05, 1.8016435205936432e-05, 1.909583806991577e-05, 2.017524093389511e-05, 2.125464379787445e-05, 2.233404666185379e-05, 2.341344952583313e-05, 2.449285238981247e-05, 2.557225525379181e-05, 2.665165811777115e-05, 2.7731060981750488e-05, 2.8810463845729828e-05, 2.9889866709709167e-05, 3.096926957368851e-05, 3.204867243766785e-05, 3.3128075301647186e-05, 3.4207478165626526e-05, 3.5286881029605865e-05, 3.6366283893585205e-05, 3.7445686757564545e-05, 3.8525089621543884e-05, 3.9604492485523224e-05, 4.0683895349502563e-05, 4.17632982134819e-05, 4.284270107746124e-05, 4.392210394144058e-05, 4.500150680541992e-05]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 9.0, 15.0, 18.0, 37.0, 53.0, 76.0, 154.0, 158.0, 105.0, 81.0, 58.0, 59.0, 33.0, 22.0, 26.0, 21.0, 18.0, 9.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013057143951300532, -0.0001240523997694254, -0.00011753334547393024, -0.0001110142984543927, -0.00010449525143485516, -9.797620441531762e-05, -9.145715739578009e-05, -8.493811037624255e-05, -7.841906335670501e-05, -7.190001633716747e-05, -6.538096931762993e-05, -5.8861922298092395e-05, -5.234287527855486e-05, -4.582382825901732e-05, -3.930478123947978e-05, -3.278573421994224e-05, -2.6266687200404704e-05, -1.9747640180867165e-05, -1.3228593161329627e-05, -6.709546141792089e-06, -1.9049912225455046e-07, 6.328547897282988e-06, 1.2847594916820526e-05, 1.9366641936358064e-05, 2.5885688955895603e-05, 3.240473597543314e-05, 3.892378299497068e-05, 4.544283001450822e-05, 5.1961877034045756e-05, 5.8480924053583294e-05, 6.499997107312083e-05, 7.151901809265837e-05, 7.803805056028068e-05, 8.455709757981822e-05, 9.107614459935576e-05, 9.75951916188933e-05, 0.00010411423863843083, 0.00011063328565796837, 0.00011715233267750591, 0.00012367137242108583, 0.000130190426716581, 0.00013670948101207614, 0.00014322852075565606, 0.000149747560499236, 0.00015626661479473114, 0.0001627856690902263, 0.00016930470883380622, 0.00017582374857738614, 0.0001823428028728813, 0.00018886185716837645, 0.00019538089691195637, 0.0002018999366555363, 0.00020841899095103145, 0.0002149380452465266, 0.00022145708499010652, 0.00022797612473368645, 0.0002344951790291816, 0.00024101423332467675, 0.00024753325851634145, 0.0002540523128118366, 0.00026057136710733175, 0.0002670904214028269, 0.00027360947569832206, 0.00028012850088998675, 0.0002866475551854819]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 11.0, 4.0, 6.0, 15.0, 8.0, 16.0, 13.0, 19.0, 25.0, 17.0, 21.0, 22.0, 34.0, 38.0, 36.0, 35.0, 31.0, 35.0, 36.0, 40.0, 22.0, 48.0, 35.0, 38.0, 30.0, 33.0, 34.0, 45.0, 33.0, 29.0, 27.0, 32.0, 18.0, 25.0, 15.0, 13.0, 14.0, 13.0, 12.0, 5.0, 6.0, 3.0, 6.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.34600830078125e-05, -9.044818580150604e-05, -8.743628859519958e-05, -8.442439138889313e-05, -8.141249418258667e-05, -7.840059697628021e-05, -7.538869976997375e-05, -7.23768025636673e-05, -6.936490535736084e-05, -6.635300815105438e-05, -6.334111094474792e-05, -6.032921373844147e-05, -5.731731653213501e-05, -5.430541932582855e-05, -5.1293522119522095e-05, -4.828162491321564e-05, -4.526972770690918e-05, -4.225783050060272e-05, -3.9245933294296265e-05, -3.623403608798981e-05, -3.322213888168335e-05, -3.0210241675376892e-05, -2.7198344469070435e-05, -2.4186447262763977e-05, -2.117455005645752e-05, -1.8162652850151062e-05, -1.5150755643844604e-05, -1.2138858437538147e-05, -9.12696123123169e-06, -6.115064024925232e-06, -3.1031668186187744e-06, -9.12696123123169e-08, 2.9206275939941406e-06, 5.932524800300598e-06, 8.944422006607056e-06, 1.1956319212913513e-05, 1.496821641921997e-05, 1.7980113625526428e-05, 2.0992010831832886e-05, 2.4003908038139343e-05, 2.70158052444458e-05, 3.0027702450752258e-05, 3.3039599657058716e-05, 3.605149686336517e-05, 3.906339406967163e-05, 4.207529127597809e-05, 4.5087188482284546e-05, 4.8099085688591003e-05, 5.111098289489746e-05, 5.412288010120392e-05, 5.7134777307510376e-05, 6.0146674513816833e-05, 6.315857172012329e-05, 6.617046892642975e-05, 6.91823661327362e-05, 7.219426333904266e-05, 7.520616054534912e-05, 7.821805775165558e-05, 8.122995495796204e-05, 8.42418521642685e-05, 8.725374937057495e-05, 9.026564657688141e-05, 9.327754378318787e-05, 9.628944098949432e-05, 9.930133819580078e-05]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 4.0, 6.0, 8.0, 8.0, 15.0, 10.0, 16.0, 14.0, 16.0, 34.0, 57.0, 96.0, 168.0, 390.0, 795.0, 1764.0, 4153.0, 11403.0, 39417.0, 251289.0, 639695.0, 71455.0, 17206.0, 6036.0, 2379.0, 1013.0, 497.0, 237.0, 114.0, 60.0, 40.0, 33.0, 23.0, 24.0, 19.0, 11.0, 7.0, 8.0, 7.0, 4.0, 3.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000179290771484375, -0.0001741945743560791, -0.0001690983772277832, -0.0001640021800994873, -0.0001589059829711914, -0.0001538097858428955, -0.0001487135887145996, -0.0001436173915863037, -0.0001385211944580078, -0.00013342499732971191, -0.00012832880020141602, -0.00012323260307312012, -0.00011813640594482422, -0.00011304020881652832, -0.00010794401168823242, -0.00010284781455993652, -9.775161743164062e-05, -9.265542030334473e-05, -8.755922317504883e-05, -8.246302604675293e-05, -7.736682891845703e-05, -7.227063179016113e-05, -6.717443466186523e-05, -6.207823753356934e-05, -5.698204040527344e-05, -5.188584327697754e-05, -4.678964614868164e-05, -4.169344902038574e-05, -3.6597251892089844e-05, -3.1501054763793945e-05, -2.6404857635498047e-05, -2.130866050720215e-05, -1.621246337890625e-05, -1.1116266250610352e-05, -6.020069122314453e-06, -9.238719940185547e-07, 4.172325134277344e-06, 9.268522262573242e-06, 1.436471939086914e-05, 1.946091651916504e-05, 2.4557113647460938e-05, 2.9653310775756836e-05, 3.4749507904052734e-05, 3.984570503234863e-05, 4.494190216064453e-05, 5.003809928894043e-05, 5.513429641723633e-05, 6.0230493545532227e-05, 6.532669067382812e-05, 7.042288780212402e-05, 7.551908493041992e-05, 8.061528205871582e-05, 8.571147918701172e-05, 9.080767631530762e-05, 9.590387344360352e-05, 0.00010100007057189941, 0.00010609626770019531, 0.00011119246482849121, 0.00011628866195678711, 0.00012138485908508301, 0.0001264810562133789, 0.0001315772533416748, 0.0001366734504699707, 0.0001417696475982666, 0.0001468658447265625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0, 7.0, 16.0, 18.0, 22.0, 35.0, 57.0, 84.0, 126.0, 119.0, 121.0, 111.0, 98.0, 62.0, 38.0, 24.0, 21.0, 8.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.451931893825531e-05, -1.372024416923523e-05, -1.2921169400215149e-05, -1.2122094631195068e-05, -1.1323019862174988e-05, -1.0523945093154907e-05, -9.724870324134827e-06, -8.925795555114746e-06, -8.126720786094666e-06, -7.327646017074585e-06, -6.528571248054504e-06, -5.729496479034424e-06, -4.930421710014343e-06, -4.131346940994263e-06, -3.332272171974182e-06, -2.5331974029541016e-06, -1.734122633934021e-06, -9.350478649139404e-07, -1.3597309589385986e-07, 6.631016731262207e-07, 1.4621764421463013e-06, 2.261251211166382e-06, 3.0603259801864624e-06, 3.859400749206543e-06, 4.6584755182266235e-06, 5.457550287246704e-06, 6.256625056266785e-06, 7.055699825286865e-06, 7.854774594306946e-06, 8.653849363327026e-06, 9.452924132347107e-06, 1.0251998901367188e-05, 1.1051073670387268e-05, 1.1850148439407349e-05, 1.264922320842743e-05, 1.344829797744751e-05, 1.424737274646759e-05, 1.5046447515487671e-05, 1.584552228450775e-05, 1.6644597053527832e-05, 1.7443671822547913e-05, 1.8242746591567993e-05, 1.9041821360588074e-05, 1.9840896129608154e-05, 2.0639970898628235e-05, 2.1439045667648315e-05, 2.2238120436668396e-05, 2.3037195205688477e-05, 2.3836269974708557e-05, 2.4635344743728638e-05, 2.5434419512748718e-05, 2.62334942817688e-05, 2.703256905078888e-05, 2.783164381980896e-05, 2.863071858882904e-05, 2.942979335784912e-05, 3.02288681268692e-05, 3.102794289588928e-05, 3.182701766490936e-05, 3.262609243392944e-05, 3.3425167202949524e-05, 3.4224241971969604e-05, 3.5023316740989685e-05, 3.5822391510009766e-05]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 10.0, 15.0, 16.0, 18.0, 26.0, 54.0, 69.0, 96.0, 136.0, 231.0, 319.0, 489.0, 743.0, 1121.0, 1764.0, 2908.0, 4271.0, 7077.0, 11403.0, 17691.0, 32126.0, 54960.0, 117338.0, 364905.0, 222337.0, 93271.0, 47428.0, 25400.0, 15915.0, 9797.0, 5823.0, 3789.0, 2373.0, 1671.0, 1009.0, 664.0, 420.0, 267.0, 206.0, 135.0, 82.0, 58.0, 41.0, 25.0, 22.0, 13.0, 7.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.6716461181640625e-05, -3.548618406057358e-05, -3.425590693950653e-05, -3.3025629818439484e-05, -3.1795352697372437e-05, -3.056507557630539e-05, -2.9334798455238342e-05, -2.8104521334171295e-05, -2.6874244213104248e-05, -2.56439670920372e-05, -2.4413689970970154e-05, -2.3183412849903107e-05, -2.195313572883606e-05, -2.0722858607769012e-05, -1.9492581486701965e-05, -1.8262304365634918e-05, -1.703202724456787e-05, -1.5801750123500824e-05, -1.4571473002433777e-05, -1.334119588136673e-05, -1.2110918760299683e-05, -1.0880641639232635e-05, -9.650364518165588e-06, -8.420087397098541e-06, -7.189810276031494e-06, -5.959533154964447e-06, -4.7292560338974e-06, -3.4989789128303528e-06, -2.2687017917633057e-06, -1.0384246706962585e-06, 1.9185245037078857e-07, 1.4221295714378357e-06, 2.652406692504883e-06, 3.88268381357193e-06, 5.112960934638977e-06, 6.343238055706024e-06, 7.573515176773071e-06, 8.803792297840118e-06, 1.0034069418907166e-05, 1.1264346539974213e-05, 1.249462366104126e-05, 1.3724900782108307e-05, 1.4955177903175354e-05, 1.61854550242424e-05, 1.7415732145309448e-05, 1.8646009266376495e-05, 1.9876286387443542e-05, 2.110656350851059e-05, 2.2336840629577637e-05, 2.3567117750644684e-05, 2.479739487171173e-05, 2.6027671992778778e-05, 2.7257949113845825e-05, 2.8488226234912872e-05, 2.971850335597992e-05, 3.0948780477046967e-05, 3.2179057598114014e-05, 3.340933471918106e-05, 3.463961184024811e-05, 3.5869888961315155e-05, 3.71001660823822e-05, 3.833044320344925e-05, 3.9560720324516296e-05, 4.0790997445583344e-05, 4.202127456665039e-05]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 0.0, 5.0, 6.0, 10.0, 5.0, 13.0, 4.0, 10.0, 10.0, 19.0, 14.0, 20.0, 29.0, 33.0, 26.0, 37.0, 28.0, 32.0, 33.0, 54.0, 35.0, 35.0, 54.0, 47.0, 46.0, 46.0, 38.0, 46.0, 39.0, 30.0, 26.0, 23.0, 18.0, 13.0, 22.0, 15.0, 18.0, 10.0, 13.0, 3.0, 12.0, 7.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-3.6835670471191406e-05, -3.5814009606838226e-05, -3.4792348742485046e-05, -3.3770687878131866e-05, -3.2749027013778687e-05, -3.1727366149425507e-05, -3.070570528507233e-05, -2.9684044420719147e-05, -2.8662383556365967e-05, -2.7640722692012787e-05, -2.6619061827659607e-05, -2.5597400963306427e-05, -2.4575740098953247e-05, -2.3554079234600067e-05, -2.2532418370246887e-05, -2.1510757505893707e-05, -2.0489096641540527e-05, -1.9467435777187347e-05, -1.8445774912834167e-05, -1.7424114048480988e-05, -1.6402453184127808e-05, -1.5380792319774628e-05, -1.4359131455421448e-05, -1.3337470591068268e-05, -1.2315809726715088e-05, -1.1294148862361908e-05, -1.0272487998008728e-05, -9.250827133655548e-06, -8.229166269302368e-06, -7.207505404949188e-06, -6.185844540596008e-06, -5.164183676242828e-06, -4.1425228118896484e-06, -3.1208619475364685e-06, -2.0992010831832886e-06, -1.0775402188301086e-06, -5.587935447692871e-08, 9.657815098762512e-07, 1.987442374229431e-06, 3.009103238582611e-06, 4.030764102935791e-06, 5.052424967288971e-06, 6.074085831642151e-06, 7.095746695995331e-06, 8.11740756034851e-06, 9.13906842470169e-06, 1.016072928905487e-05, 1.118239015340805e-05, 1.220405101776123e-05, 1.322571188211441e-05, 1.424737274646759e-05, 1.526903361082077e-05, 1.629069447517395e-05, 1.731235533952713e-05, 1.833401620388031e-05, 1.935567706823349e-05, 2.037733793258667e-05, 2.139899879693985e-05, 2.242065966129303e-05, 2.344232052564621e-05, 2.446398138999939e-05, 2.548564225435257e-05, 2.650730311870575e-05, 2.752896398305893e-05, 2.855062484741211e-05]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 13.0, 12.0, 24.0, 52.0, 72.0, 252.0, 307.0, 642.0, 2445.0, 4313.0, 20894.0, 45676.0, 139685.0, 619488.0, 139741.0, 56107.0, 10686.0, 4328.0, 2479.0, 625.0, 417.0, 118.0, 65.0, 57.0, 25.0, 7.0, 11.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.625879228115082e-06, -4.4833868741989136e-06, -4.340894520282745e-06, -4.198402166366577e-06, -4.055909812450409e-06, -3.913417458534241e-06, -3.7709251046180725e-06, -3.6284327507019043e-06, -3.485940396785736e-06, -3.343448042869568e-06, -3.2009556889533997e-06, -3.0584633350372314e-06, -2.9159709811210632e-06, -2.773478627204895e-06, -2.630986273288727e-06, -2.4884939193725586e-06, -2.3460015654563904e-06, -2.203509211540222e-06, -2.061016857624054e-06, -1.9185245037078857e-06, -1.7760321497917175e-06, -1.6335397958755493e-06, -1.491047441959381e-06, -1.3485550880432129e-06, -1.2060627341270447e-06, -1.0635703802108765e-06, -9.210780262947083e-07, -7.7858567237854e-07, -6.360933184623718e-07, -4.936009645462036e-07, -3.511086106300354e-07, -2.086162567138672e-07, -6.612390279769897e-08, 7.636845111846924e-08, 2.1886080503463745e-07, 3.6135315895080566e-07, 5.038455128669739e-07, 6.463378667831421e-07, 7.888302206993103e-07, 9.313225746154785e-07, 1.0738149285316467e-06, 1.216307282447815e-06, 1.3587996363639832e-06, 1.5012919902801514e-06, 1.6437843441963196e-06, 1.7862766981124878e-06, 1.928769052028656e-06, 2.0712614059448242e-06, 2.2137537598609924e-06, 2.3562461137771606e-06, 2.498738467693329e-06, 2.641230821609497e-06, 2.7837231755256653e-06, 2.9262155294418335e-06, 3.0687078833580017e-06, 3.21120023727417e-06, 3.353692591190338e-06, 3.4961849451065063e-06, 3.6386772990226746e-06, 3.7811696529388428e-06, 3.923662006855011e-06, 4.066154360771179e-06, 4.208646714687347e-06, 4.351139068603516e-06]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 0.0, 16.0, 12.0, 0.0, 9.0, 0.0, 17.0, 36.0, 0.0, 29.0, 0.0, 38.0, 44.0, 0.0, 62.0, 71.0, 0.0, 59.0, 0.0, 71.0, 66.0, 0.0, 76.0, 0.0, 75.0, 62.0, 0.0, 36.0, 0.0, 46.0, 48.0, 0.0, 31.0, 0.0, 30.0, 15.0, 0.0, 22.0, 11.0, 0.0, 7.0, 0.0, 6.0, 5.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.76957380771637e-07, -9.406358003616333e-07, -9.043142199516296e-07, -8.67992639541626e-07, -8.316710591316223e-07, -7.953494787216187e-07, -7.59027898311615e-07, -7.227063179016113e-07, -6.863847374916077e-07, -6.50063157081604e-07, -6.137415766716003e-07, -5.774199962615967e-07, -5.41098415851593e-07, -5.047768354415894e-07, -4.684552550315857e-07, -4.3213367462158203e-07, -3.9581209421157837e-07, -3.594905138015747e-07, -3.2316893339157104e-07, -2.868473529815674e-07, -2.505257725715637e-07, -2.1420419216156006e-07, -1.778826117515564e-07, -1.4156103134155273e-07, -1.0523945093154907e-07, -6.891787052154541e-08, -3.259629011154175e-08, 3.725290298461914e-09, 4.0046870708465576e-08, 7.636845111846924e-08, 1.126900315284729e-07, 1.4901161193847656e-07, 1.8533319234848022e-07, 2.2165477275848389e-07, 2.5797635316848755e-07, 2.942979335784912e-07, 3.3061951398849487e-07, 3.6694109439849854e-07, 4.032626748085022e-07, 4.3958425521850586e-07, 4.759058356285095e-07, 5.122274160385132e-07, 5.485489964485168e-07, 5.848705768585205e-07, 6.211921572685242e-07, 6.575137376785278e-07, 6.938353180885315e-07, 7.301568984985352e-07, 7.664784789085388e-07, 8.028000593185425e-07, 8.391216397285461e-07, 8.754432201385498e-07, 9.117648005485535e-07, 9.480863809585571e-07, 9.844079613685608e-07, 1.0207295417785645e-06, 1.0570511221885681e-06, 1.0933727025985718e-06, 1.1296942830085754e-06, 1.166015863418579e-06, 1.2023374438285828e-06, 1.2386590242385864e-06, 1.27498060464859e-06, 1.3113021850585938e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 12.0, 14.0, 22.0, 22.0, 40.0, 81.0, 72.0, 131.0, 182.0, 252.0, 361.0, 492.0, 724.0, 1106.0, 0.0, 1678.0, 2511.0, 3938.0, 6390.0, 10607.0, 18241.0, 34480.0, 71613.0, 178879.0, 384587.0, 178660.0, 72113.0, 34351.0, 18386.0, 10589.0, 6323.0, 3918.0, 2621.0, 1651.0, 1132.0, 0.0, 714.0, 483.0, 356.0, 255.0, 151.0, 120.0, 86.0, 62.0, 34.0, 37.0, 19.0, 10.0, 11.0, 14.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7313286662101746e-06, -1.6745179891586304e-06, -1.6177073121070862e-06, -1.560896635055542e-06, -1.5040859580039978e-06, -1.4472752809524536e-06, -1.3904646039009094e-06, -1.3336539268493652e-06, -1.276843249797821e-06, -1.2200325727462769e-06, -1.1632218956947327e-06, -1.1064112186431885e-06, -1.0496005415916443e-06, -9.927898645401e-07, -9.359791874885559e-07, -8.791685104370117e-07, -8.223578333854675e-07, -7.655471563339233e-07, -7.087364792823792e-07, -6.51925802230835e-07, -5.951151251792908e-07, -5.383044481277466e-07, -4.814937710762024e-07, -4.246830940246582e-07, -3.67872416973114e-07, -3.110617399215698e-07, -2.5425106287002563e-07, -1.9744038581848145e-07, -1.4062970876693726e-07, -8.381903171539307e-08, -2.7008354663848877e-08, 2.9802322387695312e-08, 8.66129994392395e-08, 1.434236764907837e-07, 2.0023435354232788e-07, 2.5704503059387207e-07, 3.1385570764541626e-07, 3.7066638469696045e-07, 4.2747706174850464e-07, 4.842877388000488e-07, 5.41098415851593e-07, 5.979090929031372e-07, 6.547197699546814e-07, 7.115304470062256e-07, 7.683411240577698e-07, 8.25151801109314e-07, 8.819624781608582e-07, 9.387731552124023e-07, 9.955838322639465e-07, 1.0523945093154907e-06, 1.109205186367035e-06, 1.166015863418579e-06, 1.2228265404701233e-06, 1.2796372175216675e-06, 1.3364478945732117e-06, 1.3932585716247559e-06, 1.4500692486763e-06, 1.5068799257278442e-06, 1.5636906027793884e-06, 1.6205012798309326e-06, 1.6773119568824768e-06, 1.734122633934021e-06, 1.7909333109855652e-06, 1.8477439880371094e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 5.0, 0.0, 9.0, 5.0, 9.0, 11.0, 13.0, 25.0, 26.0, 28.0, 28.0, 48.0, 58.0, 63.0, 65.0, 62.0, 75.0, 0.0, 54.0, 67.0, 48.0, 52.0, 48.0, 51.0, 18.0, 29.0, 14.0, 16.0, 18.0, 10.0, 8.0, 6.0, 6.0, 0.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6726553440093994e-06, -1.6167759895324707e-06, -1.560896635055542e-06, -1.5050172805786133e-06, -1.4491379261016846e-06, -1.3932585716247559e-06, -1.3373792171478271e-06, -1.2814998626708984e-06, -1.2256205081939697e-06, -1.169741153717041e-06, -1.1138617992401123e-06, -1.0579824447631836e-06, -1.0021030902862549e-06, -9.462237358093262e-07, -8.903443813323975e-07, -8.344650268554688e-07, -7.7858567237854e-07, -7.227063179016113e-07, -6.668269634246826e-07, -6.109476089477539e-07, -5.550682544708252e-07, -4.991888999938965e-07, -4.4330954551696777e-07, -3.8743019104003906e-07, -3.3155083656311035e-07, -2.7567148208618164e-07, -2.1979212760925293e-07, -1.6391277313232422e-07, -1.0803341865539551e-07, -5.21540641784668e-08, 3.725290298461914e-09, 5.960464477539063e-08, 1.1548399925231934e-07, 1.7136335372924805e-07, 2.2724270820617676e-07, 2.8312206268310547e-07, 3.390014171600342e-07, 3.948807716369629e-07, 4.507601261138916e-07, 5.066394805908203e-07, 5.62518835067749e-07, 6.183981895446777e-07, 6.742775440216064e-07, 7.301568984985352e-07, 7.860362529754639e-07, 8.419156074523926e-07, 8.977949619293213e-07, 9.5367431640625e-07, 1.0095536708831787e-06, 1.0654330253601074e-06, 1.1213123798370361e-06, 1.1771917343139648e-06, 1.2330710887908936e-06, 1.2889504432678223e-06, 1.344829797744751e-06, 1.4007091522216797e-06, 1.4565885066986084e-06, 1.5124678611755371e-06, 1.5683472156524658e-06, 1.6242265701293945e-06, 1.6801059246063232e-06, 1.735985279083252e-06, 1.7918646335601807e-06, 1.8477439880371094e-06]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 11.0, 7.0, 11.0, 10.0, 26.0, 55.0, 98.0, 230.0, 183.0, 94.0, 57.0, 47.0, 39.0, 38.0, 19.0, 18.0, 9.0, 12.0, 12.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001511340233264491, -0.00014345854287967086, -0.00013578306243289262, -0.00012810758198611438, -0.00012043210153933614, -0.00011275662109255791, -0.00010508114792173728, -9.740566747495905e-05, -8.973018702818081e-05, -8.205470658140257e-05, -7.437922613462433e-05, -6.670375296380371e-05, -5.9028268879046664e-05, -5.1352788432268426e-05, -4.3677311623468995e-05, -3.600183117669076e-05, -2.832635072991252e-05, -2.065087028313428e-05, -1.2975391655345447e-05, -5.299913027556613e-06, 2.3755674192216247e-06, 1.0051047865999863e-05, 1.7726524674799293e-05, 2.540200512157753e-05, 3.307748556835577e-05, 4.075296601513401e-05, 4.8428446461912245e-05, 5.6103923270711675e-05, 6.37794000795111e-05, 7.145488052628934e-05, 7.913036097306758e-05, 8.680584141984582e-05, 9.448133641853929e-05, 0.00010215681686531752, 0.00010983229731209576, 0.000117507777758874, 0.00012518325820565224, 0.00013285873865243047, 0.0001405342190992087, 0.00014820968499407172, 0.0001558851799927652, 0.00016356066043954343, 0.00017123614088632166, 0.0001789116213330999, 0.00018658710177987814, 0.00019426258222665638, 0.00020193806267343462, 0.00020961352856829762, 0.00021728900901507586, 0.0002249644894618541, 0.00023263996990863234, 0.00024031545035541058, 0.0002479909162502736, 0.00025566641124896705, 0.00026334187714383006, 0.00027101737214252353, 0.00027869283803738654, 0.00028636830393224955, 0.000294043798930943, 0.000301719264825806, 0.0003093947598244995, 0.0003170702257193625, 0.00032474572071805596, 0.000332421186612919, 0.00034009668161161244]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 13.0, 11.0, 10.0, 8.0, 11.0, 18.0, 23.0, 30.0, 34.0, 29.0, 22.0, 36.0, 38.0, 50.0, 39.0, 44.0, 47.0, 49.0, 46.0, 49.0, 43.0, 42.0, 47.0, 36.0, 32.0, 35.0, 29.0, 23.0, 21.0, 15.0, 12.0, 9.0, 4.0, 11.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00012433528900146484, -0.00012046750634908676, -0.00011659972369670868, -0.0001127319410443306, -0.00010886415839195251, -0.00010499637573957443, -0.00010112859308719635, -9.726081043481827e-05, -9.339302778244019e-05, -8.95252451300621e-05, -8.565746247768402e-05, -8.178967982530594e-05, -7.792189717292786e-05, -7.405411452054977e-05, -7.018633186817169e-05, -6.631854921579361e-05, -6.245076656341553e-05, -5.8582983911037445e-05, -5.471520125865936e-05, -5.084741860628128e-05, -4.69796359539032e-05, -4.3111853301525116e-05, -3.9244070649147034e-05, -3.537628799676895e-05, -3.150850534439087e-05, -2.7640722692012787e-05, -2.3772940039634705e-05, -1.9905157387256622e-05, -1.603737473487854e-05, -1.2169592082500458e-05, -8.301809430122375e-06, -4.434026777744293e-06, -5.662441253662109e-07, 3.3015385270118713e-06, 7.169321179389954e-06, 1.1037103831768036e-05, 1.4904886484146118e-05, 1.87726691365242e-05, 2.2640451788902283e-05, 2.6508234441280365e-05, 3.0376017093658447e-05, 3.424379974603653e-05, 3.811158239841461e-05, 4.1979365050792694e-05, 4.5847147703170776e-05, 4.971493035554886e-05, 5.358271300792694e-05, 5.745049566030502e-05, 6.13182783126831e-05, 6.518606096506119e-05, 6.905384361743927e-05, 7.292162626981735e-05, 7.678940892219543e-05, 8.065719157457352e-05, 8.45249742269516e-05, 8.839275687932968e-05, 9.226053953170776e-05, 9.612832218408585e-05, 9.999610483646393e-05, 0.00010386388748884201, 0.00010773167014122009, 0.00011159945279359818, 0.00011546723544597626, 0.00011933501809835434, 0.00012320280075073242]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 15.0, 21.0, 42.0, 61.0, 103.0, 188.0, 359.0, 670.0, 1213.0, 2188.0, 4440.0, 9612.0, 25735.0, 96387.0, 3929693.0, 83345.0, 23563.0, 8752.0, 3786.0, 1849.0, 908.0, 549.0, 243.0, 159.0, 109.0, 61.0, 36.0, 27.0, 25.0, 18.0, 17.0, 14.0, 10.0, 11.0, 12.0, 10.0, 9.0, 4.0, 8.0, 2.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.401538848876953e-05, -6.072781980037689e-05, -5.744025111198425e-05, -5.4152682423591614e-05, -5.0865113735198975e-05, -4.7577545046806335e-05, -4.4289976358413696e-05, -4.100240767002106e-05, -3.771483898162842e-05, -3.442727029323578e-05, -3.113970160484314e-05, -2.78521329164505e-05, -2.456456422805786e-05, -2.1276995539665222e-05, -1.7989426851272583e-05, -1.4701858162879944e-05, -1.1414289474487305e-05, -8.126720786094666e-06, -4.839152097702026e-06, -1.5515834093093872e-06, 1.735985279083252e-06, 5.023553967475891e-06, 8.31112265586853e-06, 1.159869134426117e-05, 1.4886260032653809e-05, 1.8173828721046448e-05, 2.1461397409439087e-05, 2.4748966097831726e-05, 2.8036534786224365e-05, 3.1324103474617004e-05, 3.4611672163009644e-05, 3.789924085140228e-05, 4.118680953979492e-05, 4.447437822818756e-05, 4.77619469165802e-05, 5.104951560497284e-05, 5.433708429336548e-05, 5.762465298175812e-05, 6.091222167015076e-05, 6.41997903585434e-05, 6.748735904693604e-05, 7.077492773532867e-05, 7.406249642372131e-05, 7.735006511211395e-05, 8.063763380050659e-05, 8.392520248889923e-05, 8.721277117729187e-05, 9.050033986568451e-05, 9.378790855407715e-05, 9.707547724246979e-05, 0.00010036304593086243, 0.00010365061461925507, 0.0001069381833076477, 0.00011022575199604034, 0.00011351332068443298, 0.00011680088937282562, 0.00012008845806121826, 0.0001233760267496109, 0.00012666359543800354, 0.00012995116412639618, 0.00013323873281478882, 0.00013652630150318146, 0.0001398138701915741, 0.00014310143887996674, 0.00014638900756835938]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 13.0, 14.0, 15.0, 17.0, 28.0, 54.0, 77.0, 104.0, 111.0, 131.0, 110.0, 108.0, 65.0, 39.0, 39.0, 27.0, 12.0, 8.0, 11.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3768672943115234e-05, -1.3024546205997467e-05, -1.22804194688797e-05, -1.1536292731761932e-05, -1.0792165994644165e-05, -1.0048039257526398e-05, -9.30391252040863e-06, -8.559785783290863e-06, -7.815659046173096e-06, -7.071532309055328e-06, -6.327405571937561e-06, -5.583278834819794e-06, -4.839152097702026e-06, -4.095025360584259e-06, -3.3508986234664917e-06, -2.6067718863487244e-06, -1.862645149230957e-06, -1.1185184121131897e-06, -3.7439167499542236e-07, 3.6973506212234497e-07, 1.1138617992401123e-06, 1.8579885363578796e-06, 2.602115273475647e-06, 3.3462420105934143e-06, 4.090368747711182e-06, 4.834495484828949e-06, 5.578622221946716e-06, 6.322748959064484e-06, 7.066875696182251e-06, 7.811002433300018e-06, 8.555129170417786e-06, 9.299255907535553e-06, 1.004338264465332e-05, 1.0787509381771088e-05, 1.1531636118888855e-05, 1.2275762856006622e-05, 1.301988959312439e-05, 1.3764016330242157e-05, 1.4508143067359924e-05, 1.5252269804477692e-05, 1.599639654159546e-05, 1.6740523278713226e-05, 1.7484650015830994e-05, 1.822877675294876e-05, 1.897290349006653e-05, 1.9717030227184296e-05, 2.0461156964302063e-05, 2.120528370141983e-05, 2.1949410438537598e-05, 2.2693537175655365e-05, 2.3437663912773132e-05, 2.41817906498909e-05, 2.4925917387008667e-05, 2.5670044124126434e-05, 2.64141708612442e-05, 2.715829759836197e-05, 2.7902424335479736e-05, 2.8646551072597504e-05, 2.939067780971527e-05, 3.013480454683304e-05, 3.0878931283950806e-05, 3.162305802106857e-05, 3.236718475818634e-05, 3.311131149530411e-05, 3.3855438232421875e-05]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 12.0, 7.0, 9.0, 22.0, 34.0, 41.0, 45.0, 92.0, 131.0, 214.0, 370.0, 612.0, 1119.0, 1903.0, 3478.0, 6873.0, 14540.0, 31957.0, 82488.0, 2564904.0, 1341796.0, 82843.0, 31454.0, 14632.0, 6750.0, 3442.0, 1856.0, 1056.0, 541.0, 387.0, 229.0, 154.0, 77.0, 61.0, 35.0, 28.0, 26.0, 13.0, 8.0, 9.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.936622619628906e-05, -5.761999636888504e-05, -5.587376654148102e-05, -5.4127536714076996e-05, -5.2381306886672974e-05, -5.063507705926895e-05, -4.888884723186493e-05, -4.714261740446091e-05, -4.5396387577056885e-05, -4.365015774965286e-05, -4.190392792224884e-05, -4.015769809484482e-05, -3.8411468267440796e-05, -3.6665238440036774e-05, -3.491900861263275e-05, -3.317277878522873e-05, -3.142654895782471e-05, -2.9680319130420685e-05, -2.7934089303016663e-05, -2.618785947561264e-05, -2.4441629648208618e-05, -2.2695399820804596e-05, -2.0949169993400574e-05, -1.920294016599655e-05, -1.745671033859253e-05, -1.5710480511188507e-05, -1.3964250683784485e-05, -1.2218020856380463e-05, -1.047179102897644e-05, -8.725561201572418e-06, -6.979331374168396e-06, -5.233101546764374e-06, -3.4868717193603516e-06, -1.7406418919563293e-06, 5.587935447692871e-09, 1.751817762851715e-06, 3.4980475902557373e-06, 5.2442774176597595e-06, 6.990507245063782e-06, 8.736737072467804e-06, 1.0482966899871826e-05, 1.2229196727275848e-05, 1.397542655467987e-05, 1.5721656382083893e-05, 1.7467886209487915e-05, 1.9214116036891937e-05, 2.096034586429596e-05, 2.270657569169998e-05, 2.4452805519104004e-05, 2.6199035346508026e-05, 2.794526517391205e-05, 2.969149500131607e-05, 3.143772482872009e-05, 3.3183954656124115e-05, 3.493018448352814e-05, 3.667641431093216e-05, 3.842264413833618e-05, 4.0168873965740204e-05, 4.1915103793144226e-05, 4.366133362054825e-05, 4.540756344795227e-05, 4.715379327535629e-05, 4.8900023102760315e-05, 5.064625293016434e-05, 5.239248275756836e-05]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 19.0, 10.0, 8.0, 17.0, 31.0, 23.0, 41.0, 44.0, 59.0, 115.0, 466.0, 2229.0, 580.0, 136.0, 70.0, 40.0, 36.0, 33.0, 26.0, 14.0, 15.0, 14.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658367156982422e-05, -2.540741115808487e-05, -2.423115074634552e-05, -2.305489033460617e-05, -2.187862992286682e-05, -2.0702369511127472e-05, -1.9526109099388123e-05, -1.8349848687648773e-05, -1.7173588275909424e-05, -1.5997327864170074e-05, -1.4821067452430725e-05, -1.3644807040691376e-05, -1.2468546628952026e-05, -1.1292286217212677e-05, -1.0116025805473328e-05, -8.939765393733978e-06, -7.763504981994629e-06, -6.5872445702552795e-06, -5.41098415851593e-06, -4.234723746776581e-06, -3.0584633350372314e-06, -1.882202923297882e-06, -7.059425115585327e-07, 4.7031790018081665e-07, 1.646578311920166e-06, 2.8228387236595154e-06, 3.999099135398865e-06, 5.175359547138214e-06, 6.3516199588775635e-06, 7.527880370616913e-06, 8.704140782356262e-06, 9.880401194095612e-06, 1.1056661605834961e-05, 1.223292201757431e-05, 1.340918242931366e-05, 1.4585442841053009e-05, 1.576170325279236e-05, 1.6937963664531708e-05, 1.8114224076271057e-05, 1.9290484488010406e-05, 2.0466744899749756e-05, 2.1643005311489105e-05, 2.2819265723228455e-05, 2.3995526134967804e-05, 2.5171786546707153e-05, 2.6348046958446503e-05, 2.7524307370185852e-05, 2.87005677819252e-05, 2.987682819366455e-05, 3.10530886054039e-05, 3.222934901714325e-05, 3.34056094288826e-05, 3.458186984062195e-05, 3.57581302523613e-05, 3.693439066410065e-05, 3.8110651075839996e-05, 3.9286911487579346e-05, 4.0463171899318695e-05, 4.1639432311058044e-05, 4.2815692722797394e-05, 4.399195313453674e-05, 4.516821354627609e-05, 4.634447395801544e-05, 4.752073436975479e-05, 4.869699478149414e-05]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 9.0, 5.0, 7.0, 8.0, 22.0, 30.0, 27.0, 44.0, 65.0, 105.0, 167.0, 171.0, 103.0, 81.0, 53.0, 33.0, 24.0, 18.0, 14.0, 10.0, 10.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018070924852509052, -0.00017403258243575692, -0.00016735591634642333, -0.00016067925025708973, -0.00015400258416775614, -0.00014732591807842255, -0.00014064923743717372, -0.00013397258589975536, -0.00012729590525850654, -0.00012061923916917294, -0.00011394257307983935, -0.00010726590699050575, -0.00010058924090117216, -9.391257481183857e-05, -8.723590144654736e-05, -8.055923535721377e-05, -7.388257654383779e-05, -6.720591045450419e-05, -6.05292443651706e-05, -5.38525746378582e-05, -4.71759085485246e-05, -4.049924245919101e-05, -3.382257273187861e-05, -2.7145906642545015e-05, -2.046924055321142e-05, -1.3792573554383125e-05, -7.1159065555548295e-06, -4.3923864723183215e-07, 6.237427442101762e-06, 1.2914093531435356e-05, 1.9590763258747756e-05, 2.626742934808135e-05, 3.2944080885499716e-05, 3.962074697483331e-05, 4.6297413064166903e-05, 5.2974082791479304e-05, 5.96507488808129e-05, 6.632741133216769e-05, 7.300408469745889e-05, 7.968075078679249e-05, 8.635741687612608e-05, 9.303408296545967e-05, 9.971074905479327e-05, 0.00010638742242008448, 0.00011306408850941807, 0.00011974075459875166, 0.00012641742068808526, 0.00013309408677741885, 0.00013977075286675245, 0.00014644741895608604, 0.00015312408504541963, 0.00015980075113475323, 0.00016647741722408682, 0.00017315408331342041, 0.00017983076395466924, 0.0001865074154920876, 0.00019318409613333642, 0.00019986076222267002, 0.0002065374283120036, 0.0002132140944013372, 0.0002198907604906708, 0.0002265674265800044, 0.000233244092669338, 0.0002399207733105868, 0.0002465974248480052]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 3.0, 11.0, 6.0, 10.0, 13.0, 18.0, 14.0, 27.0, 24.0, 26.0, 26.0, 29.0, 36.0, 41.0, 41.0, 36.0, 37.0, 42.0, 41.0, 40.0, 55.0, 50.0, 33.0, 31.0, 22.0, 42.0, 31.0, 36.0, 26.0, 20.0, 27.0, 13.0, 15.0, 10.0, 20.0, 8.0, 9.0, 4.0, 7.0, 6.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.589029312133789e-05, -8.345581591129303e-05, -8.102133870124817e-05, -7.858686149120331e-05, -7.615238428115845e-05, -7.371790707111359e-05, -7.128342986106873e-05, -6.884895265102386e-05, -6.6414475440979e-05, -6.397999823093414e-05, -6.154552102088928e-05, -5.911104381084442e-05, -5.667656660079956e-05, -5.42420893907547e-05, -5.180761218070984e-05, -4.937313497066498e-05, -4.693865776062012e-05, -4.4504180550575256e-05, -4.2069703340530396e-05, -3.9635226130485535e-05, -3.7200748920440674e-05, -3.476627171039581e-05, -3.233179450035095e-05, -2.989731729030609e-05, -2.746284008026123e-05, -2.502836287021637e-05, -2.259388566017151e-05, -2.0159408450126648e-05, -1.7724931240081787e-05, -1.5290454030036926e-05, -1.2855976819992065e-05, -1.0421499609947205e-05, -7.987022399902344e-06, -5.552545189857483e-06, -3.118067979812622e-06, -6.835907697677612e-07, 1.7508864402770996e-06, 4.1853636503219604e-06, 6.619840860366821e-06, 9.054318070411682e-06, 1.1488795280456543e-05, 1.3923272490501404e-05, 1.6357749700546265e-05, 1.8792226910591125e-05, 2.1226704120635986e-05, 2.3661181330680847e-05, 2.6095658540725708e-05, 2.853013575077057e-05, 3.096461296081543e-05, 3.339909017086029e-05, 3.583356738090515e-05, 3.826804459095001e-05, 4.070252180099487e-05, 4.3136999011039734e-05, 4.5571476221084595e-05, 4.8005953431129456e-05, 5.0440430641174316e-05, 5.287490785121918e-05, 5.530938506126404e-05, 5.77438622713089e-05, 6.017833948135376e-05, 6.261281669139862e-05, 6.504729390144348e-05, 6.748177111148834e-05, 6.99162483215332e-05]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 11.0, 28.0, 22.0, 31.0, 41.0, 39.0, 86.0, 147.0, 176.0, 294.0, 404.0, 674.0, 1056.0, 1796.0, 3071.0, 5835.0, 11647.0, 26738.0, 71258.0, 265287.0, 495042.0, 99120.0, 34787.0, 14546.0, 7032.0, 3683.0, 2135.0, 1264.0, 786.0, 450.0, 357.0, 221.0, 154.0, 85.0, 74.0, 44.0, 40.0, 20.0, 24.0, 13.0, 5.0, 8.0, 5.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.380413055419922e-05, -8.135009557008743e-05, -7.889606058597565e-05, -7.644202560186386e-05, -7.398799061775208e-05, -7.153395563364029e-05, -6.90799206495285e-05, -6.662588566541672e-05, -6.417185068130493e-05, -6.171781569719315e-05, -5.926378071308136e-05, -5.6809745728969574e-05, -5.435571074485779e-05, -5.1901675760746e-05, -4.9447640776634216e-05, -4.699360579252243e-05, -4.4539570808410645e-05, -4.208553582429886e-05, -3.963150084018707e-05, -3.717746585607529e-05, -3.47234308719635e-05, -3.2269395887851715e-05, -2.981536090373993e-05, -2.7361325919628143e-05, -2.4907290935516357e-05, -2.245325595140457e-05, -1.9999220967292786e-05, -1.7545185983181e-05, -1.5091150999069214e-05, -1.2637116014957428e-05, -1.0183081030845642e-05, -7.729046046733856e-06, -5.27501106262207e-06, -2.8209760785102844e-06, -3.6694109439849854e-07, 2.0870938897132874e-06, 4.541128873825073e-06, 6.995163857936859e-06, 9.449198842048645e-06, 1.1903233826160431e-05, 1.4357268810272217e-05, 1.6811303794384003e-05, 1.926533877849579e-05, 2.1719373762607574e-05, 2.417340874671936e-05, 2.6627443730831146e-05, 2.9081478714942932e-05, 3.153551369905472e-05, 3.3989548683166504e-05, 3.644358366727829e-05, 3.8897618651390076e-05, 4.135165363550186e-05, 4.380568861961365e-05, 4.625972360372543e-05, 4.871375858783722e-05, 5.1167793571949005e-05, 5.362182855606079e-05, 5.607586354017258e-05, 5.852989852428436e-05, 6.098393350839615e-05, 6.343796849250793e-05, 6.589200347661972e-05, 6.83460384607315e-05, 7.080007344484329e-05, 7.325410842895508e-05]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 9.0, 9.0, 6.0, 21.0, 20.0, 27.0, 41.0, 59.0, 57.0, 81.0, 115.0, 77.0, 80.0, 80.0, 54.0, 56.0, 55.0, 42.0, 23.0, 22.0, 14.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.52587890625e-05, -1.4711171388626099e-05, -1.4163553714752197e-05, -1.3615936040878296e-05, -1.3068318367004395e-05, -1.2520700693130493e-05, -1.1973083019256592e-05, -1.142546534538269e-05, -1.0877847671508789e-05, -1.0330229997634888e-05, -9.782612323760986e-06, -9.234994649887085e-06, -8.687376976013184e-06, -8.139759302139282e-06, -7.592141628265381e-06, -7.0445239543914795e-06, -6.496906280517578e-06, -5.949288606643677e-06, -5.401670932769775e-06, -4.854053258895874e-06, -4.306435585021973e-06, -3.7588179111480713e-06, -3.21120023727417e-06, -2.6635825634002686e-06, -2.115964889526367e-06, -1.5683472156524658e-06, -1.0207295417785645e-06, -4.731118679046631e-07, 7.450580596923828e-08, 6.221234798431396e-07, 1.169741153717041e-06, 1.7173588275909424e-06, 2.2649765014648438e-06, 2.812594175338745e-06, 3.3602118492126465e-06, 3.907829523086548e-06, 4.455447196960449e-06, 5.003064870834351e-06, 5.550682544708252e-06, 6.098300218582153e-06, 6.645917892456055e-06, 7.193535566329956e-06, 7.741153240203857e-06, 8.288770914077759e-06, 8.83638858795166e-06, 9.384006261825562e-06, 9.931623935699463e-06, 1.0479241609573364e-05, 1.1026859283447266e-05, 1.1574476957321167e-05, 1.2122094631195068e-05, 1.266971230506897e-05, 1.3217329978942871e-05, 1.3764947652816772e-05, 1.4312565326690674e-05, 1.4860183000564575e-05, 1.5407800674438477e-05, 1.5955418348312378e-05, 1.650303602218628e-05, 1.705065369606018e-05, 1.7598271369934082e-05, 1.8145889043807983e-05, 1.8693506717681885e-05, 1.9241124391555786e-05, 1.9788742065429688e-05]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 7.0, 15.0, 29.0, 39.0, 36.0, 67.0, 108.0, 156.0, 232.0, 321.0, 584.0, 803.0, 1388.0, 1960.0, 3169.0, 5414.0, 8288.0, 14558.0, 23367.0, 42508.0, 74795.0, 155816.0, 394574.0, 148309.0, 74979.0, 38099.0, 23728.0, 13205.0, 8480.0, 4860.0, 3027.0, 2039.0, 1197.0, 856.0, 505.0, 325.0, 246.0, 144.0, 101.0, 62.0, 58.0, 30.0, 24.0, 14.0, 5.0, 10.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.3736228942871094e-05, -3.269687294960022e-05, -3.1657516956329346e-05, -3.061816096305847e-05, -2.9578804969787598e-05, -2.8539448976516724e-05, -2.750009298324585e-05, -2.6460736989974976e-05, -2.54213809967041e-05, -2.4382025003433228e-05, -2.3342669010162354e-05, -2.230331301689148e-05, -2.1263957023620605e-05, -2.022460103034973e-05, -1.9185245037078857e-05, -1.8145889043807983e-05, -1.710653305053711e-05, -1.6067177057266235e-05, -1.5027821063995361e-05, -1.3988465070724487e-05, -1.2949109077453613e-05, -1.190975308418274e-05, -1.0870397090911865e-05, -9.831041097640991e-06, -8.791685104370117e-06, -7.752329111099243e-06, -6.712973117828369e-06, -5.673617124557495e-06, -4.634261131286621e-06, -3.594905138015747e-06, -2.555549144744873e-06, -1.516193151473999e-06, -4.76837158203125e-07, 5.62518835067749e-07, 1.601874828338623e-06, 2.641230821609497e-06, 3.680586814880371e-06, 4.719942808151245e-06, 5.759298801422119e-06, 6.798654794692993e-06, 7.838010787963867e-06, 8.877366781234741e-06, 9.916722774505615e-06, 1.095607876777649e-05, 1.1995434761047363e-05, 1.3034790754318237e-05, 1.4074146747589111e-05, 1.5113502740859985e-05, 1.615285873413086e-05, 1.7192214727401733e-05, 1.8231570720672607e-05, 1.927092671394348e-05, 2.0310282707214355e-05, 2.134963870048523e-05, 2.2388994693756104e-05, 2.3428350687026978e-05, 2.446770668029785e-05, 2.5507062673568726e-05, 2.65464186668396e-05, 2.7585774660110474e-05, 2.8625130653381348e-05, 2.966448664665222e-05, 3.0703842639923096e-05, 3.174319863319397e-05, 3.2782554626464844e-05]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 6.0, 5.0, 8.0, 12.0, 20.0, 16.0, 17.0, 25.0, 21.0, 22.0, 28.0, 43.0, 34.0, 40.0, 48.0, 51.0, 42.0, 56.0, 56.0, 37.0, 49.0, 48.0, 45.0, 35.0, 38.0, 32.0, 30.0, 24.0, 14.0, 26.0, 17.0, 14.0, 11.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0219554901123047e-05, -2.9212795197963715e-05, -2.8206035494804382e-05, -2.719927579164505e-05, -2.6192516088485718e-05, -2.5185756385326385e-05, -2.4178996682167053e-05, -2.317223697900772e-05, -2.216547727584839e-05, -2.1158717572689056e-05, -2.0151957869529724e-05, -1.9145198166370392e-05, -1.813843846321106e-05, -1.7131678760051727e-05, -1.6124919056892395e-05, -1.5118159353733063e-05, -1.411139965057373e-05, -1.3104639947414398e-05, -1.2097880244255066e-05, -1.1091120541095734e-05, -1.0084360837936401e-05, -9.077601134777069e-06, -8.070841431617737e-06, -7.0640817284584045e-06, -6.057322025299072e-06, -5.05056232213974e-06, -4.043802618980408e-06, -3.0370429158210754e-06, -2.030283212661743e-06, -1.0235235095024109e-06, -1.6763806343078613e-08, 9.899958968162537e-07, 1.996755599975586e-06, 3.0035153031349182e-06, 4.0102750062942505e-06, 5.017034709453583e-06, 6.023794412612915e-06, 7.030554115772247e-06, 8.03731381893158e-06, 9.044073522090912e-06, 1.0050833225250244e-05, 1.1057592928409576e-05, 1.2064352631568909e-05, 1.3071112334728241e-05, 1.4077872037887573e-05, 1.5084631741046906e-05, 1.6091391444206238e-05, 1.709815114736557e-05, 1.8104910850524902e-05, 1.9111670553684235e-05, 2.0118430256843567e-05, 2.11251899600029e-05, 2.213194966316223e-05, 2.3138709366321564e-05, 2.4145469069480896e-05, 2.5152228772640228e-05, 2.615898847579956e-05, 2.7165748178958893e-05, 2.8172507882118225e-05, 2.9179267585277557e-05, 3.018602728843689e-05, 3.119278699159622e-05, 3.2199546694755554e-05, 3.3206306397914886e-05, 3.421306610107422e-05]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 9.0, 12.0, 0.0, 27.0, 23.0, 42.0, 46.0, 0.0, 71.0, 100.0, 168.0, 240.0, 0.0, 367.0, 609.0, 992.0, 1614.0, 2702.0, 0.0, 4459.0, 7569.0, 13153.0, 23333.0, 0.0, 41933.0, 80660.0, 176508.0, 339235.0, 0.0, 176501.0, 80870.0, 41889.0, 23031.0, 13046.0, 0.0, 7806.0, 4504.0, 2690.0, 1711.0, 0.0, 976.0, 623.0, 357.0, 230.0, 0.0, 153.0, 98.0, 65.0, 43.0, 33.0, 0.0, 22.0, 15.0, 10.0, 8.0, 0.0, 6.0, 3.0, 5.0, 2.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4416873455047607e-06, -1.3932585716247559e-06, -1.344829797744751e-06, -1.296401023864746e-06, -1.2479722499847412e-06, -1.1995434761047363e-06, -1.1511147022247314e-06, -1.1026859283447266e-06, -1.0542571544647217e-06, -1.0058283805847168e-06, -9.57399606704712e-07, -9.08970832824707e-07, -8.605420589447021e-07, -8.121132850646973e-07, -7.636845111846924e-07, -7.152557373046875e-07, -6.668269634246826e-07, -6.183981895446777e-07, -5.699694156646729e-07, -5.21540641784668e-07, -4.731118679046631e-07, -4.246830940246582e-07, -3.762543201446533e-07, -3.2782554626464844e-07, -2.7939677238464355e-07, -2.3096799850463867e-07, -1.825392246246338e-07, -1.341104507446289e-07, -8.568167686462402e-08, -3.725290298461914e-08, 1.1175870895385742e-08, 5.960464477539063e-08, 1.0803341865539551e-07, 1.564621925354004e-07, 2.0489096641540527e-07, 2.5331974029541016e-07, 3.0174851417541504e-07, 3.501772880554199e-07, 3.986060619354248e-07, 4.470348358154297e-07, 4.954636096954346e-07, 5.438923835754395e-07, 5.923211574554443e-07, 6.407499313354492e-07, 6.891787052154541e-07, 7.37607479095459e-07, 7.860362529754639e-07, 8.344650268554688e-07, 8.828938007354736e-07, 9.313225746154785e-07, 9.797513484954834e-07, 1.0281801223754883e-06, 1.0766088962554932e-06, 1.125037670135498e-06, 1.173466444015503e-06, 1.2218952178955078e-06, 1.2703239917755127e-06, 1.3187527656555176e-06, 1.3671815395355225e-06, 1.4156103134155273e-06, 1.4640390872955322e-06, 1.5124678611755371e-06, 1.560896635055542e-06, 1.6093254089355469e-06]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 0.0, 13.0, 10.0, 26.0, 26.0, 0.0, 20.0, 24.0, 33.0, 38.0, 0.0, 59.0, 60.0, 71.0, 70.0, 0.0, 77.0, 86.0, 58.0, 46.0, 0.0, 48.0, 45.0, 35.0, 33.0, 0.0, 36.0, 19.0, 16.0, 15.0, 0.0, 11.0, 10.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.621432602405548e-06, -1.5739351511001587e-06, -1.5264376997947693e-06, -1.4789402484893799e-06, -1.4314427971839905e-06, -1.383945345878601e-06, -1.3364478945732117e-06, -1.2889504432678223e-06, -1.2414529919624329e-06, -1.1939555406570435e-06, -1.146458089351654e-06, -1.0989606380462646e-06, -1.0514631867408752e-06, -1.0039657354354858e-06, -9.564682841300964e-07, -9.08970832824707e-07, -8.614733815193176e-07, -8.139759302139282e-07, -7.664784789085388e-07, -7.189810276031494e-07, -6.7148357629776e-07, -6.239861249923706e-07, -5.764886736869812e-07, -5.289912223815918e-07, -4.814937710762024e-07, -4.33996319770813e-07, -3.864988684654236e-07, -3.390014171600342e-07, -2.915039658546448e-07, -2.4400651454925537e-07, -1.9650906324386597e-07, -1.4901161193847656e-07, -1.0151416063308716e-07, -5.4016709327697754e-08, -6.51925802230835e-09, 4.0978193283081055e-08, 8.847564458847046e-08, 1.3597309589385986e-07, 1.8347054719924927e-07, 2.3096799850463867e-07, 2.784654498100281e-07, 3.259629011154175e-07, 3.734603524208069e-07, 4.209578037261963e-07, 4.684552550315857e-07, 5.159527063369751e-07, 5.634501576423645e-07, 6.109476089477539e-07, 6.584450602531433e-07, 7.059425115585327e-07, 7.534399628639221e-07, 8.009374141693115e-07, 8.484348654747009e-07, 8.959323167800903e-07, 9.434297680854797e-07, 9.909272193908691e-07, 1.0384246706962585e-06, 1.085922122001648e-06, 1.1334195733070374e-06, 1.1809170246124268e-06, 1.2284144759178162e-06, 1.2759119272232056e-06, 1.323409378528595e-06, 1.3709068298339844e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 0.0, 10.0, 0.0, 24.0, 51.0, 0.0, 87.0, 144.0, 0.0, 316.0, 568.0, 0.0, 1033.0, 2090.0, 0.0, 4155.0, 0.0, 9045.0, 20919.0, 0.0, 55440.0, 183161.0, 0.0, 494318.0, 183120.0, 0.0, 55619.0, 0.0, 20925.0, 8964.0, 0.0, 4287.0, 2019.0, 0.0, 1065.0, 567.0, 0.0, 296.0, 146.0, 0.0, 85.0, 0.0, 51.0, 21.0, 0.0, 14.0, 9.0, 0.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.3113021850585938e-06, -1.2731179594993591e-06, -1.2349337339401245e-06, -1.1967495083808899e-06, -1.1585652828216553e-06, -1.1203810572624207e-06, -1.082196831703186e-06, -1.0440126061439514e-06, -1.0058283805847168e-06, -9.676441550254822e-07, -9.294599294662476e-07, -8.912757039070129e-07, -8.530914783477783e-07, -8.149072527885437e-07, -7.767230272293091e-07, -7.385388016700745e-07, -7.003545761108398e-07, -6.621703505516052e-07, -6.239861249923706e-07, -5.85801899433136e-07, -5.476176738739014e-07, -5.094334483146667e-07, -4.7124922275543213e-07, -4.330649971961975e-07, -3.948807716369629e-07, -3.5669654607772827e-07, -3.1851232051849365e-07, -2.8032809495925903e-07, -2.421438694000244e-07, -2.039596438407898e-07, -1.6577541828155518e-07, -1.2759119272232056e-07, -8.940696716308594e-08, -5.122274160385132e-08, -1.30385160446167e-08, 2.514570951461792e-08, 6.332993507385254e-08, 1.0151416063308716e-07, 1.3969838619232178e-07, 1.778826117515564e-07, 2.1606683731079102e-07, 2.5425106287002563e-07, 2.9243528842926025e-07, 3.3061951398849487e-07, 3.688037395477295e-07, 4.069879651069641e-07, 4.4517219066619873e-07, 4.833564162254333e-07, 5.21540641784668e-07, 5.597248673439026e-07, 5.979090929031372e-07, 6.360933184623718e-07, 6.742775440216064e-07, 7.124617695808411e-07, 7.506459951400757e-07, 7.888302206993103e-07, 8.270144462585449e-07, 8.651986718177795e-07, 9.033828973770142e-07, 9.415671229362488e-07, 9.797513484954834e-07, 1.017935574054718e-06, 1.0561197996139526e-06, 1.0943040251731873e-06, 1.1324882507324219e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 8.0, 0.0, 6.0, 0.0, 8.0, 0.0, 19.0, 0.0, 21.0, 0.0, 30.0, 0.0, 43.0, 0.0, 52.0, 0.0, 76.0, 0.0, 98.0, 0.0, 103.0, 0.0, 88.0, 0.0, 114.0, 0.0, 83.0, 0.0, 75.0, 0.0, 56.0, 0.0, 40.0, 0.0, 23.0, 0.0, 26.0, 0.0, 14.0, 0.0, 7.0, 0.0, 7.0, 0.0, 5.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 6.0, 14.0, 14.0, 21.0, 21.0, 33.0, 40.0, 51.0, 78.0, 172.0, 125.0, 92.0, 65.0, 52.0, 34.0, 28.0, 26.0, 16.0, 20.0, 17.0, 13.0, 13.0, 8.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001048088088282384, -0.00010088112321682274, -9.69534448813647e-05, -9.302575926994905e-05, -8.90980736585334e-05, -8.517039532307535e-05, -8.12427097116597e-05, -7.731502410024405e-05, -7.3387345764786e-05, -6.945966015337035e-05, -6.553198181791231e-05, -6.160429620649666e-05, -5.7676610595081e-05, -5.3748928621644154e-05, -4.982124664820731e-05, -4.589356103679165e-05, -4.1965875425376e-05, -3.803819345193915e-05, -3.4110507840523496e-05, -3.018282586708665e-05, -2.6255142074660398e-05, -2.2327458282234147e-05, -1.83997763087973e-05, -1.4472092516371049e-05, -1.0544408723944798e-05, -6.616725386265898e-06, -2.689042048586998e-06, 1.238640834344551e-06, 5.166324626770802e-06, 9.094008419197053e-06, 1.30216903926339e-05, 1.694937418506015e-05, 2.0877050701528788e-05, 2.480473449395504e-05, 2.873241828638129e-05, 3.266010025981814e-05, 3.658778587123379e-05, 4.051546784467064e-05, 4.4443149818107486e-05, 4.837083542952314e-05, 5.229851740295999e-05, 5.6226199376396835e-05, 6.015388498781249e-05, 6.408157059922814e-05, 6.800924893468618e-05, 7.193693454610184e-05, 7.586462015751749e-05, 7.979229849297553e-05, 8.371998410439119e-05, 8.764766971580684e-05, 9.157534805126488e-05, 9.550303366268054e-05, 9.943071927409619e-05, 0.00010335839760955423, 0.00010728608322096989, 0.00011121376883238554, 0.00011514144716784358, 0.00011906913277925923, 0.0001229968183906749, 0.00012692449672613293, 0.00013085217506159097, 0.00013477986794896424, 0.00013870754628442228, 0.00014263522461988032, 0.0001465629175072536]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 9.0, 11.0, 13.0, 9.0, 16.0, 13.0, 19.0, 15.0, 23.0, 28.0, 22.0, 39.0, 31.0, 48.0, 33.0, 33.0, 35.0, 54.0, 42.0, 42.0, 25.0, 45.0, 55.0, 26.0, 31.0, 32.0, 38.0, 27.0, 35.0, 27.0, 17.0, 20.0, 17.0, 16.0, 13.0, 9.0, 12.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.107589721679688e-05, -8.833874017000198e-05, -8.560158312320709e-05, -8.28644260764122e-05, -8.012726902961731e-05, -7.739011198282242e-05, -7.465295493602753e-05, -7.191579788923264e-05, -6.917864084243774e-05, -6.644148379564285e-05, -6.370432674884796e-05, -6.096716970205307e-05, -5.823001265525818e-05, -5.549285560846329e-05, -5.2755698561668396e-05, -5.0018541514873505e-05, -4.728138446807861e-05, -4.454422742128372e-05, -4.180707037448883e-05, -3.906991332769394e-05, -3.633275628089905e-05, -3.3595599234104156e-05, -3.0858442187309265e-05, -2.8121285140514374e-05, -2.5384128093719482e-05, -2.264697104692459e-05, -1.99098140001297e-05, -1.717265695333481e-05, -1.4435499906539917e-05, -1.1698342859745026e-05, -8.961185812950134e-06, -6.224028766155243e-06, -3.4868717193603516e-06, -7.497146725654602e-07, 1.987442374229431e-06, 4.7245994210243225e-06, 7.461756467819214e-06, 1.0198913514614105e-05, 1.2936070561408997e-05, 1.5673227608203888e-05, 1.841038465499878e-05, 2.114754170179367e-05, 2.3884698748588562e-05, 2.6621855795383453e-05, 2.9359012842178345e-05, 3.2096169888973236e-05, 3.483332693576813e-05, 3.757048398256302e-05, 4.030764102935791e-05, 4.30447980761528e-05, 4.578195512294769e-05, 4.8519112169742584e-05, 5.1256269216537476e-05, 5.399342626333237e-05, 5.673058331012726e-05, 5.946774035692215e-05, 6.220489740371704e-05, 6.494205445051193e-05, 6.767921149730682e-05, 7.041636854410172e-05, 7.31535255908966e-05, 7.58906826376915e-05, 7.862783968448639e-05, 8.136499673128128e-05, 8.410215377807617e-05]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 15.0, 19.0, 22.0, 38.0, 60.0, 107.0, 182.0, 291.0, 482.0, 832.0, 1636.0, 3272.0, 7338.0, 20187.0, 101057.0, 3955948.0, 69458.0, 18535.0, 7239.0, 3218.0, 1672.0, 983.0, 571.0, 315.0, 212.0, 180.0, 98.0, 58.0, 53.0, 40.0, 38.0, 33.0, 14.0, 13.0, 10.0, 8.0, 16.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.43865966796875e-05, -7.091276347637177e-05, -6.743893027305603e-05, -6.39650970697403e-05, -6.049126386642456e-05, -5.7017430663108826e-05, -5.354359745979309e-05, -5.0069764256477356e-05, -4.659593105316162e-05, -4.3122097849845886e-05, -3.964826464653015e-05, -3.6174431443214417e-05, -3.270059823989868e-05, -2.9226765036582947e-05, -2.5752931833267212e-05, -2.2279098629951477e-05, -1.8805265426635742e-05, -1.5331432223320007e-05, -1.1857599020004272e-05, -8.383765816688538e-06, -4.909932613372803e-06, -1.4360994100570679e-06, 2.037733793258667e-06, 5.511566996574402e-06, 8.985400199890137e-06, 1.2459233403205872e-05, 1.5933066606521606e-05, 1.940689980983734e-05, 2.2880733013153076e-05, 2.635456621646881e-05, 2.9828399419784546e-05, 3.330223262310028e-05, 3.6776065826416016e-05, 4.024989902973175e-05, 4.3723732233047485e-05, 4.719756543636322e-05, 5.0671398639678955e-05, 5.414523184299469e-05, 5.7619065046310425e-05, 6.109289824962616e-05, 6.45667314529419e-05, 6.804056465625763e-05, 7.151439785957336e-05, 7.49882310628891e-05, 7.846206426620483e-05, 8.193589746952057e-05, 8.54097306728363e-05, 8.888356387615204e-05, 9.235739707946777e-05, 9.583123028278351e-05, 9.930506348609924e-05, 0.00010277889668941498, 0.00010625272989273071, 0.00010972656309604645, 0.00011320039629936218, 0.00011667422950267792, 0.00012014806270599365, 0.0001236218959093094, 0.00012709572911262512, 0.00013056956231594086, 0.0001340433955192566, 0.00013751722872257233, 0.00014099106192588806, 0.0001444648951292038, 0.00014793872833251953]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 12.0, 16.0, 21.0, 29.0, 48.0, 67.0, 81.0, 107.0, 98.0, 114.0, 91.0, 75.0, 58.0, 48.0, 31.0, 23.0, 16.0, 7.0, 6.0, 10.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341104507446289e-05, -1.2765638530254364e-05, -1.2120231986045837e-05, -1.147482544183731e-05, -1.0829418897628784e-05, -1.0184012353420258e-05, -9.538605809211731e-06, -8.893199265003204e-06, -8.247792720794678e-06, -7.602386176586151e-06, -6.9569796323776245e-06, -6.311573088169098e-06, -5.666166543960571e-06, -5.020759999752045e-06, -4.375353455543518e-06, -3.7299469113349915e-06, -3.084540367126465e-06, -2.4391338229179382e-06, -1.7937272787094116e-06, -1.148320734500885e-06, -5.029141902923584e-07, 1.424923539161682e-07, 7.878988981246948e-07, 1.4333054423332214e-06, 2.078711986541748e-06, 2.7241185307502747e-06, 3.3695250749588013e-06, 4.014931619167328e-06, 4.6603381633758545e-06, 5.305744707584381e-06, 5.951151251792908e-06, 6.596557796001434e-06, 7.241964340209961e-06, 7.887370884418488e-06, 8.532777428627014e-06, 9.17818397283554e-06, 9.823590517044067e-06, 1.0468997061252594e-05, 1.111440360546112e-05, 1.1759810149669647e-05, 1.2405216693878174e-05, 1.30506232380867e-05, 1.3696029782295227e-05, 1.4341436326503754e-05, 1.498684287071228e-05, 1.5632249414920807e-05, 1.6277655959129333e-05, 1.692306250333786e-05, 1.7568469047546387e-05, 1.8213875591754913e-05, 1.885928213596344e-05, 1.9504688680171967e-05, 2.0150095224380493e-05, 2.079550176858902e-05, 2.1440908312797546e-05, 2.2086314857006073e-05, 2.27317214012146e-05, 2.3377127945423126e-05, 2.4022534489631653e-05, 2.466794103384018e-05, 2.5313347578048706e-05, 2.5958754122257233e-05, 2.660416066646576e-05, 2.7249567210674286e-05, 2.7894973754882812e-05]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 20.0, 27.0, 29.0, 44.0, 101.0, 160.0, 208.0, 403.0, 750.0, 1339.0, 2540.0, 5035.0, 11145.0, 24910.0, 73774.0, 1431881.0, 2516336.0, 76063.0, 27016.0, 11466.0, 5148.0, 2695.0, 1371.0, 768.0, 419.0, 230.0, 153.0, 84.0, 52.0, 42.0, 16.0, 13.0, 8.0, 4.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.414817810058594e-05, -7.219798862934113e-05, -7.024779915809631e-05, -6.82976096868515e-05, -6.634742021560669e-05, -6.439723074436188e-05, -6.244704127311707e-05, -6.0496851801872253e-05, -5.854666233062744e-05, -5.659647285938263e-05, -5.464628338813782e-05, -5.2696093916893005e-05, -5.074590444564819e-05, -4.879571497440338e-05, -4.684552550315857e-05, -4.489533603191376e-05, -4.2945146560668945e-05, -4.099495708942413e-05, -3.904476761817932e-05, -3.709457814693451e-05, -3.51443886756897e-05, -3.3194199204444885e-05, -3.124400973320007e-05, -2.929382026195526e-05, -2.734363079071045e-05, -2.5393441319465637e-05, -2.3443251848220825e-05, -2.1493062376976013e-05, -1.95428729057312e-05, -1.759268343448639e-05, -1.5642493963241577e-05, -1.3692304491996765e-05, -1.1742115020751953e-05, -9.791925549507141e-06, -7.841736078262329e-06, -5.891546607017517e-06, -3.941357135772705e-06, -1.991167664527893e-06, -4.0978193283081055e-08, 1.909211277961731e-06, 3.859400749206543e-06, 5.809590220451355e-06, 7.759779691696167e-06, 9.709969162940979e-06, 1.1660158634185791e-05, 1.3610348105430603e-05, 1.5560537576675415e-05, 1.7510727047920227e-05, 1.946091651916504e-05, 2.141110599040985e-05, 2.3361295461654663e-05, 2.5311484932899475e-05, 2.7261674404144287e-05, 2.92118638753891e-05, 3.116205334663391e-05, 3.311224281787872e-05, 3.5062432289123535e-05, 3.701262176036835e-05, 3.896281123161316e-05, 4.091300070285797e-05, 4.286319017410278e-05, 4.4813379645347595e-05, 4.676356911659241e-05, 4.871375858783722e-05, 5.066394805908203e-05]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 5.0, 9.0, 9.0, 18.0, 12.0, 24.0, 32.0, 26.0, 47.0, 64.0, 188.0, 630.0, 2065.0, 494.0, 144.0, 74.0, 35.0, 39.0, 33.0, 24.0, 15.0, 16.0, 4.0, 9.0, 7.0, 7.0, 9.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.380941390991211e-05, -4.267040640115738e-05, -4.153139889240265e-05, -4.039239138364792e-05, -3.925338387489319e-05, -3.811437636613846e-05, -3.697536885738373e-05, -3.5836361348629e-05, -3.469735383987427e-05, -3.355834633111954e-05, -3.241933882236481e-05, -3.128033131361008e-05, -3.0141323804855347e-05, -2.9002316296100616e-05, -2.7863308787345886e-05, -2.6724301278591156e-05, -2.5585293769836426e-05, -2.4446286261081696e-05, -2.3307278752326965e-05, -2.2168271243572235e-05, -2.1029263734817505e-05, -1.9890256226062775e-05, -1.8751248717308044e-05, -1.7612241208553314e-05, -1.6473233699798584e-05, -1.5334226191043854e-05, -1.4195218682289124e-05, -1.3056211173534393e-05, -1.1917203664779663e-05, -1.0778196156024933e-05, -9.639188647270203e-06, -8.500181138515472e-06, -7.361173629760742e-06, -6.222166121006012e-06, -5.083158612251282e-06, -3.9441511034965515e-06, -2.8051435947418213e-06, -1.666136085987091e-06, -5.271285772323608e-07, 6.118789315223694e-07, 1.7508864402770996e-06, 2.88989394903183e-06, 4.02890145778656e-06, 5.16790896654129e-06, 6.3069164752960205e-06, 7.445923984050751e-06, 8.584931492805481e-06, 9.723939001560211e-06, 1.0862946510314941e-05, 1.2001954019069672e-05, 1.3140961527824402e-05, 1.4279969036579132e-05, 1.5418976545333862e-05, 1.6557984054088593e-05, 1.7696991562843323e-05, 1.8835999071598053e-05, 1.9975006580352783e-05, 2.1114014089107513e-05, 2.2253021597862244e-05, 2.3392029106616974e-05, 2.4531036615371704e-05, 2.5670044124126434e-05, 2.6809051632881165e-05, 2.7948059141635895e-05, 2.9087066650390625e-05]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 6.0, 8.0, 13.0, 22.0, 27.0, 28.0, 51.0, 76.0, 101.0, 125.0, 120.0, 103.0, 56.0, 50.0, 48.0, 32.0, 29.0, 24.0, 13.0, 11.0, 9.0, 5.0, 6.0, 8.0, 5.0, 1.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017065282736439258, -0.00016529108688700944, -0.0001599293464096263, -0.00015456760593224317, -0.0001492058509029448, -0.00014384411042556167, -0.00013848236994817853, -0.0001331206294707954, -0.00012775888899341226, -0.00012239714851602912, -0.00011703540803864598, -0.00011167366028530523, -0.0001063119198079221, -0.00010095017933053896, -9.558843157719821e-05, -9.022669109981507e-05, -8.486495062243193e-05, -7.95032101450488e-05, -7.414146966766566e-05, -6.877972191432491e-05, -6.341798143694177e-05, -5.8056240959558636e-05, -5.269449684419669e-05, -4.733275272883475e-05, -4.197101225145161e-05, -3.6609271774068475e-05, -3.124752765870653e-05, -2.588578536233399e-05, -2.052404306596145e-05, -1.516230076958891e-05, -9.80055847321637e-06, -4.438814357854426e-06, 9.229115676134825e-07, 6.284653863986023e-06, 1.1646396160358563e-05, 1.7008138456731103e-05, 2.2369880753103644e-05, 2.7731623049476184e-05, 3.3093365345848724e-05, 3.845510946121067e-05, 4.3816849938593805e-05, 4.917859041597694e-05, 5.4540334531338885e-05, 5.990207864670083e-05, 6.526381912408397e-05, 7.06255596014671e-05, 7.598730735480785e-05, 8.134904783219099e-05, 8.671078830957413e-05, 9.207252878695726e-05, 9.74342692643404e-05, 0.00010279601701768115, 0.00010815775749506429, 0.00011351949797244743, 0.00011888124572578818, 0.0001242429862031713, 0.00012960472668055445, 0.00013496646715793759, 0.00014032820763532072, 0.00014568994811270386, 0.00015105170314200222, 0.00015641344361938536, 0.0001617751840967685, 0.00016713692457415164, 0.00017249866505153477]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 12.0, 5.0, 12.0, 17.0, 19.0, 17.0, 22.0, 25.0, 31.0, 33.0, 28.0, 31.0, 40.0, 30.0, 43.0, 38.0, 41.0, 44.0, 50.0, 46.0, 43.0, 36.0, 42.0, 26.0, 32.0, 30.0, 32.0, 25.0, 21.0, 17.0, 19.0, 13.0, 12.0, 16.0, 9.0, 9.0, 6.0, 1.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-9.161233901977539e-05, -8.882023394107819e-05, -8.602812886238098e-05, -8.323602378368378e-05, -8.044391870498657e-05, -7.765181362628937e-05, -7.485970854759216e-05, -7.206760346889496e-05, -6.927549839019775e-05, -6.648339331150055e-05, -6.369128823280334e-05, -6.089918315410614e-05, -5.8107078075408936e-05, -5.531497299671173e-05, -5.2522867918014526e-05, -4.973076283931732e-05, -4.693865776062012e-05, -4.414655268192291e-05, -4.135444760322571e-05, -3.8562342524528503e-05, -3.57702374458313e-05, -3.2978132367134094e-05, -3.018602728843689e-05, -2.7393922209739685e-05, -2.460181713104248e-05, -2.1809712052345276e-05, -1.901760697364807e-05, -1.6225501894950867e-05, -1.3433396816253662e-05, -1.0641291737556458e-05, -7.849186658859253e-06, -5.057081580162048e-06, -2.2649765014648438e-06, 5.271285772323608e-07, 3.3192336559295654e-06, 6.11133873462677e-06, 8.903443813323975e-06, 1.169554889202118e-05, 1.4487653970718384e-05, 1.727975904941559e-05, 2.0071864128112793e-05, 2.2863969206809998e-05, 2.5656074285507202e-05, 2.8448179364204407e-05, 3.124028444290161e-05, 3.4032389521598816e-05, 3.682449460029602e-05, 3.9616599678993225e-05, 4.240870475769043e-05, 4.5200809836387634e-05, 4.799291491508484e-05, 5.0785019993782043e-05, 5.357712507247925e-05, 5.636923015117645e-05, 5.916133522987366e-05, 6.195344030857086e-05, 6.474554538726807e-05, 6.753765046596527e-05, 7.032975554466248e-05, 7.312186062335968e-05, 7.591396570205688e-05, 7.870607078075409e-05, 8.14981758594513e-05, 8.42902809381485e-05, 8.70823860168457e-05]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 8.0, 9.0, 16.0, 21.0, 42.0, 38.0, 76.0, 107.0, 196.0, 341.0, 596.0, 1079.0, 2012.0, 3812.0, 8146.0, 19524.0, 58118.0, 243780.0, 553559.0, 103929.0, 30191.0, 11695.0, 5424.0, 2622.0, 1332.0, 776.0, 423.0, 244.0, 154.0, 96.0, 61.0, 33.0, 28.0, 14.0, 13.0, 9.0, 4.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00011289119720458984, -0.00010949280112981796, -0.00010609440505504608, -0.0001026960089802742, -9.929761290550232e-05, -9.589921683073044e-05, -9.250082075595856e-05, -8.910242468118668e-05, -8.57040286064148e-05, -8.230563253164291e-05, -7.890723645687103e-05, -7.550884038209915e-05, -7.211044430732727e-05, -6.871204823255539e-05, -6.531365215778351e-05, -6.191525608301163e-05, -5.8516860008239746e-05, -5.5118463933467865e-05, -5.1720067858695984e-05, -4.83216717839241e-05, -4.492327570915222e-05, -4.152487963438034e-05, -3.812648355960846e-05, -3.472808748483658e-05, -3.13296914100647e-05, -2.7931295335292816e-05, -2.4532899260520935e-05, -2.1134503185749054e-05, -1.7736107110977173e-05, -1.4337711036205292e-05, -1.093931496143341e-05, -7.5409188866615295e-06, -4.1425228118896484e-06, -7.441267371177673e-07, 2.6542693376541138e-06, 6.052665412425995e-06, 9.451061487197876e-06, 1.2849457561969757e-05, 1.6247853636741638e-05, 1.964624971151352e-05, 2.30446457862854e-05, 2.644304186105728e-05, 2.9841437935829163e-05, 3.3239834010601044e-05, 3.6638230085372925e-05, 4.0036626160144806e-05, 4.343502223491669e-05, 4.683341830968857e-05, 5.023181438446045e-05, 5.363021045923233e-05, 5.702860653400421e-05, 6.042700260877609e-05, 6.382539868354797e-05, 6.722379475831985e-05, 7.062219083309174e-05, 7.402058690786362e-05, 7.74189829826355e-05, 8.081737905740738e-05, 8.421577513217926e-05, 8.761417120695114e-05, 9.101256728172302e-05, 9.44109633564949e-05, 9.780935943126678e-05, 0.00010120775550603867, 0.00010460615158081055]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 12.0, 12.0, 14.0, 17.0, 20.0, 22.0, 47.0, 63.0, 82.0, 90.0, 104.0, 86.0, 78.0, 81.0, 76.0, 49.0, 55.0, 19.0, 22.0, 7.0, 8.0, 8.0, 3.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-05, -1.4884397387504578e-05, -1.4271587133407593e-05, -1.3658776879310608e-05, -1.3045966625213623e-05, -1.2433156371116638e-05, -1.1820346117019653e-05, -1.1207535862922668e-05, -1.0594725608825684e-05, -9.981915354728699e-06, -9.369105100631714e-06, -8.756294846534729e-06, -8.143484592437744e-06, -7.530674338340759e-06, -6.917864084243774e-06, -6.3050538301467896e-06, -5.692243576049805e-06, -5.07943332195282e-06, -4.466623067855835e-06, -3.85381281375885e-06, -3.2410025596618652e-06, -2.6281923055648804e-06, -2.0153820514678955e-06, -1.4025717973709106e-06, -7.897615432739258e-07, -1.7695128917694092e-07, 4.3585896492004395e-07, 1.0486692190170288e-06, 1.6614794731140137e-06, 2.2742897272109985e-06, 2.8870999813079834e-06, 3.4999102354049683e-06, 4.112720489501953e-06, 4.725530743598938e-06, 5.338340997695923e-06, 5.951151251792908e-06, 6.563961505889893e-06, 7.1767717599868774e-06, 7.789582014083862e-06, 8.402392268180847e-06, 9.015202522277832e-06, 9.628012776374817e-06, 1.0240823030471802e-05, 1.0853633284568787e-05, 1.1466443538665771e-05, 1.2079253792762756e-05, 1.2692064046859741e-05, 1.3304874300956726e-05, 1.3917684555053711e-05, 1.4530494809150696e-05, 1.514330506324768e-05, 1.5756115317344666e-05, 1.636892557144165e-05, 1.6981735825538635e-05, 1.759454607963562e-05, 1.8207356333732605e-05, 1.882016658782959e-05, 1.9432976841926575e-05, 2.004578709602356e-05, 2.0658597350120544e-05, 2.127140760421753e-05, 2.1884217858314514e-05, 2.24970281124115e-05, 2.3109838366508484e-05, 2.372264862060547e-05]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 10.0, 18.0, 15.0, 33.0, 39.0, 66.0, 73.0, 107.0, 164.0, 261.0, 385.0, 655.0, 952.0, 1462.0, 2252.0, 3876.0, 6016.0, 9578.0, 16049.0, 26728.0, 47450.0, 90712.0, 212054.0, 360048.0, 123139.0, 61265.0, 35357.0, 18972.0, 11655.0, 7236.0, 4195.0, 2628.0, 1752.0, 1123.0, 737.0, 502.0, 357.0, 194.0, 143.0, 91.0, 76.0, 42.0, 30.0, 19.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.9742717742919922e-05, -2.872385084629059e-05, -2.7704983949661255e-05, -2.668611705303192e-05, -2.5667250156402588e-05, -2.4648383259773254e-05, -2.362951636314392e-05, -2.2610649466514587e-05, -2.1591782569885254e-05, -2.057291567325592e-05, -1.9554048776626587e-05, -1.8535181879997253e-05, -1.751631498336792e-05, -1.6497448086738586e-05, -1.5478581190109253e-05, -1.445971429347992e-05, -1.3440847396850586e-05, -1.2421980500221252e-05, -1.1403113603591919e-05, -1.0384246706962585e-05, -9.365379810333252e-06, -8.346512913703918e-06, -7.327646017074585e-06, -6.3087791204452515e-06, -5.289912223815918e-06, -4.2710453271865845e-06, -3.252178430557251e-06, -2.2333115339279175e-06, -1.214444637298584e-06, -1.955777406692505e-07, 8.23289155960083e-07, 1.8421560525894165e-06, 2.86102294921875e-06, 3.8798898458480835e-06, 4.898756742477417e-06, 5.9176236391067505e-06, 6.936490535736084e-06, 7.955357432365417e-06, 8.974224328994751e-06, 9.993091225624084e-06, 1.1011958122253418e-05, 1.2030825018882751e-05, 1.3049691915512085e-05, 1.4068558812141418e-05, 1.5087425708770752e-05, 1.6106292605400085e-05, 1.712515950202942e-05, 1.8144026398658752e-05, 1.9162893295288086e-05, 2.018176019191742e-05, 2.1200627088546753e-05, 2.2219493985176086e-05, 2.323836088180542e-05, 2.4257227778434753e-05, 2.5276094675064087e-05, 2.629496157169342e-05, 2.7313828468322754e-05, 2.8332695364952087e-05, 2.935156226158142e-05, 3.0370429158210754e-05, 3.138929605484009e-05, 3.240816295146942e-05, 3.3427029848098755e-05, 3.444589674472809e-05, 3.546476364135742e-05]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 10.0, 12.0, 10.0, 16.0, 10.0, 12.0, 8.0, 20.0, 20.0, 23.0, 22.0, 28.0, 30.0, 29.0, 30.0, 45.0, 34.0, 44.0, 46.0, 53.0, 35.0, 46.0, 33.0, 49.0, 39.0, 41.0, 32.0, 34.0, 33.0, 21.0, 25.0, 16.0, 18.0, 12.0, 10.0, 12.0, 7.0, 7.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5391578674316406e-05, -2.453010529279709e-05, -2.366863191127777e-05, -2.2807158529758453e-05, -2.1945685148239136e-05, -2.1084211766719818e-05, -2.02227383852005e-05, -1.9361265003681183e-05, -1.8499791622161865e-05, -1.7638318240642548e-05, -1.677684485912323e-05, -1.5915371477603912e-05, -1.5053898096084595e-05, -1.4192424714565277e-05, -1.333095133304596e-05, -1.2469477951526642e-05, -1.1608004570007324e-05, -1.0746531188488007e-05, -9.885057806968689e-06, -9.023584425449371e-06, -8.162111043930054e-06, -7.300637662410736e-06, -6.4391642808914185e-06, -5.577690899372101e-06, -4.716217517852783e-06, -3.8547441363334656e-06, -2.993270754814148e-06, -2.1317973732948303e-06, -1.2703239917755127e-06, -4.0885061025619507e-07, 4.5262277126312256e-07, 1.3140961527824402e-06, 2.175569534301758e-06, 3.0370429158210754e-06, 3.898516297340393e-06, 4.759989678859711e-06, 5.621463060379028e-06, 6.482936441898346e-06, 7.3444098234176636e-06, 8.205883204936981e-06, 9.067356586456299e-06, 9.928829967975616e-06, 1.0790303349494934e-05, 1.1651776731014252e-05, 1.251325011253357e-05, 1.3374723494052887e-05, 1.4236196875572205e-05, 1.5097670257091522e-05, 1.595914363861084e-05, 1.6820617020130157e-05, 1.7682090401649475e-05, 1.8543563783168793e-05, 1.940503716468811e-05, 2.0266510546207428e-05, 2.1127983927726746e-05, 2.1989457309246063e-05, 2.285093069076538e-05, 2.37124040722847e-05, 2.4573877453804016e-05, 2.5435350835323334e-05, 2.629682421684265e-05, 2.715829759836197e-05, 2.8019770979881287e-05, 2.8881244361400604e-05, 2.9742717742919922e-05]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 4.0, 12.0, 19.0, 19.0, 33.0, 50.0, 59.0, 94.0, 122.0, 237.0, 380.0, 639.0, 1122.0, 2049.0, 4247.0, 9593.0, 25346.0, 75109.0, 262257.0, 459388.0, 136775.0, 42890.0, 15351.0, 6293.0, 2883.0, 1483.0, 855.0, 453.0, 289.0, 165.0, 113.0, 88.0, 36.0, 22.0, 25.0, 15.0, 13.0, 9.0, 2.0, 7.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.577210009098053e-06, -3.458932042121887e-06, -3.3406540751457214e-06, -3.2223761081695557e-06, -3.10409814119339e-06, -2.985820174217224e-06, -2.8675422072410583e-06, -2.7492642402648926e-06, -2.630986273288727e-06, -2.512708306312561e-06, -2.3944303393363953e-06, -2.2761523723602295e-06, -2.1578744053840637e-06, -2.039596438407898e-06, -1.921318471431732e-06, -1.8030405044555664e-06, -1.6847625374794006e-06, -1.5664845705032349e-06, -1.448206603527069e-06, -1.3299286365509033e-06, -1.2116506695747375e-06, -1.0933727025985718e-06, -9.75094735622406e-07, -8.568167686462402e-07, -7.385388016700745e-07, -6.202608346939087e-07, -5.019828677177429e-07, -3.8370490074157715e-07, -2.654269337654114e-07, -1.471489667892456e-07, -2.8870999813079834e-08, 8.940696716308594e-08, 2.076849341392517e-07, 3.259629011154175e-07, 4.4424086809158325e-07, 5.62518835067749e-07, 6.807968020439148e-07, 7.990747690200806e-07, 9.173527359962463e-07, 1.0356307029724121e-06, 1.1539086699485779e-06, 1.2721866369247437e-06, 1.3904646039009094e-06, 1.5087425708770752e-06, 1.627020537853241e-06, 1.7452985048294067e-06, 1.8635764718055725e-06, 1.9818544387817383e-06, 2.100132405757904e-06, 2.21841037273407e-06, 2.3366883397102356e-06, 2.4549663066864014e-06, 2.573244273662567e-06, 2.691522240638733e-06, 2.8098002076148987e-06, 2.9280781745910645e-06, 3.0463561415672302e-06, 3.164634108543396e-06, 3.2829120755195618e-06, 3.4011900424957275e-06, 3.5194680094718933e-06, 3.637745976448059e-06, 3.756023943424225e-06, 3.874301910400391e-06]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 6.0, 4.0, 0.0, 5.0, 0.0, 8.0, 11.0, 0.0, 15.0, 0.0, 24.0, 28.0, 0.0, 27.0, 0.0, 41.0, 34.0, 0.0, 55.0, 0.0, 53.0, 78.0, 0.0, 85.0, 0.0, 80.0, 0.0, 85.0, 75.0, 0.0, 43.0, 0.0, 65.0, 41.0, 0.0, 35.0, 0.0, 32.0, 34.0, 0.0, 14.0, 0.0, 9.0, 10.0, 0.0, 4.0, 0.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.0728836059570312e-06, -1.037493348121643e-06, -1.0021030902862549e-06, -9.667128324508667e-07, -9.313225746154785e-07, -8.959323167800903e-07, -8.605420589447021e-07, -8.25151801109314e-07, -7.897615432739258e-07, -7.543712854385376e-07, -7.189810276031494e-07, -6.835907697677612e-07, -6.48200511932373e-07, -6.128102540969849e-07, -5.774199962615967e-07, -5.420297384262085e-07, -5.066394805908203e-07, -4.7124922275543213e-07, -4.3585896492004395e-07, -4.0046870708465576e-07, -3.650784492492676e-07, -3.296881914138794e-07, -2.942979335784912e-07, -2.5890767574310303e-07, -2.2351741790771484e-07, -1.8812716007232666e-07, -1.5273690223693848e-07, -1.1734664440155029e-07, -8.195638656616211e-08, -4.6566128730773926e-08, -1.1175870895385742e-08, 2.421438694000244e-08, 5.960464477539063e-08, 9.499490261077881e-08, 1.30385160446167e-07, 1.6577541828155518e-07, 2.0116567611694336e-07, 2.3655593395233154e-07, 2.7194619178771973e-07, 3.073364496231079e-07, 3.427267074584961e-07, 3.781169652938843e-07, 4.1350722312927246e-07, 4.4889748096466064e-07, 4.842877388000488e-07, 5.19677996635437e-07, 5.550682544708252e-07, 5.904585123062134e-07, 6.258487701416016e-07, 6.612390279769897e-07, 6.966292858123779e-07, 7.320195436477661e-07, 7.674098014831543e-07, 8.028000593185425e-07, 8.381903171539307e-07, 8.735805749893188e-07, 9.08970832824707e-07, 9.443610906600952e-07, 9.797513484954834e-07, 1.0151416063308716e-06, 1.0505318641662598e-06, 1.085922122001648e-06, 1.1213123798370361e-06, 1.1567026376724243e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 19.0, 14.0, 26.0, 46.0, 129.0, 72.0, 114.0, 151.0, 224.0, 781.0, 573.0, 910.0, 1262.0, 4661.0, 4345.0, 7017.0, 11816.0, 58381.0, 75921.0, 179490.0, 357060.0, 255172.0, 37625.0, 20443.0, 11837.0, 7003.0, 7200.0, 1977.0, 1338.0, 899.0, 947.0, 308.0, 206.0, 142.0, 219.0, 60.0, 44.0, 36.0, 47.0, 10.0, 11.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.012588083744049e-06, -1.9390136003494263e-06, -1.8654391169548035e-06, -1.7918646335601807e-06, -1.7182901501655579e-06, -1.644715666770935e-06, -1.5711411833763123e-06, -1.4975666999816895e-06, -1.4239922165870667e-06, -1.3504177331924438e-06, -1.276843249797821e-06, -1.2032687664031982e-06, -1.1296942830085754e-06, -1.0561197996139526e-06, -9.825453162193298e-07, -9.08970832824707e-07, -8.353963494300842e-07, -7.618218660354614e-07, -6.882473826408386e-07, -6.146728992462158e-07, -5.41098415851593e-07, -4.675239324569702e-07, -3.939494490623474e-07, -3.203749656677246e-07, -2.468004822731018e-07, -1.73225998878479e-07, -9.96515154838562e-08, -2.60770320892334e-08, 4.7497451305389404e-08, 1.210719347000122e-07, 1.94646418094635e-07, 2.682209014892578e-07, 3.417953848838806e-07, 4.153698682785034e-07, 4.889443516731262e-07, 5.62518835067749e-07, 6.360933184623718e-07, 7.096678018569946e-07, 7.832422852516174e-07, 8.568167686462402e-07, 9.30391252040863e-07, 1.0039657354354858e-06, 1.0775402188301086e-06, 1.1511147022247314e-06, 1.2246891856193542e-06, 1.298263669013977e-06, 1.3718381524085999e-06, 1.4454126358032227e-06, 1.5189871191978455e-06, 1.5925616025924683e-06, 1.666136085987091e-06, 1.7397105693817139e-06, 1.8132850527763367e-06, 1.8868595361709595e-06, 1.9604340195655823e-06, 2.034008502960205e-06, 2.107582986354828e-06, 2.1811574697494507e-06, 2.2547319531440735e-06, 2.3283064365386963e-06, 2.401880919933319e-06, 2.475455403327942e-06, 2.5490298867225647e-06, 2.6226043701171875e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 10.0, 4.0, 18.0, 14.0, 15.0, 21.0, 0.0, 29.0, 28.0, 37.0, 43.0, 51.0, 55.0, 0.0, 57.0, 69.0, 70.0, 55.0, 59.0, 52.0, 0.0, 42.0, 40.0, 44.0, 40.0, 31.0, 20.0, 0.0, 16.0, 11.0, 12.0, 12.0, 5.0, 9.0, 0.0, 6.0, 1.0, 1.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6093254089355469e-06, -1.5581026673316956e-06, -1.5068799257278442e-06, -1.455657184123993e-06, -1.4044344425201416e-06, -1.3532117009162903e-06, -1.301988959312439e-06, -1.2507662177085876e-06, -1.1995434761047363e-06, -1.148320734500885e-06, -1.0970979928970337e-06, -1.0458752512931824e-06, -9.94652509689331e-07, -9.434297680854797e-07, -8.922070264816284e-07, -8.409842848777771e-07, -7.897615432739258e-07, -7.385388016700745e-07, -6.873160600662231e-07, -6.360933184623718e-07, -5.848705768585205e-07, -5.336478352546692e-07, -4.824250936508179e-07, -4.3120235204696655e-07, -3.7997961044311523e-07, -3.287568688392639e-07, -2.775341272354126e-07, -2.2631138563156128e-07, -1.7508864402770996e-07, -1.2386590242385864e-07, -7.264316082000732e-08, -2.1420419216156006e-08, 2.9802322387695312e-08, 8.102506399154663e-08, 1.3224780559539795e-07, 1.8347054719924927e-07, 2.3469328880310059e-07, 2.859160304069519e-07, 3.371387720108032e-07, 3.8836151361465454e-07, 4.3958425521850586e-07, 4.908069968223572e-07, 5.420297384262085e-07, 5.932524800300598e-07, 6.444752216339111e-07, 6.956979632377625e-07, 7.469207048416138e-07, 7.981434464454651e-07, 8.493661880493164e-07, 9.005889296531677e-07, 9.51811671257019e-07, 1.0030344128608704e-06, 1.0542571544647217e-06, 1.105479896068573e-06, 1.1567026376724243e-06, 1.2079253792762756e-06, 1.259148120880127e-06, 1.3103708624839783e-06, 1.3615936040878296e-06, 1.412816345691681e-06, 1.4640390872955322e-06, 1.5152618288993835e-06, 1.5664845705032349e-06, 1.6177073121070862e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 11.0, 17.0, 17.0, 21.0, 32.0, 48.0, 73.0, 103.0, 153.0, 111.0, 70.0, 80.0, 35.0, 28.0, 27.0, 26.0, 18.0, 23.0, 14.0, 7.0, 7.0, 11.0, 6.0, 9.0, 13.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.561863407725468e-05, -9.201111242873594e-05, -8.84035907802172e-05, -8.479606913169846e-05, -8.11885402072221e-05, -7.758101855870336e-05, -7.397349691018462e-05, -7.036597526166588e-05, -6.675845361314714e-05, -6.31509319646284e-05, -5.954341031610966e-05, -5.593588502961211e-05, -5.232836338109337e-05, -4.872084173257463e-05, -4.511331644607708e-05, -4.150579479755834e-05, -3.7898273149039596e-05, -3.4290751500520855e-05, -3.0683229852002114e-05, -2.7075704565504566e-05, -2.3468182916985825e-05, -1.9860661268467084e-05, -1.625313780095894e-05, -1.2645614333450794e-05, -9.038092684932053e-06, -5.43057012691861e-06, -1.8230475689051673e-06, 1.7844749891082756e-06, 5.3919975471217185e-06, 8.99951919564046e-06, 1.2607042663148604e-05, 1.621456613065675e-05, 1.9822080503217876e-05, 2.3429602151736617e-05, 2.7037125619244762e-05, 3.0644649086752906e-05, 3.425217073527165e-05, 3.785969238379039e-05, 4.146721767028794e-05, 4.507473931880668e-05, 4.868226096732542e-05, 5.228978261584416e-05, 5.58973042643629e-05, 5.950482955086045e-05, 6.3112354837358e-05, 6.671987648587674e-05, 7.032739813439548e-05, 7.393491978291422e-05, 7.754244143143296e-05, 8.11499630799517e-05, 8.475748472847044e-05, 8.836500637698919e-05, 9.197252802550793e-05, 9.558004967402667e-05, 9.918757859850302e-05, 0.00010279510024702176, 0.0001064026218955405, 0.00011001014354405925, 0.00011361766519257799, 0.00011722518684109673, 0.00012083271576557308, 0.00012444023741409183, 0.00012804775906261057, 0.0001316552807111293, 0.00013526280235964805]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 9.0, 6.0, 5.0, 10.0, 10.0, 17.0, 16.0, 17.0, 15.0, 27.0, 29.0, 30.0, 25.0, 35.0, 40.0, 31.0, 48.0, 28.0, 37.0, 38.0, 41.0, 40.0, 47.0, 37.0, 35.0, 37.0, 40.0, 28.0, 28.0, 28.0, 23.0, 15.0, 19.0, 15.0, 9.0, 14.0, 18.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.26120376586914e-05, -8.016545325517654e-05, -7.771886885166168e-05, -7.527228444814682e-05, -7.282570004463196e-05, -7.03791156411171e-05, -6.793253123760223e-05, -6.548594683408737e-05, -6.303936243057251e-05, -6.059277802705765e-05, -5.8146193623542786e-05, -5.5699609220027924e-05, -5.325302481651306e-05, -5.08064404129982e-05, -4.835985600948334e-05, -4.5913271605968475e-05, -4.346668720245361e-05, -4.102010279893875e-05, -3.857351839542389e-05, -3.612693399190903e-05, -3.3680349588394165e-05, -3.12337651848793e-05, -2.878718078136444e-05, -2.634059637784958e-05, -2.3894011974334717e-05, -2.1447427570819855e-05, -1.9000843167304993e-05, -1.655425876379013e-05, -1.4107674360275269e-05, -1.1661089956760406e-05, -9.214505553245544e-06, -6.767921149730682e-06, -4.32133674621582e-06, -1.8747523427009583e-06, 5.718320608139038e-07, 3.018416464328766e-06, 5.465000867843628e-06, 7.91158527135849e-06, 1.0358169674873352e-05, 1.2804754078388214e-05, 1.5251338481903076e-05, 1.7697922885417938e-05, 2.01445072889328e-05, 2.2591091692447662e-05, 2.5037676095962524e-05, 2.7484260499477386e-05, 2.993084490299225e-05, 3.237742930650711e-05, 3.482401371002197e-05, 3.7270598113536835e-05, 3.97171825170517e-05, 4.216376692056656e-05, 4.461035132408142e-05, 4.705693572759628e-05, 4.9503520131111145e-05, 5.195010453462601e-05, 5.439668893814087e-05, 5.684327334165573e-05, 5.928985774517059e-05, 6.173644214868546e-05, 6.418302655220032e-05, 6.662961095571518e-05, 6.907619535923004e-05, 7.15227797627449e-05, 7.396936416625977e-05]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 8.0, 18.0, 24.0, 34.0, 61.0, 68.0, 90.0, 176.0, 294.0, 433.0, 657.0, 1153.0, 2046.0, 3774.0, 8444.0, 21705.0, 123401.0, 3933626.0, 68947.0, 16205.0, 6408.0, 2962.0, 1697.0, 792.0, 496.0, 264.0, 149.0, 95.0, 75.0, 43.0, 31.0, 25.0, 18.0, 13.0, 15.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.414817810058594e-05, -7.144175469875336e-05, -6.873533129692078e-05, -6.60289078950882e-05, -6.332248449325562e-05, -6.0616061091423035e-05, -5.7909637689590454e-05, -5.5203214287757874e-05, -5.249679088592529e-05, -4.979036748409271e-05, -4.708394408226013e-05, -4.437752068042755e-05, -4.167109727859497e-05, -3.896467387676239e-05, -3.625825047492981e-05, -3.355182707309723e-05, -3.084540367126465e-05, -2.8138980269432068e-05, -2.5432556867599487e-05, -2.2726133465766907e-05, -2.0019710063934326e-05, -1.7313286662101746e-05, -1.4606863260269165e-05, -1.1900439858436584e-05, -9.194016456604004e-06, -6.487593054771423e-06, -3.7811696529388428e-06, -1.0747462511062622e-06, 1.6316771507263184e-06, 4.338100552558899e-06, 7.0445239543914795e-06, 9.75094735622406e-06, 1.245737075805664e-05, 1.5163794159889221e-05, 1.7870217561721802e-05, 2.0576640963554382e-05, 2.3283064365386963e-05, 2.5989487767219543e-05, 2.8695911169052124e-05, 3.1402334570884705e-05, 3.4108757972717285e-05, 3.6815181374549866e-05, 3.9521604776382446e-05, 4.222802817821503e-05, 4.493445158004761e-05, 4.764087498188019e-05, 5.034729838371277e-05, 5.305372178554535e-05, 5.576014518737793e-05, 5.846656858921051e-05, 6.117299199104309e-05, 6.387941539287567e-05, 6.658583879470825e-05, 6.929226219654083e-05, 7.199868559837341e-05, 7.4705109000206e-05, 7.741153240203857e-05, 8.011795580387115e-05, 8.282437920570374e-05, 8.553080260753632e-05, 8.82372260093689e-05, 9.094364941120148e-05, 9.365007281303406e-05, 9.635649621486664e-05, 9.906291961669922e-05]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 1.0, 6.0, 8.0, 5.0, 7.0, 9.0, 10.0, 21.0, 19.0, 35.0, 42.0, 71.0, 85.0, 89.0, 96.0, 83.0, 100.0, 79.0, 60.0, 39.0, 39.0, 29.0, 20.0, 6.0, 7.0, 7.0, 12.0, 3.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6570091247558594e-05, -1.595914363861084e-05, -1.5348196029663086e-05, -1.4737248420715332e-05, -1.4126300811767578e-05, -1.3515353202819824e-05, -1.290440559387207e-05, -1.2293457984924316e-05, -1.1682510375976562e-05, -1.1071562767028809e-05, -1.0460615158081055e-05, -9.8496675491333e-06, -9.238719940185547e-06, -8.627772331237793e-06, -8.016824722290039e-06, -7.405877113342285e-06, -6.794929504394531e-06, -6.183981895446777e-06, -5.5730342864990234e-06, -4.9620866775512695e-06, -4.351139068603516e-06, -3.7401914596557617e-06, -3.129243850708008e-06, -2.518296241760254e-06, -1.9073486328125e-06, -1.296401023864746e-06, -6.854534149169922e-07, -7.450580596923828e-08, 5.364418029785156e-07, 1.1473894119262695e-06, 1.7583370208740234e-06, 2.3692846298217773e-06, 2.9802322387695312e-06, 3.591179847717285e-06, 4.202127456665039e-06, 4.813075065612793e-06, 5.424022674560547e-06, 6.034970283508301e-06, 6.645917892456055e-06, 7.256865501403809e-06, 7.867813110351562e-06, 8.478760719299316e-06, 9.08970832824707e-06, 9.700655937194824e-06, 1.0311603546142578e-05, 1.0922551155090332e-05, 1.1533498764038086e-05, 1.214444637298584e-05, 1.2755393981933594e-05, 1.3366341590881348e-05, 1.3977289199829102e-05, 1.4588236808776855e-05, 1.519918441772461e-05, 1.5810132026672363e-05, 1.6421079635620117e-05, 1.703202724456787e-05, 1.7642974853515625e-05, 1.825392246246338e-05, 1.8864870071411133e-05, 1.9475817680358887e-05, 2.008676528930664e-05, 2.0697712898254395e-05, 2.130866050720215e-05, 2.1919608116149902e-05, 2.2530555725097656e-05]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 9.0, 14.0, 19.0, 34.0, 48.0, 67.0, 112.0, 151.0, 240.0, 409.0, 650.0, 967.0, 1776.0, 3161.0, 6274.0, 11767.0, 25015.0, 65032.0, 398877.0, 3460593.0, 140430.0, 41470.0, 17686.0, 8598.0, 4478.0, 2542.0, 1433.0, 927.0, 496.0, 335.0, 225.0, 157.0, 83.0, 68.0, 45.0, 32.0, 21.0, 15.0, 5.0, 10.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.0288083255290985e-05, -3.891251981258392e-05, -3.753695636987686e-05, -3.61613929271698e-05, -3.478582948446274e-05, -3.3410266041755676e-05, -3.2034702599048615e-05, -3.065913915634155e-05, -2.928357571363449e-05, -2.790801227092743e-05, -2.6532448828220367e-05, -2.5156885385513306e-05, -2.3781321942806244e-05, -2.2405758500099182e-05, -2.103019505739212e-05, -1.965463161468506e-05, -1.8279068171977997e-05, -1.6903504729270935e-05, -1.5527941286563873e-05, -1.4152377843856812e-05, -1.277681440114975e-05, -1.1401250958442688e-05, -1.0025687515735626e-05, -8.650124073028564e-06, -7.274560630321503e-06, -5.898997187614441e-06, -4.523433744907379e-06, -3.1478703022003174e-06, -1.7723068594932556e-06, -3.9674341678619385e-07, 9.78820025920868e-07, 2.3543834686279297e-06, 3.7299469113349915e-06, 5.105510354042053e-06, 6.481073796749115e-06, 7.856637239456177e-06, 9.232200682163239e-06, 1.06077641248703e-05, 1.1983327567577362e-05, 1.3358891010284424e-05, 1.4734454452991486e-05, 1.6110017895698547e-05, 1.748558133840561e-05, 1.886114478111267e-05, 2.0236708223819733e-05, 2.1612271666526794e-05, 2.2987835109233856e-05, 2.4363398551940918e-05, 2.573896199464798e-05, 2.711452543735504e-05, 2.8490088880062103e-05, 2.9865652322769165e-05, 3.124121576547623e-05, 3.261677920818329e-05, 3.399234265089035e-05, 3.536790609359741e-05, 3.6743469536304474e-05, 3.8119032979011536e-05, 3.94945964217186e-05, 4.087015986442566e-05, 4.224572330713272e-05, 4.362128674983978e-05, 4.4996850192546844e-05, 4.6372413635253906e-05]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 7.0, 5.0, 10.0, 7.0, 14.0, 20.0, 17.0, 24.0, 33.0, 35.0, 38.0, 73.0, 147.0, 383.0, 1112.0, 1352.0, 365.0, 138.0, 62.0, 35.0, 42.0, 20.0, 21.0, 20.0, 18.0, 12.0, 8.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6285648345947266e-05, -2.5346875190734863e-05, -2.440810203552246e-05, -2.346932888031006e-05, -2.2530555725097656e-05, -2.1591782569885254e-05, -2.065300941467285e-05, -1.971423625946045e-05, -1.8775463104248047e-05, -1.7836689949035645e-05, -1.6897916793823242e-05, -1.595914363861084e-05, -1.5020370483398438e-05, -1.4081597328186035e-05, -1.3142824172973633e-05, -1.220405101776123e-05, -1.1265277862548828e-05, -1.0326504707336426e-05, -9.387731552124023e-06, -8.448958396911621e-06, -7.510185241699219e-06, -6.571412086486816e-06, -5.632638931274414e-06, -4.693865776062012e-06, -3.7550926208496094e-06, -2.816319465637207e-06, -1.8775463104248047e-06, -9.387731552124023e-07, 0.0, 9.387731552124023e-07, 1.8775463104248047e-06, 2.816319465637207e-06, 3.7550926208496094e-06, 4.693865776062012e-06, 5.632638931274414e-06, 6.571412086486816e-06, 7.510185241699219e-06, 8.448958396911621e-06, 9.387731552124023e-06, 1.0326504707336426e-05, 1.1265277862548828e-05, 1.220405101776123e-05, 1.3142824172973633e-05, 1.4081597328186035e-05, 1.5020370483398438e-05, 1.595914363861084e-05, 1.6897916793823242e-05, 1.7836689949035645e-05, 1.8775463104248047e-05, 1.971423625946045e-05, 2.065300941467285e-05, 2.1591782569885254e-05, 2.2530555725097656e-05, 2.346932888031006e-05, 2.440810203552246e-05, 2.5346875190734863e-05, 2.6285648345947266e-05, 2.7224421501159668e-05, 2.816319465637207e-05, 2.9101967811584473e-05, 3.0040740966796875e-05, 3.097951412200928e-05, 3.191828727722168e-05, 3.285706043243408e-05, 3.3795833587646484e-05]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 7.0, 4.0, 18.0, 25.0, 35.0, 42.0, 56.0, 88.0, 107.0, 144.0, 98.0, 92.0, 61.0, 55.0, 40.0, 26.0, 19.0, 20.0, 10.0, 5.0, 13.0, 6.0, 8.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014836332411505282, -0.00014347155229188502, -0.00013857978046871722, -0.0001336879940936342, -0.0001287962222704664, -0.00012390445044729859, -0.00011901267862413079, -0.00011412090680096298, -0.00010922912770183757, -0.00010433735587866977, -9.944557677954435e-05, -9.455380495637655e-05, -8.966203313320875e-05, -8.477025403408334e-05, -7.987848221091554e-05, -7.498670311179012e-05, -7.009493128862232e-05, -6.520315946545452e-05, -6.0311380366329104e-05, -5.54196085431613e-05, -5.0527833082014695e-05, -4.563605762086809e-05, -4.0744285797700286e-05, -3.585251033655368e-05, -3.096073487540707e-05, -2.6068959414260462e-05, -2.1177185772103257e-05, -1.6285412129946053e-05, -1.1393636668799445e-05, -6.501861207652837e-06, -1.6100875654956326e-06, 3.281686076661572e-06, 8.17346153780818e-06, 1.3065236089460086e-05, 1.7957010641111992e-05, 2.2848784283269197e-05, 2.7740559744415805e-05, 3.263233520556241e-05, 3.7524107028730214e-05, 4.241588248987682e-05, 4.730765795102343e-05, 5.219943341217004e-05, 5.7091208873316646e-05, 6.198298069648445e-05, 6.687475251965225e-05, 7.176653161877766e-05, 7.665830344194546e-05, 8.155008254107088e-05, 8.644185436423868e-05, 9.133362618740648e-05, 9.62254052865319e-05, 0.0001011171771096997, 0.00010600895620882511, 0.00011090072803199291, 0.00011579249985516071, 0.00012068427167832851, 0.00012557604350149632, 0.00013046781532466412, 0.00013535958714783192, 0.00014025137352291495, 0.00014514314534608275, 0.00015003491716925055, 0.00015492668899241835, 0.00015981846081558615, 0.00016471024719066918]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 6.0, 7.0, 10.0, 6.0, 17.0, 15.0, 17.0, 18.0, 25.0, 26.0, 35.0, 29.0, 41.0, 43.0, 46.0, 47.0, 59.0, 41.0, 54.0, 42.0, 39.0, 39.0, 50.0, 44.0, 39.0, 31.0, 22.0, 27.0, 23.0, 20.0, 17.0, 11.0, 17.0, 12.0, 9.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.679794311523438e-05, -9.406637400388718e-05, -9.133480489253998e-05, -8.860323578119278e-05, -8.587166666984558e-05, -8.314009755849838e-05, -8.040852844715118e-05, -7.767695933580399e-05, -7.494539022445679e-05, -7.221382111310959e-05, -6.948225200176239e-05, -6.675068289041519e-05, -6.401911377906799e-05, -6.12875446677208e-05, -5.8555975556373596e-05, -5.58244064450264e-05, -5.30928373336792e-05, -5.0361268222332e-05, -4.76296991109848e-05, -4.4898129999637604e-05, -4.2166560888290405e-05, -3.943499177694321e-05, -3.670342266559601e-05, -3.397185355424881e-05, -3.124028444290161e-05, -2.8508715331554413e-05, -2.5777146220207214e-05, -2.3045577108860016e-05, -2.0314007997512817e-05, -1.758243888616562e-05, -1.485086977481842e-05, -1.2119300663471222e-05, -9.387731552124023e-06, -6.656162440776825e-06, -3.9245933294296265e-06, -1.193024218082428e-06, 1.5385448932647705e-06, 4.270114004611969e-06, 7.0016831159591675e-06, 9.733252227306366e-06, 1.2464821338653564e-05, 1.5196390450000763e-05, 1.792795956134796e-05, 2.065952867269516e-05, 2.339109778404236e-05, 2.6122666895389557e-05, 2.8854236006736755e-05, 3.1585805118083954e-05, 3.431737422943115e-05, 3.704894334077835e-05, 3.978051245212555e-05, 4.251208156347275e-05, 4.5243650674819946e-05, 4.7975219786167145e-05, 5.070678889751434e-05, 5.343835800886154e-05, 5.616992712020874e-05, 5.890149623155594e-05, 6.163306534290314e-05, 6.436463445425034e-05, 6.709620356559753e-05, 6.982777267694473e-05, 7.255934178829193e-05, 7.529091089963913e-05, 7.802248001098633e-05]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 12.0, 15.0, 26.0, 35.0, 40.0, 76.0, 103.0, 183.0, 261.0, 411.0, 647.0, 1090.0, 1785.0, 3151.0, 5633.0, 10239.0, 21098.0, 47043.0, 132037.0, 488254.0, 211190.0, 67306.0, 27374.0, 13652.0, 7257.0, 3880.0, 2283.0, 1306.0, 765.0, 457.0, 308.0, 173.0, 139.0, 89.0, 69.0, 52.0, 28.0, 21.0, 20.0, 8.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.231401443481445e-05, -8.000805974006653e-05, -7.77021050453186e-05, -7.539615035057068e-05, -7.309019565582275e-05, -7.078424096107483e-05, -6.84782862663269e-05, -6.617233157157898e-05, -6.386637687683105e-05, -6.156042218208313e-05, -5.9254467487335205e-05, -5.694851279258728e-05, -5.4642558097839355e-05, -5.233660340309143e-05, -5.0030648708343506e-05, -4.772469401359558e-05, -4.5418739318847656e-05, -4.311278462409973e-05, -4.080682992935181e-05, -3.850087523460388e-05, -3.619492053985596e-05, -3.388896584510803e-05, -3.158301115036011e-05, -2.9277056455612183e-05, -2.6971101760864258e-05, -2.4665147066116333e-05, -2.2359192371368408e-05, -2.0053237676620483e-05, -1.774728298187256e-05, -1.5441328287124634e-05, -1.3135373592376709e-05, -1.0829418897628784e-05, -8.52346420288086e-06, -6.2175095081329346e-06, -3.91155481338501e-06, -1.605600118637085e-06, 7.003545761108398e-07, 3.0063092708587646e-06, 5.3122639656066895e-06, 7.618218660354614e-06, 9.924173355102539e-06, 1.2230128049850464e-05, 1.4536082744598389e-05, 1.6842037439346313e-05, 1.9147992134094238e-05, 2.1453946828842163e-05, 2.3759901523590088e-05, 2.6065856218338013e-05, 2.8371810913085938e-05, 3.067776560783386e-05, 3.298372030258179e-05, 3.528967499732971e-05, 3.759562969207764e-05, 3.990158438682556e-05, 4.2207539081573486e-05, 4.451349377632141e-05, 4.6819448471069336e-05, 4.912540316581726e-05, 5.1431357860565186e-05, 5.373731255531311e-05, 5.6043267250061035e-05, 5.834922194480896e-05, 6.0655176639556885e-05, 6.296113133430481e-05, 6.526708602905273e-05]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 10.0, 12.0, 17.0, 17.0, 22.0, 22.0, 30.0, 49.0, 74.0, 81.0, 81.0, 69.0, 78.0, 77.0, 74.0, 53.0, 48.0, 37.0, 28.0, 23.0, 15.0, 22.0, 7.0, 7.0, 6.0, 10.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8596649169921875e-05, -1.8084421753883362e-05, -1.757219433784485e-05, -1.7059966921806335e-05, -1.6547739505767822e-05, -1.603551208972931e-05, -1.5523284673690796e-05, -1.5011057257652283e-05, -1.449882984161377e-05, -1.3986602425575256e-05, -1.3474375009536743e-05, -1.296214759349823e-05, -1.2449920177459717e-05, -1.1937692761421204e-05, -1.142546534538269e-05, -1.0913237929344177e-05, -1.0401010513305664e-05, -9.888783097267151e-06, -9.376555681228638e-06, -8.864328265190125e-06, -8.352100849151611e-06, -7.839873433113098e-06, -7.327646017074585e-06, -6.815418601036072e-06, -6.303191184997559e-06, -5.790963768959045e-06, -5.278736352920532e-06, -4.766508936882019e-06, -4.254281520843506e-06, -3.7420541048049927e-06, -3.2298266887664795e-06, -2.7175992727279663e-06, -2.205371856689453e-06, -1.69314444065094e-06, -1.1809170246124268e-06, -6.686896085739136e-07, -1.564621925354004e-07, 3.557652235031128e-07, 8.67992639541626e-07, 1.3802200555801392e-06, 1.8924474716186523e-06, 2.4046748876571655e-06, 2.9169023036956787e-06, 3.429129719734192e-06, 3.941357135772705e-06, 4.453584551811218e-06, 4.9658119678497314e-06, 5.478039383888245e-06, 5.990266799926758e-06, 6.502494215965271e-06, 7.014721632003784e-06, 7.526949048042297e-06, 8.03917646408081e-06, 8.551403880119324e-06, 9.063631296157837e-06, 9.57585871219635e-06, 1.0088086128234863e-05, 1.0600313544273376e-05, 1.111254096031189e-05, 1.1624768376350403e-05, 1.2136995792388916e-05, 1.264922320842743e-05, 1.3161450624465942e-05, 1.3673678040504456e-05, 1.4185905456542969e-05]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 16.0, 24.0, 34.0, 46.0, 81.0, 107.0, 172.0, 255.0, 370.0, 632.0, 966.0, 1532.0, 2312.0, 3627.0, 6386.0, 10370.0, 17101.0, 30542.0, 56084.0, 124524.0, 347169.0, 237437.0, 94825.0, 50149.0, 25710.0, 14789.0, 8750.0, 5290.0, 3482.0, 2049.0, 1287.0, 870.0, 546.0, 355.0, 230.0, 157.0, 95.0, 68.0, 35.0, 27.0, 7.0, 14.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.4749507904052734e-05, -3.372319042682648e-05, -3.269687294960022e-05, -3.167055547237396e-05, -3.0644237995147705e-05, -2.9617920517921448e-05, -2.859160304069519e-05, -2.7565285563468933e-05, -2.6538968086242676e-05, -2.551265060901642e-05, -2.448633313179016e-05, -2.3460015654563904e-05, -2.2433698177337646e-05, -2.140738070011139e-05, -2.0381063222885132e-05, -1.9354745745658875e-05, -1.8328428268432617e-05, -1.730211079120636e-05, -1.6275793313980103e-05, -1.5249475836753845e-05, -1.4223158359527588e-05, -1.319684088230133e-05, -1.2170523405075073e-05, -1.1144205927848816e-05, -1.0117888450622559e-05, -9.091570973396301e-06, -8.065253496170044e-06, -7.038936018943787e-06, -6.012618541717529e-06, -4.986301064491272e-06, -3.959983587265015e-06, -2.9336661100387573e-06, -1.9073486328125e-06, -8.810311555862427e-07, 1.4528632164001465e-07, 1.171603798866272e-06, 2.1979212760925293e-06, 3.2242387533187866e-06, 4.250556230545044e-06, 5.276873707771301e-06, 6.303191184997559e-06, 7.329508662223816e-06, 8.355826139450073e-06, 9.38214361667633e-06, 1.0408461093902588e-05, 1.1434778571128845e-05, 1.2461096048355103e-05, 1.348741352558136e-05, 1.4513731002807617e-05, 1.5540048480033875e-05, 1.6566365957260132e-05, 1.759268343448639e-05, 1.8619000911712646e-05, 1.9645318388938904e-05, 2.067163586616516e-05, 2.169795334339142e-05, 2.2724270820617676e-05, 2.3750588297843933e-05, 2.477690577507019e-05, 2.5803223252296448e-05, 2.6829540729522705e-05, 2.7855858206748962e-05, 2.888217568397522e-05, 2.9908493161201477e-05, 3.0934810638427734e-05]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 6.0, 16.0, 13.0, 13.0, 13.0, 13.0, 14.0, 24.0, 24.0, 26.0, 21.0, 32.0, 48.0, 57.0, 37.0, 33.0, 37.0, 34.0, 36.0, 42.0, 36.0, 49.0, 49.0, 31.0, 33.0, 31.0, 35.0, 22.0, 24.0, 18.0, 16.0, 25.0, 16.0, 11.0, 11.0, 6.0, 7.0, 3.0, 9.0, 5.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.8014183044433594e-05, -2.7186237275600433e-05, -2.6358291506767273e-05, -2.5530345737934113e-05, -2.4702399969100952e-05, -2.3874454200267792e-05, -2.304650843143463e-05, -2.221856266260147e-05, -2.139061689376831e-05, -2.056267112493515e-05, -1.973472535610199e-05, -1.890677958726883e-05, -1.807883381843567e-05, -1.725088804960251e-05, -1.6422942280769348e-05, -1.5594996511936188e-05, -1.4767050743103027e-05, -1.3939104974269867e-05, -1.3111159205436707e-05, -1.2283213436603546e-05, -1.1455267667770386e-05, -1.0627321898937225e-05, -9.799376130104065e-06, -8.971430361270905e-06, -8.143484592437744e-06, -7.315538823604584e-06, -6.487593054771423e-06, -5.659647285938263e-06, -4.8317015171051025e-06, -4.003755748271942e-06, -3.1758099794387817e-06, -2.3478642106056213e-06, -1.519918441772461e-06, -6.919726729393005e-07, 1.3597309589385986e-07, 9.639188647270203e-07, 1.7918646335601807e-06, 2.619810402393341e-06, 3.4477561712265015e-06, 4.275701940059662e-06, 5.103647708892822e-06, 5.931593477725983e-06, 6.759539246559143e-06, 7.5874850153923035e-06, 8.415430784225464e-06, 9.243376553058624e-06, 1.0071322321891785e-05, 1.0899268090724945e-05, 1.1727213859558105e-05, 1.2555159628391266e-05, 1.3383105397224426e-05, 1.4211051166057587e-05, 1.5038996934890747e-05, 1.5866942703723907e-05, 1.6694888472557068e-05, 1.7522834241390228e-05, 1.835078001022339e-05, 1.917872577905655e-05, 2.000667154788971e-05, 2.083461731672287e-05, 2.166256308555603e-05, 2.249050885438919e-05, 2.331845462322235e-05, 2.414640039205551e-05, 2.4974346160888672e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 4.0, 0.0, 4.0, 11.0, 22.0, 28.0, 46.0, 80.0, 52.0, 158.0, 223.0, 385.0, 704.0, 1114.0, 941.0, 2905.0, 5944.0, 13716.0, 36281.0, 118848.0, 176453.0, 509336.0, 118666.0, 36195.0, 13577.0, 6216.0, 2914.0, 887.0, 1086.0, 680.0, 387.0, 248.0, 172.0, 48.0, 63.0, 53.0, 29.0, 23.0, 18.0, 8.0, 5.0, 6.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.4067779779434204e-06, -3.296881914138794e-06, -3.1869858503341675e-06, -3.077089786529541e-06, -2.9671937227249146e-06, -2.857297658920288e-06, -2.7474015951156616e-06, -2.637505531311035e-06, -2.5276094675064087e-06, -2.4177134037017822e-06, -2.3078173398971558e-06, -2.1979212760925293e-06, -2.088025212287903e-06, -1.9781291484832764e-06, -1.86823308467865e-06, -1.7583370208740234e-06, -1.648440957069397e-06, -1.5385448932647705e-06, -1.428648829460144e-06, -1.3187527656555176e-06, -1.2088567018508911e-06, -1.0989606380462646e-06, -9.890645742416382e-07, -8.791685104370117e-07, -7.692724466323853e-07, -6.593763828277588e-07, -5.494803190231323e-07, -4.3958425521850586e-07, -3.296881914138794e-07, -2.1979212760925293e-07, -1.0989606380462646e-07, 0.0, 1.0989606380462646e-07, 2.1979212760925293e-07, 3.296881914138794e-07, 4.3958425521850586e-07, 5.494803190231323e-07, 6.593763828277588e-07, 7.692724466323853e-07, 8.791685104370117e-07, 9.890645742416382e-07, 1.0989606380462646e-06, 1.2088567018508911e-06, 1.3187527656555176e-06, 1.428648829460144e-06, 1.5385448932647705e-06, 1.648440957069397e-06, 1.7583370208740234e-06, 1.86823308467865e-06, 1.9781291484832764e-06, 2.088025212287903e-06, 2.1979212760925293e-06, 2.3078173398971558e-06, 2.4177134037017822e-06, 2.5276094675064087e-06, 2.637505531311035e-06, 2.7474015951156616e-06, 2.857297658920288e-06, 2.9671937227249146e-06, 3.077089786529541e-06, 3.1869858503341675e-06, 3.296881914138794e-06, 3.4067779779434204e-06, 3.516674041748047e-06]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 8.0, 9.0, 0.0, 15.0, 0.0, 15.0, 0.0, 17.0, 0.0, 35.0, 29.0, 0.0, 41.0, 0.0, 59.0, 0.0, 83.0, 88.0, 0.0, 92.0, 0.0, 97.0, 0.0, 84.0, 0.0, 67.0, 61.0, 0.0, 44.0, 0.0, 28.0, 0.0, 34.0, 28.0, 0.0, 18.0, 0.0, 20.0, 0.0, 24.0, 0.0, 8.0, 6.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.201467037200928e-07, -8.866190910339355e-07, -8.530914783477783e-07, -8.195638656616211e-07, -7.860362529754639e-07, -7.525086402893066e-07, -7.189810276031494e-07, -6.854534149169922e-07, -6.51925802230835e-07, -6.183981895446777e-07, -5.848705768585205e-07, -5.513429641723633e-07, -5.178153514862061e-07, -4.842877388000488e-07, -4.507601261138916e-07, -4.172325134277344e-07, -3.8370490074157715e-07, -3.501772880554199e-07, -3.166496753692627e-07, -2.8312206268310547e-07, -2.4959444999694824e-07, -2.1606683731079102e-07, -1.825392246246338e-07, -1.4901161193847656e-07, -1.1548399925231934e-07, -8.195638656616211e-08, -4.842877388000488e-08, -1.4901161193847656e-08, 1.862645149230957e-08, 5.21540641784668e-08, 8.568167686462402e-08, 1.1920928955078125e-07, 1.5273690223693848e-07, 1.862645149230957e-07, 2.1979212760925293e-07, 2.5331974029541016e-07, 2.868473529815674e-07, 3.203749656677246e-07, 3.5390257835388184e-07, 3.8743019104003906e-07, 4.209578037261963e-07, 4.544854164123535e-07, 4.880130290985107e-07, 5.21540641784668e-07, 5.550682544708252e-07, 5.885958671569824e-07, 6.221234798431396e-07, 6.556510925292969e-07, 6.891787052154541e-07, 7.227063179016113e-07, 7.562339305877686e-07, 7.897615432739258e-07, 8.23289155960083e-07, 8.568167686462402e-07, 8.903443813323975e-07, 9.238719940185547e-07, 9.57399606704712e-07, 9.909272193908691e-07, 1.0244548320770264e-06, 1.0579824447631836e-06, 1.0915100574493408e-06, 1.125037670135498e-06, 1.1585652828216553e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 8.0, 3.0, 1.0, 10.0, 10.0, 6.0, 24.0, 21.0, 31.0, 54.0, 44.0, 50.0, 156.0, 156.0, 187.0, 505.0, 421.0, 546.0, 1592.0, 1424.0, 2008.0, 7501.0, 7430.0, 13158.0, 85714.0, 181238.0, 444280.0, 241039.0, 25596.0, 13129.0, 12028.0, 2908.0, 1952.0, 2440.0, 759.0, 500.0, 683.0, 198.0, 158.0, 239.0, 83.0, 59.0, 88.0, 25.0, 29.0, 30.0, 9.0, 4.0, 13.0, 0.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3245811462402344e-06, -2.2454187273979187e-06, -2.166256308555603e-06, -2.0870938897132874e-06, -2.0079314708709717e-06, -1.928769052028656e-06, -1.8496066331863403e-06, -1.7704442143440247e-06, -1.691281795501709e-06, -1.6121193766593933e-06, -1.5329569578170776e-06, -1.453794538974762e-06, -1.3746321201324463e-06, -1.2954697012901306e-06, -1.216307282447815e-06, -1.1371448636054993e-06, -1.0579824447631836e-06, -9.78820025920868e-07, -8.996576070785522e-07, -8.204951882362366e-07, -7.413327693939209e-07, -6.621703505516052e-07, -5.830079317092896e-07, -5.038455128669739e-07, -4.246830940246582e-07, -3.4552067518234253e-07, -2.6635825634002686e-07, -1.8719583749771118e-07, -1.0803341865539551e-07, -2.8870999813079834e-08, 5.029141902923584e-08, 1.2945383787155151e-07, 2.086162567138672e-07, 2.8777867555618286e-07, 3.6694109439849854e-07, 4.461035132408142e-07, 5.252659320831299e-07, 6.044283509254456e-07, 6.835907697677612e-07, 7.627531886100769e-07, 8.419156074523926e-07, 9.210780262947083e-07, 1.000240445137024e-06, 1.0794028639793396e-06, 1.1585652828216553e-06, 1.237727701663971e-06, 1.3168901205062866e-06, 1.3960525393486023e-06, 1.475214958190918e-06, 1.5543773770332336e-06, 1.6335397958755493e-06, 1.712702214717865e-06, 1.7918646335601807e-06, 1.8710270524024963e-06, 1.950189471244812e-06, 2.0293518900871277e-06, 2.1085143089294434e-06, 2.187676727771759e-06, 2.2668391466140747e-06, 2.3460015654563904e-06, 2.425163984298706e-06, 2.5043264031410217e-06, 2.5834888219833374e-06, 2.662651240825653e-06, 2.7418136596679688e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 7.0, 13.0, 12.0, 23.0, 61.0, 65.0, 64.0, 74.0, 90.0, 99.0, 90.0, 73.0, 73.0, 79.0, 33.0, 26.0, 20.0, 14.0, 7.0, 9.0, 5.0, 4.0, 10.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0796433091163635e-06, -2.0135194063186646e-06, -1.9473955035209656e-06, -1.8812716007232666e-06, -1.8151476979255676e-06, -1.7490237951278687e-06, -1.6828998923301697e-06, -1.6167759895324707e-06, -1.5506520867347717e-06, -1.4845281839370728e-06, -1.4184042811393738e-06, -1.3522803783416748e-06, -1.2861564755439758e-06, -1.2200325727462769e-06, -1.1539086699485779e-06, -1.087784767150879e-06, -1.02166086435318e-06, -9.55536961555481e-07, -8.89413058757782e-07, -8.23289155960083e-07, -7.57165253162384e-07, -6.910413503646851e-07, -6.249174475669861e-07, -5.587935447692871e-07, -4.926696419715881e-07, -4.2654573917388916e-07, -3.604218363761902e-07, -2.942979335784912e-07, -2.2817403078079224e-07, -1.6205012798309326e-07, -9.592622518539429e-08, -2.9802322387695312e-08, 3.632158041000366e-08, 1.0244548320770264e-07, 1.685693860054016e-07, 2.3469328880310059e-07, 3.0081719160079956e-07, 3.6694109439849854e-07, 4.330649971961975e-07, 4.991888999938965e-07, 5.653128027915955e-07, 6.314367055892944e-07, 6.975606083869934e-07, 7.636845111846924e-07, 8.298084139823914e-07, 8.959323167800903e-07, 9.620562195777893e-07, 1.0281801223754883e-06, 1.0943040251731873e-06, 1.1604279279708862e-06, 1.2265518307685852e-06, 1.2926757335662842e-06, 1.3587996363639832e-06, 1.4249235391616821e-06, 1.491047441959381e-06, 1.55717134475708e-06, 1.623295247554779e-06, 1.689419150352478e-06, 1.755543053150177e-06, 1.821666955947876e-06, 1.887790858745575e-06, 1.953914761543274e-06, 2.020038664340973e-06, 2.086162567138672e-06]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 18.0, 35.0, 39.0, 60.0, 107.0, 177.0, 148.0, 88.0, 55.0, 50.0, 37.0, 35.0, 27.0, 8.0, 19.0, 13.0, 6.0, 11.0, 10.0, 8.0, 0.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011545175948413089, -0.00011127455218229443, -0.00010709734488045797, -0.0001029201375786215, -9.874293027678505e-05, -9.456572297494859e-05, -9.038852294906974e-05, -8.621130837127566e-05, -8.203410834539682e-05, -7.785690104356036e-05, -7.36796937417239e-05, -6.950248643988743e-05, -6.532527913805097e-05, -6.114807183621451e-05, -5.697086817235686e-05, -5.27936608705204e-05, -4.861644993070513e-05, -4.443924262886867e-05, -4.026203532703221e-05, -3.608482802519575e-05, -3.190762072335929e-05, -2.773041524051223e-05, -2.3553209757665172e-05, -1.937600245582871e-05, -1.519879515399225e-05, -1.102158785215579e-05, -6.844381459814031e-06, -2.6671750674722716e-06, 1.5100322343641892e-06, 5.68723953620065e-06, 9.864445019047707e-06, 1.4041652320884168e-05, 1.8218866898678243e-05, 2.2396074200514704e-05, 2.6573281502351165e-05, 3.0750488804187626e-05, 3.4927696106024086e-05, 3.910490340786055e-05, 4.32821070717182e-05, 4.745931437355466e-05, 5.163652167539112e-05, 5.5813728977227584e-05, 5.9990936279064044e-05, 6.41681399429217e-05, 6.834534724475816e-05, 7.252255454659462e-05, 7.669976184843108e-05, 8.087696915026754e-05, 8.5054176452104e-05, 8.923138375394046e-05, 9.340859105577692e-05, 9.758579835761338e-05, 0.00010176300565944985, 0.0001059402129612863, 0.00011011741298716515, 0.00011429462756495923, 0.00011847182759083807, 0.00012264902761671692, 0.000126826242194511, 0.00013100344222038984, 0.00013518065679818392, 0.00013935785682406276, 0.00014353507140185684, 0.00014771227142773569, 0.00015188948600552976]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 5.0, 13.0, 13.0, 14.0, 14.0, 25.0, 36.0, 30.0, 25.0, 22.0, 39.0, 43.0, 39.0, 51.0, 37.0, 36.0, 36.0, 50.0, 43.0, 44.0, 32.0, 43.0, 35.0, 30.0, 28.0, 18.0, 26.0, 20.0, 26.0, 24.0, 15.0, 14.0, 12.0, 10.0, 9.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.14199447631836e-05, -7.878243923187256e-05, -7.614493370056152e-05, -7.350742816925049e-05, -7.086992263793945e-05, -6.823241710662842e-05, -6.559491157531738e-05, -6.295740604400635e-05, -6.031990051269531e-05, -5.768239498138428e-05, -5.504488945007324e-05, -5.240738391876221e-05, -4.976987838745117e-05, -4.713237285614014e-05, -4.44948673248291e-05, -4.1857361793518066e-05, -3.921985626220703e-05, -3.6582350730895996e-05, -3.394484519958496e-05, -3.1307339668273926e-05, -2.866983413696289e-05, -2.6032328605651855e-05, -2.339482307434082e-05, -2.0757317543029785e-05, -1.811981201171875e-05, -1.5482306480407715e-05, -1.284480094909668e-05, -1.0207295417785645e-05, -7.569789886474609e-06, -4.932284355163574e-06, -2.294778823852539e-06, 3.427267074584961e-07, 2.9802322387695312e-06, 5.617737770080566e-06, 8.255243301391602e-06, 1.0892748832702637e-05, 1.3530254364013672e-05, 1.6167759895324707e-05, 1.8805265426635742e-05, 2.1442770957946777e-05, 2.4080276489257812e-05, 2.6717782020568848e-05, 2.9355287551879883e-05, 3.199279308319092e-05, 3.463029861450195e-05, 3.726780414581299e-05, 3.9905309677124023e-05, 4.254281520843506e-05, 4.5180320739746094e-05, 4.781782627105713e-05, 5.0455331802368164e-05, 5.30928373336792e-05, 5.5730342864990234e-05, 5.836784839630127e-05, 6.1005353927612305e-05, 6.364285945892334e-05, 6.628036499023438e-05, 6.891787052154541e-05, 7.155537605285645e-05, 7.419288158416748e-05, 7.683038711547852e-05, 7.946789264678955e-05, 8.210539817810059e-05, 8.474290370941162e-05, 8.738040924072266e-05]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 12.0, 16.0, 30.0, 56.0, 87.0, 158.0, 306.0, 478.0, 919.0, 1682.0, 3415.0, 7458.0, 20808.0, 94961.0, 3931319.0, 92847.0, 21331.0, 8627.0, 4012.0, 2150.0, 1289.0, 837.0, 498.0, 338.0, 194.0, 152.0, 91.0, 64.0, 30.0, 21.0, 19.0, 10.0, 7.0, 10.0, 3.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.971027374267578e-05, -4.702620208263397e-05, -4.434213042259216e-05, -4.1658058762550354e-05, -3.8973987102508545e-05, -3.6289915442466736e-05, -3.360584378242493e-05, -3.092177212238312e-05, -2.823770046234131e-05, -2.55536288022995e-05, -2.286955714225769e-05, -2.018548548221588e-05, -1.7501413822174072e-05, -1.4817342162132263e-05, -1.2133270502090454e-05, -9.449198842048645e-06, -6.765127182006836e-06, -4.081055521965027e-06, -1.3969838619232178e-06, 1.2870877981185913e-06, 3.9711594581604e-06, 6.6552311182022095e-06, 9.339302778244019e-06, 1.2023374438285828e-05, 1.4707446098327637e-05, 1.7391517758369446e-05, 2.0075589418411255e-05, 2.2759661078453064e-05, 2.5443732738494873e-05, 2.8127804398536682e-05, 3.081187605857849e-05, 3.34959477186203e-05, 3.618001937866211e-05, 3.886409103870392e-05, 4.154816269874573e-05, 4.423223435878754e-05, 4.6916306018829346e-05, 4.9600377678871155e-05, 5.2284449338912964e-05, 5.496852099895477e-05, 5.765259265899658e-05, 6.033666431903839e-05, 6.30207359790802e-05, 6.570480763912201e-05, 6.838887929916382e-05, 7.107295095920563e-05, 7.375702261924744e-05, 7.644109427928925e-05, 7.912516593933105e-05, 8.180923759937286e-05, 8.449330925941467e-05, 8.717738091945648e-05, 8.986145257949829e-05, 9.25455242395401e-05, 9.522959589958191e-05, 9.791366755962372e-05, 0.00010059773921966553, 0.00010328181087970734, 0.00010596588253974915, 0.00010864995419979095, 0.00011133402585983276, 0.00011401809751987457, 0.00011670216917991638, 0.00011938624083995819, 0.0001220703125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 17.0, 21.0, 34.0, 46.0, 81.0, 98.0, 103.0, 117.0, 108.0, 96.0, 63.0, 57.0, 42.0, 21.0, 16.0, 15.0, 9.0, 8.0, 9.0, 5.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.2862496078014374e-05, -1.2135133147239685e-05, -1.1407770216464996e-05, -1.0680407285690308e-05, -9.953044354915619e-06, -9.22568142414093e-06, -8.498318493366241e-06, -7.770955562591553e-06, -7.043592631816864e-06, -6.316229701042175e-06, -5.5888667702674866e-06, -4.861503839492798e-06, -4.134140908718109e-06, -3.4067779779434204e-06, -2.6794150471687317e-06, -1.952052116394043e-06, -1.2246891856193542e-06, -4.973262548446655e-07, 2.300366759300232e-07, 9.57399606704712e-07, 1.6847625374794006e-06, 2.4121254682540894e-06, 3.139488399028778e-06, 3.866851329803467e-06, 4.5942142605781555e-06, 5.321577191352844e-06, 6.048940122127533e-06, 6.776303052902222e-06, 7.50366598367691e-06, 8.231028914451599e-06, 8.958391845226288e-06, 9.685754776000977e-06, 1.0413117706775665e-05, 1.1140480637550354e-05, 1.1867843568325043e-05, 1.2595206499099731e-05, 1.332256942987442e-05, 1.4049932360649109e-05, 1.4777295291423798e-05, 1.5504658222198486e-05, 1.6232021152973175e-05, 1.6959384083747864e-05, 1.7686747014522552e-05, 1.841410994529724e-05, 1.914147287607193e-05, 1.986883580684662e-05, 2.0596198737621307e-05, 2.1323561668395996e-05, 2.2050924599170685e-05, 2.2778287529945374e-05, 2.3505650460720062e-05, 2.423301339149475e-05, 2.496037632226944e-05, 2.568773925304413e-05, 2.6415102183818817e-05, 2.7142465114593506e-05, 2.7869828045368195e-05, 2.8597190976142883e-05, 2.9324553906917572e-05, 3.005191683769226e-05, 3.077927976846695e-05, 3.150664269924164e-05, 3.223400563001633e-05, 3.2961368560791016e-05]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 15.0, 22.0, 50.0, 66.0, 110.0, 187.0, 313.0, 552.0, 1000.0, 1834.0, 3619.0, 7480.0, 16572.0, 42601.0, 150917.0, 3654527.0, 228691.0, 49728.0, 18332.0, 8685.0, 4030.0, 2166.0, 1124.0, 683.0, 382.0, 228.0, 131.0, 89.0, 57.0, 25.0, 10.0, 13.0, 13.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.888938903808594e-05, -5.723442882299423e-05, -5.557946860790253e-05, -5.392450839281082e-05, -5.2269548177719116e-05, -5.061458796262741e-05, -4.8959627747535706e-05, -4.7304667532444e-05, -4.5649707317352295e-05, -4.399474710226059e-05, -4.2339786887168884e-05, -4.068482667207718e-05, -3.9029866456985474e-05, -3.737490624189377e-05, -3.571994602680206e-05, -3.406498581171036e-05, -3.241002559661865e-05, -3.075506538152695e-05, -2.9100105166435242e-05, -2.7445144951343536e-05, -2.579018473625183e-05, -2.4135224521160126e-05, -2.248026430606842e-05, -2.0825304090976715e-05, -1.917034387588501e-05, -1.7515383660793304e-05, -1.58604234457016e-05, -1.4205463230609894e-05, -1.2550503015518188e-05, -1.0895542800426483e-05, -9.240582585334778e-06, -7.5856223702430725e-06, -5.930662155151367e-06, -4.275701940059662e-06, -2.6207417249679565e-06, -9.657815098762512e-07, 6.891787052154541e-07, 2.3441389203071594e-06, 3.999099135398865e-06, 5.65405935049057e-06, 7.309019565582275e-06, 8.96397978067398e-06, 1.0618939995765686e-05, 1.2273900210857391e-05, 1.3928860425949097e-05, 1.5583820641040802e-05, 1.7238780856132507e-05, 1.8893741071224213e-05, 2.0548701286315918e-05, 2.2203661501407623e-05, 2.385862171649933e-05, 2.5513581931591034e-05, 2.716854214668274e-05, 2.8823502361774445e-05, 3.047846257686615e-05, 3.2133422791957855e-05, 3.378838300704956e-05, 3.5443343222141266e-05, 3.709830343723297e-05, 3.8753263652324677e-05, 4.040822386741638e-05, 4.206318408250809e-05, 4.371814429759979e-05, 4.53731045126915e-05, 4.70280647277832e-05]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 1.0, 4.0, 4.0, 6.0, 10.0, 5.0, 13.0, 18.0, 13.0, 21.0, 22.0, 31.0, 47.0, 44.0, 82.0, 170.0, 495.0, 1665.0, 777.0, 264.0, 98.0, 60.0, 36.0, 33.0, 26.0, 19.0, 17.0, 16.0, 11.0, 12.0, 5.0, 8.0, 5.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6464462280273438e-05, -2.5508925318717957e-05, -2.4553388357162476e-05, -2.3597851395606995e-05, -2.2642314434051514e-05, -2.1686777472496033e-05, -2.0731240510940552e-05, -1.977570354938507e-05, -1.882016658782959e-05, -1.786462962627411e-05, -1.6909092664718628e-05, -1.5953555703163147e-05, -1.4998018741607666e-05, -1.4042481780052185e-05, -1.3086944818496704e-05, -1.2131407856941223e-05, -1.1175870895385742e-05, -1.0220333933830261e-05, -9.26479697227478e-06, -8.3092600107193e-06, -7.353723049163818e-06, -6.398186087608337e-06, -5.4426491260528564e-06, -4.4871121644973755e-06, -3.5315752029418945e-06, -2.5760382413864136e-06, -1.6205012798309326e-06, -6.649643182754517e-07, 2.905726432800293e-07, 1.2461096048355103e-06, 2.201646566390991e-06, 3.157183527946472e-06, 4.112720489501953e-06, 5.068257451057434e-06, 6.023794412612915e-06, 6.979331374168396e-06, 7.934868335723877e-06, 8.890405297279358e-06, 9.845942258834839e-06, 1.080147922039032e-05, 1.17570161819458e-05, 1.2712553143501282e-05, 1.3668090105056763e-05, 1.4623627066612244e-05, 1.5579164028167725e-05, 1.6534700989723206e-05, 1.7490237951278687e-05, 1.8445774912834167e-05, 1.940131187438965e-05, 2.035684883594513e-05, 2.131238579750061e-05, 2.226792275905609e-05, 2.3223459720611572e-05, 2.4178996682167053e-05, 2.5134533643722534e-05, 2.6090070605278015e-05, 2.7045607566833496e-05, 2.8001144528388977e-05, 2.8956681489944458e-05, 2.991221845149994e-05, 3.086775541305542e-05, 3.18232923746109e-05, 3.277882933616638e-05, 3.373436629772186e-05, 3.4689903259277344e-05]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 11.0, 14.0, 21.0, 33.0, 40.0, 66.0, 106.0, 118.0, 132.0, 114.0, 70.0, 64.0, 43.0, 38.0, 25.0, 18.0, 17.0, 11.0, 9.0, 3.0, 5.0, 6.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010631288023432717, -0.0001009775442071259, -9.564221545588225e-05, -9.030687942868099e-05, -8.497154340147972e-05, -7.963621465023607e-05, -7.43008786230348e-05, -6.896554259583354e-05, -6.363021384458989e-05, -5.829488145536743e-05, -5.295954906614497e-05, -4.762421303894371e-05, -4.228888064972125e-05, -3.695354826049879e-05, -3.161821223329753e-05, -2.628287984407507e-05, -2.094754745485261e-05, -1.5612215065630153e-05, -1.0276880857418291e-05, -4.94154664920643e-06, 3.937857400160283e-07, 5.729118129238486e-06, 1.1064454156439751e-05, 1.639978654566221e-05, 2.1735118934884667e-05, 2.7070451324107125e-05, 3.2405783713329583e-05, 3.774111974053085e-05, 4.3076452129753307e-05, 4.8411784518975765e-05, 5.374712054617703e-05, 5.908245293539949e-05, 6.441777804866433e-05, 6.97531140758656e-05, 7.508844282710925e-05, 8.042377885431051e-05, 8.575910760555416e-05, 9.109444363275543e-05, 9.64297796599567e-05, 0.00010176510841120034, 0.00010710044443840161, 0.00011243578046560287, 0.00011777110921684653, 0.00012310643796809018, 0.00012844178127124906, 0.0001337771100224927, 0.00013911243877373636, 0.00014444778207689524, 0.0001497831108281389, 0.00015511843957938254, 0.00016045378288254142, 0.00016578911163378507, 0.00017112444038502872, 0.0001764597836881876, 0.00018179511243943125, 0.0001871304411906749, 0.00019246578449383378, 0.00019780111324507743, 0.0002031364565482363, 0.00020847178529947996, 0.0002138071140507236, 0.00021914244280196726, 0.00022447778610512614, 0.0002298131148563698, 0.00023514844360761344]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 6.0, 8.0, 8.0, 15.0, 11.0, 20.0, 14.0, 30.0, 33.0, 24.0, 28.0, 37.0, 35.0, 53.0, 36.0, 38.0, 48.0, 49.0, 51.0, 56.0, 52.0, 49.0, 45.0, 31.0, 29.0, 26.0, 26.0, 22.0, 23.0, 23.0, 18.0, 11.0, 13.0, 2.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001024007797241211, -9.940657764673233e-05, -9.641237556934357e-05, -9.34181734919548e-05, -9.042397141456604e-05, -8.742976933717728e-05, -8.443556725978851e-05, -8.144136518239975e-05, -7.844716310501099e-05, -7.545296102762222e-05, -7.245875895023346e-05, -6.94645568728447e-05, -6.647035479545593e-05, -6.347615271806717e-05, -6.0481950640678406e-05, -5.748774856328964e-05, -5.449354648590088e-05, -5.1499344408512115e-05, -4.850514233112335e-05, -4.551094025373459e-05, -4.2516738176345825e-05, -3.952253609895706e-05, -3.65283340215683e-05, -3.3534131944179535e-05, -3.053992986679077e-05, -2.7545727789402008e-05, -2.4551525712013245e-05, -2.155732363462448e-05, -1.8563121557235718e-05, -1.5568919479846954e-05, -1.2574717402458191e-05, -9.580515325069427e-06, -6.586313247680664e-06, -3.5921111702919006e-06, -5.979090929031372e-07, 2.3962929844856262e-06, 5.39049506187439e-06, 8.384697139263153e-06, 1.1378899216651917e-05, 1.437310129404068e-05, 1.7367303371429443e-05, 2.0361505448818207e-05, 2.335570752620697e-05, 2.6349909603595734e-05, 2.9344111680984497e-05, 3.233831375837326e-05, 3.5332515835762024e-05, 3.832671791315079e-05, 4.132091999053955e-05, 4.4315122067928314e-05, 4.730932414531708e-05, 5.030352622270584e-05, 5.3297728300094604e-05, 5.629193037748337e-05, 5.928613245487213e-05, 6.22803345322609e-05, 6.527453660964966e-05, 6.826873868703842e-05, 7.126294076442719e-05, 7.425714284181595e-05, 7.725134491920471e-05, 8.024554699659348e-05, 8.323974907398224e-05, 8.6233951151371e-05, 8.922815322875977e-05]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 11.0, 20.0, 25.0, 38.0, 78.0, 85.0, 150.0, 300.0, 657.0, 1528.0, 4202.0, 13010.0, 51032.0, 469408.0, 438900.0, 49691.0, 12264.0, 4153.0, 1648.0, 684.0, 254.0, 111.0, 79.0, 56.0, 37.0, 30.0, 24.0, 13.0, 14.0, 10.0, 6.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014412403106689453, -0.00013947300612926483, -0.00013482198119163513, -0.00013017095625400543, -0.00012551993131637573, -0.00012086890637874603, -0.00011621788144111633, -0.00011156685650348663, -0.00010691583156585693, -0.00010226480662822723, -9.761378169059753e-05, -9.296275675296783e-05, -8.831173181533813e-05, -8.366070687770844e-05, -7.900968194007874e-05, -7.435865700244904e-05, -6.970763206481934e-05, -6.505660712718964e-05, -6.0405582189559937e-05, -5.575455725193024e-05, -5.110353231430054e-05, -4.645250737667084e-05, -4.180148243904114e-05, -3.715045750141144e-05, -3.249943256378174e-05, -2.784840762615204e-05, -2.319738268852234e-05, -1.854635775089264e-05, -1.389533281326294e-05, -9.24430787563324e-06, -4.59328293800354e-06, 5.774199962615967e-08, 4.708766937255859e-06, 9.359791874885559e-06, 1.4010816812515259e-05, 1.866184175014496e-05, 2.3312866687774658e-05, 2.7963891625404358e-05, 3.261491656303406e-05, 3.726594150066376e-05, 4.191696643829346e-05, 4.656799137592316e-05, 5.1219016313552856e-05, 5.5870041251182556e-05, 6.0521066188812256e-05, 6.517209112644196e-05, 6.982311606407166e-05, 7.447414100170135e-05, 7.912516593933105e-05, 8.377619087696075e-05, 8.842721581459045e-05, 9.307824075222015e-05, 9.772926568984985e-05, 0.00010238029062747955, 0.00010703131556510925, 0.00011168234050273895, 0.00011633336544036865, 0.00012098439037799835, 0.00012563541531562805, 0.00013028644025325775, 0.00013493746519088745, 0.00013958849012851715, 0.00014423951506614685, 0.00014889054000377655, 0.00015354156494140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 5.0, 14.0, 15.0, 24.0, 31.0, 58.0, 72.0, 89.0, 132.0, 137.0, 109.0, 93.0, 74.0, 42.0, 36.0, 22.0, 6.0, 6.0, 11.0, 7.0, 7.0, 7.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.817941665649414e-05, -1.7374753952026367e-05, -1.6570091247558594e-05, -1.576542854309082e-05, -1.4960765838623047e-05, -1.4156103134155273e-05, -1.33514404296875e-05, -1.2546777725219727e-05, -1.1742115020751953e-05, -1.093745231628418e-05, -1.0132789611816406e-05, -9.328126907348633e-06, -8.52346420288086e-06, -7.718801498413086e-06, -6.9141387939453125e-06, -6.109476089477539e-06, -5.304813385009766e-06, -4.500150680541992e-06, -3.6954879760742188e-06, -2.8908252716064453e-06, -2.086162567138672e-06, -1.2814998626708984e-06, -4.76837158203125e-07, 3.2782554626464844e-07, 1.1324882507324219e-06, 1.9371509552001953e-06, 2.7418136596679688e-06, 3.546476364135742e-06, 4.351139068603516e-06, 5.155801773071289e-06, 5.9604644775390625e-06, 6.765127182006836e-06, 7.569789886474609e-06, 8.374452590942383e-06, 9.179115295410156e-06, 9.98377799987793e-06, 1.0788440704345703e-05, 1.1593103408813477e-05, 1.239776611328125e-05, 1.3202428817749023e-05, 1.4007091522216797e-05, 1.481175422668457e-05, 1.5616416931152344e-05, 1.6421079635620117e-05, 1.722574234008789e-05, 1.8030405044555664e-05, 1.8835067749023438e-05, 1.963973045349121e-05, 2.0444393157958984e-05, 2.1249055862426758e-05, 2.205371856689453e-05, 2.2858381271362305e-05, 2.3663043975830078e-05, 2.446770668029785e-05, 2.5272369384765625e-05, 2.60770320892334e-05, 2.6881694793701172e-05, 2.7686357498168945e-05, 2.849102020263672e-05, 2.9295682907104492e-05, 3.0100345611572266e-05, 3.090500831604004e-05, 3.170967102050781e-05, 3.2514333724975586e-05, 3.331899642944336e-05]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 10.0, 9.0, 14.0, 33.0, 60.0, 67.0, 114.0, 192.0, 342.0, 539.0, 1120.0, 1854.0, 3411.0, 6083.0, 11633.0, 21942.0, 43073.0, 101131.0, 312884.0, 346237.0, 101290.0, 47777.0, 22412.0, 11785.0, 6578.0, 3486.0, 1902.0, 1096.0, 627.0, 354.0, 184.0, 118.0, 65.0, 49.0, 27.0, 15.0, 14.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.863739013671875e-05, -4.724878817796707e-05, -4.586018621921539e-05, -4.4471584260463715e-05, -4.3082982301712036e-05, -4.169438034296036e-05, -4.030577838420868e-05, -3.8917176425457e-05, -3.752857446670532e-05, -3.6139972507953644e-05, -3.4751370549201965e-05, -3.336276859045029e-05, -3.197416663169861e-05, -3.058556467294693e-05, -2.919696271419525e-05, -2.7808360755443573e-05, -2.6419758796691895e-05, -2.5031156837940216e-05, -2.3642554879188538e-05, -2.225395292043686e-05, -2.086535096168518e-05, -1.9476749002933502e-05, -1.8088147044181824e-05, -1.6699545085430145e-05, -1.5310943126678467e-05, -1.3922341167926788e-05, -1.253373920917511e-05, -1.1145137250423431e-05, -9.756535291671753e-06, -8.367933332920074e-06, -6.979331374168396e-06, -5.5907294154167175e-06, -4.202127456665039e-06, -2.8135254979133606e-06, -1.4249235391616821e-06, -3.632158041000366e-08, 1.3522803783416748e-06, 2.7408823370933533e-06, 4.129484295845032e-06, 5.51808625459671e-06, 6.906688213348389e-06, 8.295290172100067e-06, 9.683892130851746e-06, 1.1072494089603424e-05, 1.2461096048355103e-05, 1.3849698007106781e-05, 1.523829996585846e-05, 1.6626901924610138e-05, 1.8015503883361816e-05, 1.9404105842113495e-05, 2.0792707800865173e-05, 2.2181309759616852e-05, 2.356991171836853e-05, 2.495851367712021e-05, 2.6347115635871887e-05, 2.7735717594623566e-05, 2.9124319553375244e-05, 3.0512921512126923e-05, 3.19015234708786e-05, 3.329012542963028e-05, 3.467872738838196e-05, 3.6067329347133636e-05, 3.7455931305885315e-05, 3.8844533264636993e-05, 4.023313522338867e-05]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 12.0, 13.0, 14.0, 12.0, 14.0, 13.0, 21.0, 33.0, 31.0, 30.0, 36.0, 40.0, 40.0, 51.0, 50.0, 60.0, 65.0, 38.0, 37.0, 36.0, 40.0, 45.0, 43.0, 35.0, 21.0, 31.0, 26.0, 17.0, 17.0, 11.0, 15.0, 13.0, 5.0, 8.0, 3.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.802776336669922e-05, -3.6942772567272186e-05, -3.5857781767845154e-05, -3.477279096841812e-05, -3.368780016899109e-05, -3.2602809369564056e-05, -3.1517818570137024e-05, -3.043282777070999e-05, -2.934783697128296e-05, -2.8262846171855927e-05, -2.7177855372428894e-05, -2.609286457300186e-05, -2.500787377357483e-05, -2.3922882974147797e-05, -2.2837892174720764e-05, -2.175290137529373e-05, -2.06679105758667e-05, -1.9582919776439667e-05, -1.8497928977012634e-05, -1.7412938177585602e-05, -1.632794737815857e-05, -1.5242956578731537e-05, -1.4157965779304504e-05, -1.3072974979877472e-05, -1.198798418045044e-05, -1.0902993381023407e-05, -9.818002581596375e-06, -8.733011782169342e-06, -7.64802098274231e-06, -6.563030183315277e-06, -5.478039383888245e-06, -4.393048584461212e-06, -3.3080577850341797e-06, -2.2230669856071472e-06, -1.1380761861801147e-06, -5.3085386753082275e-08, 1.0319054126739502e-06, 2.1168962121009827e-06, 3.201887011528015e-06, 4.286877810955048e-06, 5.37186861038208e-06, 6.4568594098091125e-06, 7.541850209236145e-06, 8.626841008663177e-06, 9.71183180809021e-06, 1.0796822607517242e-05, 1.1881813406944275e-05, 1.2966804206371307e-05, 1.405179500579834e-05, 1.5136785805225372e-05, 1.6221776604652405e-05, 1.7306767404079437e-05, 1.839175820350647e-05, 1.9476749002933502e-05, 2.0561739802360535e-05, 2.1646730601787567e-05, 2.27317214012146e-05, 2.3816712200641632e-05, 2.4901703000068665e-05, 2.5986693799495697e-05, 2.707168459892273e-05, 2.8156675398349762e-05, 2.9241666197776794e-05, 3.0326656997203827e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 20.0, 35.0, 30.0, 40.0, 84.0, 90.0, 113.0, 214.0, 328.0, 533.0, 897.0, 1317.0, 2292.0, 3871.0, 6503.0, 11712.0, 21259.0, 124386.0, 184350.0, 331568.0, 185184.0, 83651.0, 40596.0, 21514.0, 11676.0, 6584.0, 3814.0, 2175.0, 1318.0, 839.0, 556.0, 317.0, 222.0, 134.0, 105.0, 62.0, 53.0, 29.0, 19.0, 18.0, 9.0, 13.0, 8.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0], "bins": [-2.1457672119140625e-06, -2.084299921989441e-06, -2.0228326320648193e-06, -1.9613653421401978e-06, -1.8998980522155762e-06, -1.8384307622909546e-06, -1.776963472366333e-06, -1.7154961824417114e-06, -1.6540288925170898e-06, -1.5925616025924683e-06, -1.5310943126678467e-06, -1.469627022743225e-06, -1.4081597328186035e-06, -1.346692442893982e-06, -1.2852251529693604e-06, -1.2237578630447388e-06, -1.1622905731201172e-06, -1.1008232831954956e-06, -1.039355993270874e-06, -9.778887033462524e-07, -9.164214134216309e-07, -8.549541234970093e-07, -7.934868335723877e-07, -7.320195436477661e-07, -6.705522537231445e-07, -6.09084963798523e-07, -5.476176738739014e-07, -4.861503839492798e-07, -4.246830940246582e-07, -3.632158041000366e-07, -3.0174851417541504e-07, -2.4028122425079346e-07, -1.7881393432617188e-07, -1.1734664440155029e-07, -5.587935447692871e-08, 5.587935447692871e-09, 6.705522537231445e-08, 1.2852251529693604e-07, 1.8998980522155762e-07, 2.514570951461792e-07, 3.129243850708008e-07, 3.7439167499542236e-07, 4.3585896492004395e-07, 4.973262548446655e-07, 5.587935447692871e-07, 6.202608346939087e-07, 6.817281246185303e-07, 7.431954145431519e-07, 8.046627044677734e-07, 8.66129994392395e-07, 9.275972843170166e-07, 9.890645742416382e-07, 1.0505318641662598e-06, 1.1119991540908813e-06, 1.173466444015503e-06, 1.2349337339401245e-06, 1.296401023864746e-06, 1.3578683137893677e-06, 1.4193356037139893e-06, 1.4808028936386108e-06, 1.5422701835632324e-06, 1.603737473487854e-06, 1.6652047634124756e-06, 1.7266720533370972e-06, 1.7881393432617188e-06]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 7.0, 0.0, 10.0, 15.0, 0.0, 14.0, 0.0, 20.0, 36.0, 0.0, 51.0, 42.0, 0.0, 49.0, 0.0, 64.0, 80.0, 0.0, 65.0, 98.0, 0.0, 85.0, 0.0, 70.0, 77.0, 0.0, 49.0, 43.0, 0.0, 30.0, 0.0, 26.0, 22.0, 0.0, 19.0, 14.0, 0.0, 10.0, 0.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3336539268493652e-06, -1.296401023864746e-06, -1.259148120880127e-06, -1.2218952178955078e-06, -1.1846423149108887e-06, -1.1473894119262695e-06, -1.1101365089416504e-06, -1.0728836059570312e-06, -1.0356307029724121e-06, -9.98377799987793e-07, -9.611248970031738e-07, -9.238719940185547e-07, -8.866190910339355e-07, -8.493661880493164e-07, -8.121132850646973e-07, -7.748603820800781e-07, -7.37607479095459e-07, -7.003545761108398e-07, -6.631016731262207e-07, -6.258487701416016e-07, -5.885958671569824e-07, -5.513429641723633e-07, -5.140900611877441e-07, -4.76837158203125e-07, -4.3958425521850586e-07, -4.023313522338867e-07, -3.650784492492676e-07, -3.2782554626464844e-07, -2.905726432800293e-07, -2.5331974029541016e-07, -2.1606683731079102e-07, -1.7881393432617188e-07, -1.4156103134155273e-07, -1.043081283569336e-07, -6.705522537231445e-08, -2.9802322387695312e-08, 7.450580596923828e-09, 4.470348358154297e-08, 8.195638656616211e-08, 1.1920928955078125e-07, 1.564621925354004e-07, 1.9371509552001953e-07, 2.3096799850463867e-07, 2.682209014892578e-07, 3.0547380447387695e-07, 3.427267074584961e-07, 3.7997961044311523e-07, 4.172325134277344e-07, 4.544854164123535e-07, 4.917383193969727e-07, 5.289912223815918e-07, 5.662441253662109e-07, 6.034970283508301e-07, 6.407499313354492e-07, 6.780028343200684e-07, 7.152557373046875e-07, 7.525086402893066e-07, 7.897615432739258e-07, 8.270144462585449e-07, 8.642673492431641e-07, 9.015202522277832e-07, 9.387731552124023e-07, 9.760260581970215e-07, 1.0132789611816406e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 15.0, 28.0, 0.0, 34.0, 60.0, 120.0, 208.0, 310.0, 565.0, 0.0, 1080.0, 1955.0, 3567.0, 6971.0, 13751.0, 29315.0, 0.0, 68581.0, 184460.0, 426076.0, 185368.0, 67942.0, 29443.0, 0.0, 13872.0, 6854.0, 3524.0, 1967.0, 1086.0, 590.0, 0.0, 348.0, 199.0, 93.0, 50.0, 34.0, 26.0, 0.0, 18.0, 13.0, 10.0, 2.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5581026673316956e-06, -1.5068799257278442e-06, -1.455657184123993e-06, -1.4044344425201416e-06, -1.3532117009162903e-06, -1.301988959312439e-06, -1.2507662177085876e-06, -1.1995434761047363e-06, -1.148320734500885e-06, -1.0970979928970337e-06, -1.0458752512931824e-06, -9.94652509689331e-07, -9.434297680854797e-07, -8.922070264816284e-07, -8.409842848777771e-07, -7.897615432739258e-07, -7.385388016700745e-07, -6.873160600662231e-07, -6.360933184623718e-07, -5.848705768585205e-07, -5.336478352546692e-07, -4.824250936508179e-07, -4.3120235204696655e-07, -3.7997961044311523e-07, -3.287568688392639e-07, -2.775341272354126e-07, -2.2631138563156128e-07, -1.7508864402770996e-07, -1.2386590242385864e-07, -7.264316082000732e-08, -2.1420419216156006e-08, 2.9802322387695312e-08, 8.102506399154663e-08, 1.3224780559539795e-07, 1.8347054719924927e-07, 2.3469328880310059e-07, 2.859160304069519e-07, 3.371387720108032e-07, 3.8836151361465454e-07, 4.3958425521850586e-07, 4.908069968223572e-07, 5.420297384262085e-07, 5.932524800300598e-07, 6.444752216339111e-07, 6.956979632377625e-07, 7.469207048416138e-07, 7.981434464454651e-07, 8.493661880493164e-07, 9.005889296531677e-07, 9.51811671257019e-07, 1.0030344128608704e-06, 1.0542571544647217e-06, 1.105479896068573e-06, 1.1567026376724243e-06, 1.2079253792762756e-06, 1.259148120880127e-06, 1.3103708624839783e-06, 1.3615936040878296e-06, 1.412816345691681e-06, 1.4640390872955322e-06, 1.5152618288993835e-06, 1.5664845705032349e-06, 1.6177073121070862e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 9.0, 0.0, 7.0, 10.0, 0.0, 15.0, 15.0, 0.0, 20.0, 36.0, 0.0, 34.0, 0.0, 54.0, 61.0, 0.0, 59.0, 76.0, 0.0, 72.0, 87.0, 0.0, 81.0, 0.0, 76.0, 62.0, 0.0, 45.0, 37.0, 0.0, 30.0, 29.0, 0.0, 28.0, 23.0, 0.0, 11.0, 0.0, 6.0, 4.0, 0.0, 11.0, 5.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3327226042747498e-06, -1.2945383787155151e-06, -1.2563541531562805e-06, -1.218169927597046e-06, -1.1799857020378113e-06, -1.1418014764785767e-06, -1.103617250919342e-06, -1.0654330253601074e-06, -1.0272487998008728e-06, -9.890645742416382e-07, -9.508803486824036e-07, -9.126961231231689e-07, -8.745118975639343e-07, -8.363276720046997e-07, -7.981434464454651e-07, -7.599592208862305e-07, -7.217749953269958e-07, -6.835907697677612e-07, -6.454065442085266e-07, -6.07222318649292e-07, -5.690380930900574e-07, -5.308538675308228e-07, -4.926696419715881e-07, -4.544854164123535e-07, -4.163011908531189e-07, -3.781169652938843e-07, -3.3993273973464966e-07, -3.0174851417541504e-07, -2.635642886161804e-07, -2.253800630569458e-07, -1.8719583749771118e-07, -1.4901161193847656e-07, -1.1082738637924194e-07, -7.264316082000732e-08, -3.4458935260772705e-08, 3.725290298461914e-09, 4.190951585769653e-08, 8.009374141693115e-08, 1.1827796697616577e-07, 1.564621925354004e-07, 1.94646418094635e-07, 2.3283064365386963e-07, 2.7101486921310425e-07, 3.0919909477233887e-07, 3.473833203315735e-07, 3.855675458908081e-07, 4.237517714500427e-07, 4.6193599700927734e-07, 5.00120222568512e-07, 5.383044481277466e-07, 5.764886736869812e-07, 6.146728992462158e-07, 6.528571248054504e-07, 6.910413503646851e-07, 7.292255759239197e-07, 7.674098014831543e-07, 8.055940270423889e-07, 8.437782526016235e-07, 8.819624781608582e-07, 9.201467037200928e-07, 9.583309292793274e-07, 9.96515154838562e-07, 1.0346993803977966e-06, 1.0728836059570312e-06]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 10.0, 10.0, 22.0, 42.0, 51.0, 74.0, 177.0, 187.0, 83.0, 56.0, 48.0, 49.0, 35.0, 28.0, 24.0, 15.0, 15.0, 13.0, 8.0, 5.0, 5.0, 4.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014240063319448382, -0.00013765542826149613, -0.00013291022332850844, -0.00012816501839552075, -0.00012341981346253306, -0.00011867460852954537, -0.00011392939632060006, -0.00010918419138761237, -0.00010443898645462468, -9.969378152163699e-05, -9.49485765886493e-05, -9.020337165566161e-05, -8.545815944671631e-05, -8.071295451372862e-05, -7.596774958074093e-05, -7.122254464775324e-05, -6.647733971476555e-05, -6.173213478177786e-05, -5.698692984879017e-05, -5.224172127782367e-05, -4.749651634483598e-05, -4.275131141184829e-05, -3.8006102840881795e-05, -3.3260897907894105e-05, -2.8515692974906415e-05, -2.3770488041918725e-05, -1.902528128994163e-05, -1.428007544745924e-05, -9.534869604976848e-06, -4.789664671989158e-06, -4.445792001206428e-08, 4.700748831965029e-06, 9.445968316867948e-06, 1.419117415935034e-05, 1.893638000183273e-05, 2.3681586753809825e-05, 2.8426791686797515e-05, 3.3171996619785205e-05, 3.79172051907517e-05, 4.266241012373939e-05, 4.740761505672708e-05, 5.215281998971477e-05, 5.689802492270246e-05, 6.164322985569015e-05, 6.638844206463546e-05, 7.113364699762315e-05, 7.587885193061084e-05, 8.062405686359853e-05, 8.536926179658622e-05, 9.01144667295739e-05, 9.48596716625616e-05, 9.960487659554929e-05, 0.00010435008152853698, 0.00010909528646152467, 0.00011384049867046997, 0.00011858570360345766, 0.00012333091581240296, 0.00012807612074539065, 0.00013282132567837834, 0.00013756653061136603, 0.00014231173554435372, 0.0001470569404773414, 0.0001518021454103291, 0.0001565473503433168, 0.00016129255527630448]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 4.0, 5.0, 12.0, 6.0, 8.0, 19.0, 21.0, 17.0, 25.0, 23.0, 31.0, 47.0, 38.0, 39.0, 40.0, 29.0, 40.0, 38.0, 44.0, 48.0, 39.0, 52.0, 36.0, 35.0, 28.0, 30.0, 22.0, 35.0, 27.0, 32.0, 21.0, 15.0, 20.0, 15.0, 14.0, 7.0, 8.0, 3.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.64267349243164e-05, -8.36588442325592e-05, -8.0890953540802e-05, -7.81230628490448e-05, -7.53551721572876e-05, -7.25872814655304e-05, -6.98193907737732e-05, -6.705150008201599e-05, -6.428360939025879e-05, -6.151571869850159e-05, -5.8747828006744385e-05, -5.597993731498718e-05, -5.321204662322998e-05, -5.044415593147278e-05, -4.7676265239715576e-05, -4.4908374547958374e-05, -4.214048385620117e-05, -3.937259316444397e-05, -3.660470247268677e-05, -3.3836811780929565e-05, -3.106892108917236e-05, -2.830103039741516e-05, -2.553313970565796e-05, -2.2765249013900757e-05, -1.9997358322143555e-05, -1.7229467630386353e-05, -1.446157693862915e-05, -1.1693686246871948e-05, -8.925795555114746e-06, -6.157904863357544e-06, -3.390014171600342e-06, -6.221234798431396e-07, 2.1457672119140625e-06, 4.913657903671265e-06, 7.681548595428467e-06, 1.0449439287185669e-05, 1.3217329978942871e-05, 1.5985220670700073e-05, 1.8753111362457275e-05, 2.1521002054214478e-05, 2.428889274597168e-05, 2.7056783437728882e-05, 2.9824674129486084e-05, 3.2592564821243286e-05, 3.536045551300049e-05, 3.812834620475769e-05, 4.089623689651489e-05, 4.3664127588272095e-05, 4.64320182800293e-05, 4.91999089717865e-05, 5.19677996635437e-05, 5.47356903553009e-05, 5.7503581047058105e-05, 6.027147173881531e-05, 6.303936243057251e-05, 6.580725312232971e-05, 6.857514381408691e-05, 7.134303450584412e-05, 7.411092519760132e-05, 7.687881588935852e-05, 7.964670658111572e-05, 8.241459727287292e-05, 8.518248796463013e-05, 8.795037865638733e-05, 9.071826934814453e-05]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 13.0, 18.0, 32.0, 55.0, 87.0, 114.0, 197.0, 310.0, 513.0, 724.0, 1418.0, 2589.0, 5123.0, 12323.0, 36440.0, 450805.0, 3587970.0, 61826.0, 17932.0, 7452.0, 3423.0, 1933.0, 1111.0, 700.0, 392.0, 241.0, 153.0, 103.0, 75.0, 52.0, 26.0, 23.0, 15.0, 12.0, 12.0, 10.0, 11.0, 6.0, 6.0, 4.0, 7.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9948692321777344e-05, -4.769954830408096e-05, -4.545040428638458e-05, -4.32012602686882e-05, -4.095211625099182e-05, -3.870297223329544e-05, -3.645382821559906e-05, -3.420468419790268e-05, -3.19555401802063e-05, -2.9706396162509918e-05, -2.7457252144813538e-05, -2.5208108127117157e-05, -2.2958964109420776e-05, -2.0709820091724396e-05, -1.8460676074028015e-05, -1.6211532056331635e-05, -1.3962388038635254e-05, -1.1713244020938873e-05, -9.464100003242493e-06, -7.214955985546112e-06, -4.9658119678497314e-06, -2.716667950153351e-06, -4.675239324569702e-07, 1.7816200852394104e-06, 4.030764102935791e-06, 6.279908120632172e-06, 8.529052138328552e-06, 1.0778196156024933e-05, 1.3027340173721313e-05, 1.5276484191417694e-05, 1.7525628209114075e-05, 1.9774772226810455e-05, 2.2023916244506836e-05, 2.4273060262203217e-05, 2.6522204279899597e-05, 2.8771348297595978e-05, 3.102049231529236e-05, 3.326963633298874e-05, 3.551878035068512e-05, 3.77679243683815e-05, 4.001706838607788e-05, 4.226621240377426e-05, 4.451535642147064e-05, 4.676450043916702e-05, 4.90136444568634e-05, 5.1262788474559784e-05, 5.3511932492256165e-05, 5.5761076509952545e-05, 5.8010220527648926e-05, 6.0259364545345306e-05, 6.250850856304169e-05, 6.475765258073807e-05, 6.700679659843445e-05, 6.925594061613083e-05, 7.150508463382721e-05, 7.375422865152359e-05, 7.600337266921997e-05, 7.825251668691635e-05, 8.050166070461273e-05, 8.275080472230911e-05, 8.499994874000549e-05, 8.724909275770187e-05, 8.949823677539825e-05, 9.174738079309464e-05, 9.399652481079102e-05]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 7.0, 6.0, 10.0, 14.0, 23.0, 34.0, 60.0, 60.0, 99.0, 106.0, 118.0, 101.0, 90.0, 73.0, 71.0, 27.0, 20.0, 23.0, 15.0, 8.0, 12.0, 11.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5974044799804688e-05, -1.5273690223693848e-05, -1.4573335647583008e-05, -1.3872981071472168e-05, -1.3172626495361328e-05, -1.2472271919250488e-05, -1.1771917343139648e-05, -1.1071562767028809e-05, -1.0371208190917969e-05, -9.670853614807129e-06, -8.970499038696289e-06, -8.27014446258545e-06, -7.569789886474609e-06, -6.8694353103637695e-06, -6.16908073425293e-06, -5.46872615814209e-06, -4.76837158203125e-06, -4.06801700592041e-06, -3.3676624298095703e-06, -2.6673078536987305e-06, -1.9669532775878906e-06, -1.2665987014770508e-06, -5.662441253662109e-07, 1.341104507446289e-07, 8.344650268554688e-07, 1.5348196029663086e-06, 2.2351741790771484e-06, 2.9355287551879883e-06, 3.635883331298828e-06, 4.336237907409668e-06, 5.036592483520508e-06, 5.736947059631348e-06, 6.4373016357421875e-06, 7.137656211853027e-06, 7.838010787963867e-06, 8.538365364074707e-06, 9.238719940185547e-06, 9.939074516296387e-06, 1.0639429092407227e-05, 1.1339783668518066e-05, 1.2040138244628906e-05, 1.2740492820739746e-05, 1.3440847396850586e-05, 1.4141201972961426e-05, 1.4841556549072266e-05, 1.5541911125183105e-05, 1.6242265701293945e-05, 1.6942620277404785e-05, 1.7642974853515625e-05, 1.8343329429626465e-05, 1.9043684005737305e-05, 1.9744038581848145e-05, 2.0444393157958984e-05, 2.1144747734069824e-05, 2.1845102310180664e-05, 2.2545456886291504e-05, 2.3245811462402344e-05, 2.3946166038513184e-05, 2.4646520614624023e-05, 2.5346875190734863e-05, 2.6047229766845703e-05, 2.6747584342956543e-05, 2.7447938919067383e-05, 2.8148293495178223e-05, 2.8848648071289062e-05]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 6.0, 11.0, 23.0, 42.0, 46.0, 58.0, 133.0, 199.0, 352.0, 654.0, 1186.0, 2296.0, 4208.0, 8836.0, 19001.0, 42644.0, 148170.0, 3240613.0, 592637.0, 78270.0, 27911.0, 13296.0, 6384.0, 3381.0, 1825.0, 926.0, 485.0, 269.0, 167.0, 86.0, 56.0, 30.0, 23.0, 18.0, 9.0, 8.0, 3.0, 3.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-4.7326087951660156e-05, -4.6039000153541565e-05, -4.4751912355422974e-05, -4.346482455730438e-05, -4.217773675918579e-05, -4.08906489610672e-05, -3.960356116294861e-05, -3.831647336483002e-05, -3.7029385566711426e-05, -3.5742297768592834e-05, -3.445520997047424e-05, -3.316812217235565e-05, -3.188103437423706e-05, -3.059394657611847e-05, -2.9306858777999878e-05, -2.8019770979881287e-05, -2.6732683181762695e-05, -2.5445595383644104e-05, -2.4158507585525513e-05, -2.287141978740692e-05, -2.158433198928833e-05, -2.029724419116974e-05, -1.9010156393051147e-05, -1.7723068594932556e-05, -1.6435980796813965e-05, -1.5148892998695374e-05, -1.3861805200576782e-05, -1.2574717402458191e-05, -1.12876296043396e-05, -1.0000541806221008e-05, -8.713454008102417e-06, -7.426366209983826e-06, -6.139278411865234e-06, -4.852190613746643e-06, -3.5651028156280518e-06, -2.2780150175094604e-06, -9.909272193908691e-07, 2.9616057872772217e-07, 1.5832483768463135e-06, 2.8703361749649048e-06, 4.157423973083496e-06, 5.444511771202087e-06, 6.731599569320679e-06, 8.01868736743927e-06, 9.305775165557861e-06, 1.0592862963676453e-05, 1.1879950761795044e-05, 1.3167038559913635e-05, 1.4454126358032227e-05, 1.5741214156150818e-05, 1.702830195426941e-05, 1.8315389752388e-05, 1.9602477550506592e-05, 2.0889565348625183e-05, 2.2176653146743774e-05, 2.3463740944862366e-05, 2.4750828742980957e-05, 2.603791654109955e-05, 2.732500433921814e-05, 2.861209213733673e-05, 2.9899179935455322e-05, 3.1186267733573914e-05, 3.2473355531692505e-05, 3.3760443329811096e-05, 3.504753112792969e-05]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 9.0, 2.0, 5.0, 4.0, 3.0, 6.0, 12.0, 9.0, 12.0, 11.0, 25.0, 20.0, 17.0, 30.0, 29.0, 61.0, 78.0, 159.0, 289.0, 635.0, 1320.0, 648.0, 236.0, 116.0, 67.0, 52.0, 42.0, 30.0, 24.0, 18.0, 13.0, 17.0, 9.0, 15.0, 7.0, 8.0, 8.0, 9.0, 5.0, 2.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.396106719970703e-05, -2.3200176656246185e-05, -2.243928611278534e-05, -2.1678395569324493e-05, -2.0917505025863647e-05, -2.01566144824028e-05, -1.9395723938941956e-05, -1.863483339548111e-05, -1.7873942852020264e-05, -1.7113052308559418e-05, -1.6352161765098572e-05, -1.5591271221637726e-05, -1.483038067817688e-05, -1.4069490134716034e-05, -1.3308599591255188e-05, -1.2547709047794342e-05, -1.1786818504333496e-05, -1.102592796087265e-05, -1.0265037417411804e-05, -9.504146873950958e-06, -8.743256330490112e-06, -7.982365787029266e-06, -7.22147524356842e-06, -6.4605847001075745e-06, -5.6996941566467285e-06, -4.9388036131858826e-06, -4.177913069725037e-06, -3.4170225262641907e-06, -2.6561319828033447e-06, -1.8952414393424988e-06, -1.1343508958816528e-06, -3.734603524208069e-07, 3.8743019104003906e-07, 1.148320734500885e-06, 1.909211277961731e-06, 2.670101821422577e-06, 3.430992364883423e-06, 4.191882908344269e-06, 4.952773451805115e-06, 5.713663995265961e-06, 6.474554538726807e-06, 7.235445082187653e-06, 7.996335625648499e-06, 8.757226169109344e-06, 9.51811671257019e-06, 1.0279007256031036e-05, 1.1039897799491882e-05, 1.1800788342952728e-05, 1.2561678886413574e-05, 1.332256942987442e-05, 1.4083459973335266e-05, 1.4844350516796112e-05, 1.5605241060256958e-05, 1.6366131603717804e-05, 1.712702214717865e-05, 1.7887912690639496e-05, 1.8648803234100342e-05, 1.9409693777561188e-05, 2.0170584321022034e-05, 2.093147486448288e-05, 2.1692365407943726e-05, 2.245325595140457e-05, 2.3214146494865417e-05, 2.3975037038326263e-05, 2.473592758178711e-05]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 15.0, 14.0, 24.0, 40.0, 44.0, 77.0, 103.0, 115.0, 102.0, 79.0, 68.0, 49.0, 58.0, 44.0, 28.0, 31.0, 21.0, 12.0, 12.0, 8.0, 2.0, 3.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.485634654993191e-05, -9.103510819841176e-05, -8.721386984689161e-05, -8.339263149537146e-05, -7.957139314385131e-05, -7.575015479233116e-05, -7.192891644081101e-05, -6.810767808929086e-05, -6.42864397377707e-05, -6.0465201386250556e-05, -5.6643963034730405e-05, -5.2822724683210254e-05, -4.90014863316901e-05, -4.518024798016995e-05, -4.13590096286498e-05, -3.753777127712965e-05, -3.37165329256095e-05, -2.989529457408935e-05, -2.6074056222569197e-05, -2.2252817871049047e-05, -1.8431579519528896e-05, -1.4610341168008745e-05, -1.0789102816488594e-05, -6.967864464968443e-06, -3.146626113448292e-06, 6.746122380718589e-07, 4.49585058959201e-06, 8.31708894111216e-06, 1.2138327292632312e-05, 1.5959565644152462e-05, 1.9780803995672613e-05, 2.3602042347192764e-05, 2.74232734227553e-05, 3.124451177427545e-05, 3.50657501257956e-05, 3.8886988477315754e-05, 4.2708226828835905e-05, 4.6529465180356055e-05, 5.0350703531876206e-05, 5.417194188339636e-05, 5.799318023491651e-05, 6.181441858643666e-05, 6.563565693795681e-05, 6.945689528947696e-05, 7.327813364099711e-05, 7.709937199251726e-05, 8.092061034403741e-05, 8.474184869555756e-05, 8.856308704707772e-05, 9.238432539859787e-05, 9.620556375011802e-05, 0.00010002680210163817, 0.00010384804045315832, 0.00010766927880467847, 0.00011149051715619862, 0.00011531175550771877, 0.00011913299385923892, 0.00012295422493480146, 0.00012677547056227922, 0.000130596716189757, 0.00013441794726531953, 0.00013823917834088206, 0.00014206042396835983, 0.0001458816695958376, 0.00014970290067140013]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 2.0, 5.0, 3.0, 12.0, 18.0, 8.0, 22.0, 19.0, 18.0, 19.0, 29.0, 24.0, 25.0, 31.0, 36.0, 36.0, 36.0, 33.0, 45.0, 37.0, 39.0, 30.0, 44.0, 34.0, 39.0, 33.0, 26.0, 34.0, 36.0, 35.0, 21.0, 20.0, 24.0, 15.0, 13.0, 23.0, 15.0, 12.0, 7.0, 3.0, 12.0, 9.0, 3.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.104873657226562e-05, -6.895512342453003e-05, -6.686151027679443e-05, -6.476789712905884e-05, -6.267428398132324e-05, -6.0580670833587646e-05, -5.848705768585205e-05, -5.6393444538116455e-05, -5.429983139038086e-05, -5.2206218242645264e-05, -5.011260509490967e-05, -4.801899194717407e-05, -4.5925378799438477e-05, -4.383176565170288e-05, -4.1738152503967285e-05, -3.964453935623169e-05, -3.7550926208496094e-05, -3.54573130607605e-05, -3.33636999130249e-05, -3.127008676528931e-05, -2.917647361755371e-05, -2.7082860469818115e-05, -2.498924732208252e-05, -2.2895634174346924e-05, -2.0802021026611328e-05, -1.8708407878875732e-05, -1.6614794731140137e-05, -1.4521181583404541e-05, -1.2427568435668945e-05, -1.033395528793335e-05, -8.240342140197754e-06, -6.146728992462158e-06, -4.0531158447265625e-06, -1.959502696990967e-06, 1.341104507446289e-07, 2.2277235984802246e-06, 4.32133674621582e-06, 6.414949893951416e-06, 8.508563041687012e-06, 1.0602176189422607e-05, 1.2695789337158203e-05, 1.4789402484893799e-05, 1.6883015632629395e-05, 1.897662878036499e-05, 2.1070241928100586e-05, 2.316385507583618e-05, 2.5257468223571777e-05, 2.7351081371307373e-05, 2.944469451904297e-05, 3.1538307666778564e-05, 3.363192081451416e-05, 3.5725533962249756e-05, 3.781914710998535e-05, 3.991276025772095e-05, 4.200637340545654e-05, 4.409998655319214e-05, 4.6193599700927734e-05, 4.828721284866333e-05, 5.0380825996398926e-05, 5.247443914413452e-05, 5.456805229187012e-05, 5.666166543960571e-05, 5.875527858734131e-05, 6.0848891735076904e-05, 6.29425048828125e-05]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 1.0, 5.0, 7.0, 6.0, 9.0, 10.0, 14.0, 22.0, 13.0, 19.0, 18.0, 23.0, 23.0, 44.0, 63.0, 116.0, 282.0, 635.0, 1543.0, 4135.0, 12013.0, 41804.0, 249155.0, 632245.0, 77226.0, 18842.0, 6198.0, 2281.0, 929.0, 380.0, 176.0, 70.0, 48.0, 30.0, 22.0, 20.0, 23.0, 20.0, 15.0, 7.0, 13.0, 8.0, 7.0, 7.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.00014388561248779297, -0.00013955123722553253, -0.0001352168619632721, -0.00013088248670101166, -0.00012654811143875122, -0.00012221373617649078, -0.00011787936091423035, -0.00011354498565196991, -0.00010921061038970947, -0.00010487623512744904, -0.0001005418598651886, -9.620748460292816e-05, -9.187310934066772e-05, -8.753873407840729e-05, -8.320435881614685e-05, -7.886998355388641e-05, -7.453560829162598e-05, -7.020123302936554e-05, -6.58668577671051e-05, -6.153248250484467e-05, -5.719810724258423e-05, -5.286373198032379e-05, -4.8529356718063354e-05, -4.419498145580292e-05, -3.986060619354248e-05, -3.5526230931282043e-05, -3.1191855669021606e-05, -2.685748040676117e-05, -2.2523105144500732e-05, -1.8188729882240295e-05, -1.3854354619979858e-05, -9.519979357719421e-06, -5.185604095458984e-06, -8.512288331985474e-07, 3.4831464290618896e-06, 7.817521691322327e-06, 1.2151896953582764e-05, 1.64862722158432e-05, 2.0820647478103638e-05, 2.5155022740364075e-05, 2.9489398002624512e-05, 3.382377326488495e-05, 3.8158148527145386e-05, 4.249252378940582e-05, 4.682689905166626e-05, 5.11612743139267e-05, 5.5495649576187134e-05, 5.983002483844757e-05, 6.416440010070801e-05, 6.849877536296844e-05, 7.283315062522888e-05, 7.716752588748932e-05, 8.150190114974976e-05, 8.583627641201019e-05, 9.017065167427063e-05, 9.450502693653107e-05, 9.88394021987915e-05, 0.00010317377746105194, 0.00010750815272331238, 0.00011184252798557281, 0.00011617690324783325, 0.00012051127851009369, 0.00012484565377235413, 0.00012918002903461456, 0.000133514404296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 6.0, 12.0, 23.0, 28.0, 40.0, 57.0, 106.0, 135.0, 154.0, 111.0, 111.0, 75.0, 43.0, 34.0, 25.0, 8.0, 9.0, 10.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5735626220703125e-05, -1.485086977481842e-05, -1.3966113328933716e-05, -1.3081356883049011e-05, -1.2196600437164307e-05, -1.1311843991279602e-05, -1.0427087545394897e-05, -9.542331099510193e-06, -8.657574653625488e-06, -7.772818207740784e-06, -6.888061761856079e-06, -6.0033053159713745e-06, -5.11854887008667e-06, -4.233792424201965e-06, -3.3490359783172607e-06, -2.464279532432556e-06, -1.5795230865478516e-06, -6.94766640663147e-07, 1.8998980522155762e-07, 1.0747462511062622e-06, 1.959502696990967e-06, 2.8442591428756714e-06, 3.729015588760376e-06, 4.6137720346450806e-06, 5.498528480529785e-06, 6.38328492641449e-06, 7.268041372299194e-06, 8.152797818183899e-06, 9.037554264068604e-06, 9.922310709953308e-06, 1.0807067155838013e-05, 1.1691823601722717e-05, 1.2576580047607422e-05, 1.3461336493492126e-05, 1.4346092939376831e-05, 1.5230849385261536e-05, 1.611560583114624e-05, 1.7000362277030945e-05, 1.788511872291565e-05, 1.8769875168800354e-05, 1.965463161468506e-05, 2.0539388060569763e-05, 2.1424144506454468e-05, 2.2308900952339172e-05, 2.3193657398223877e-05, 2.407841384410858e-05, 2.4963170289993286e-05, 2.584792673587799e-05, 2.6732683181762695e-05, 2.76174396276474e-05, 2.8502196073532104e-05, 2.938695251941681e-05, 3.0271708965301514e-05, 3.115646541118622e-05, 3.204122185707092e-05, 3.292597830295563e-05, 3.381073474884033e-05, 3.469549119472504e-05, 3.558024764060974e-05, 3.6465004086494446e-05, 3.734976053237915e-05, 3.8234516978263855e-05, 3.911927342414856e-05, 4.0004029870033264e-05, 4.088878631591797e-05]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 1.0, 8.0, 17.0, 23.0, 32.0, 59.0, 77.0, 134.0, 203.0, 417.0, 859.0, 1509.0, 3081.0, 6896.0, 15865.0, 38228.0, 96101.0, 411020.0, 325374.0, 88658.0, 33162.0, 14405.0, 6323.0, 3016.0, 1356.0, 747.0, 404.0, 223.0, 130.0, 72.0, 41.0, 33.0, 23.0, 14.0, 6.0, 8.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.131959915161133e-05, -4.954636096954346e-05, -4.7773122787475586e-05, -4.5999884605407715e-05, -4.4226646423339844e-05, -4.245340824127197e-05, -4.06801700592041e-05, -3.890693187713623e-05, -3.713369369506836e-05, -3.536045551300049e-05, -3.358721733093262e-05, -3.1813979148864746e-05, -3.0040740966796875e-05, -2.8267502784729004e-05, -2.6494264602661133e-05, -2.4721026420593262e-05, -2.294778823852539e-05, -2.117455005645752e-05, -1.940131187438965e-05, -1.7628073692321777e-05, -1.5854835510253906e-05, -1.4081597328186035e-05, -1.2308359146118164e-05, -1.0535120964050293e-05, -8.761882781982422e-06, -6.988644599914551e-06, -5.21540641784668e-06, -3.4421682357788086e-06, -1.6689300537109375e-06, 1.043081283569336e-07, 1.8775463104248047e-06, 3.6507844924926758e-06, 5.424022674560547e-06, 7.197260856628418e-06, 8.970499038696289e-06, 1.074373722076416e-05, 1.2516975402832031e-05, 1.4290213584899902e-05, 1.6063451766967773e-05, 1.7836689949035645e-05, 1.9609928131103516e-05, 2.1383166313171387e-05, 2.3156404495239258e-05, 2.492964267730713e-05, 2.6702880859375e-05, 2.847611904144287e-05, 3.0249357223510742e-05, 3.202259540557861e-05, 3.3795833587646484e-05, 3.5569071769714355e-05, 3.7342309951782227e-05, 3.91155481338501e-05, 4.088878631591797e-05, 4.266202449798584e-05, 4.443526268005371e-05, 4.620850086212158e-05, 4.798173904418945e-05, 4.9754977226257324e-05, 5.1528215408325195e-05, 5.3301453590393066e-05, 5.507469177246094e-05, 5.684792995452881e-05, 5.862116813659668e-05, 6.039440631866455e-05, 6.216764450073242e-05]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 4.0, 10.0, 12.0, 11.0, 21.0, 17.0, 28.0, 23.0, 23.0, 34.0, 32.0, 33.0, 33.0, 42.0, 46.0, 59.0, 49.0, 57.0, 45.0, 47.0, 46.0, 36.0, 45.0, 31.0, 42.0, 27.0, 29.0, 23.0, 20.0, 11.0, 14.0, 12.0, 6.0, 6.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.129243850708008e-05, -3.0213966965675354e-05, -2.913549542427063e-05, -2.8057023882865906e-05, -2.697855234146118e-05, -2.5900080800056458e-05, -2.4821609258651733e-05, -2.374313771724701e-05, -2.2664666175842285e-05, -2.158619463443756e-05, -2.0507723093032837e-05, -1.9429251551628113e-05, -1.835078001022339e-05, -1.7272308468818665e-05, -1.619383692741394e-05, -1.5115365386009216e-05, -1.4036893844604492e-05, -1.2958422303199768e-05, -1.1879950761795044e-05, -1.080147922039032e-05, -9.723007678985596e-06, -8.644536137580872e-06, -7.5660645961761475e-06, -6.487593054771423e-06, -5.409121513366699e-06, -4.330649971961975e-06, -3.252178430557251e-06, -2.173706889152527e-06, -1.0952353477478027e-06, -1.6763806343078613e-08, 1.0617077350616455e-06, 2.1401792764663696e-06, 3.2186508178710938e-06, 4.297122359275818e-06, 5.375593900680542e-06, 6.454065442085266e-06, 7.53253698348999e-06, 8.611008524894714e-06, 9.689480066299438e-06, 1.0767951607704163e-05, 1.1846423149108887e-05, 1.292489469051361e-05, 1.4003366231918335e-05, 1.5081837773323059e-05, 1.6160309314727783e-05, 1.7238780856132507e-05, 1.831725239753723e-05, 1.9395723938941956e-05, 2.047419548034668e-05, 2.1552667021751404e-05, 2.2631138563156128e-05, 2.3709610104560852e-05, 2.4788081645965576e-05, 2.58665531873703e-05, 2.6945024728775024e-05, 2.802349627017975e-05, 2.9101967811584473e-05, 3.0180439352989197e-05, 3.125891089439392e-05, 3.2337382435798645e-05, 3.341585397720337e-05, 3.449432551860809e-05, 3.557279706001282e-05, 3.665126860141754e-05, 3.7729740142822266e-05]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 5.0, 9.0, 14.0, 19.0, 12.0, 26.0, 50.0, 34.0, 79.0, 107.0, 69.0, 202.0, 274.0, 407.0, 288.0, 828.0, 1332.0, 965.0, 3025.0, 5521.0, 4479.0, 15846.0, 39120.0, 122566.0, 175922.0, 481566.0, 123049.0, 24142.0, 24549.0, 10804.0, 5560.0, 1717.0, 2328.0, 1295.0, 445.0, 654.0, 401.0, 133.0, 208.0, 149.0, 114.0, 34.0, 67.0, 39.0, 15.0, 22.0, 18.0, 10.0, 11.0, 7.0, 6.0, 5.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-3.159046173095703e-06, -3.057532012462616e-06, -2.956017851829529e-06, -2.8545036911964417e-06, -2.7529895305633545e-06, -2.6514753699302673e-06, -2.54996120929718e-06, -2.448447048664093e-06, -2.346932888031006e-06, -2.2454187273979187e-06, -2.1439045667648315e-06, -2.0423904061317444e-06, -1.9408762454986572e-06, -1.83936208486557e-06, -1.737847924232483e-06, -1.6363337635993958e-06, -1.5348196029663086e-06, -1.4333054423332214e-06, -1.3317912817001343e-06, -1.2302771210670471e-06, -1.12876296043396e-06, -1.0272487998008728e-06, -9.257346391677856e-07, -8.242204785346985e-07, -7.227063179016113e-07, -6.211921572685242e-07, -5.19677996635437e-07, -4.1816383600234985e-07, -3.166496753692627e-07, -2.1513551473617554e-07, -1.1362135410308838e-07, -1.210719347000122e-08, 8.940696716308594e-08, 1.909211277961731e-07, 2.9243528842926025e-07, 3.939494490623474e-07, 4.954636096954346e-07, 5.969777703285217e-07, 6.984919309616089e-07, 8.00006091594696e-07, 9.015202522277832e-07, 1.0030344128608704e-06, 1.1045485734939575e-06, 1.2060627341270447e-06, 1.3075768947601318e-06, 1.409091055393219e-06, 1.5106052160263062e-06, 1.6121193766593933e-06, 1.7136335372924805e-06, 1.8151476979255676e-06, 1.9166618585586548e-06, 2.018176019191742e-06, 2.119690179824829e-06, 2.2212043404579163e-06, 2.3227185010910034e-06, 2.4242326617240906e-06, 2.5257468223571777e-06, 2.627260982990265e-06, 2.728775143623352e-06, 2.830289304256439e-06, 2.9318034648895264e-06, 3.0333176255226135e-06, 3.1348317861557007e-06, 3.236345946788788e-06, 3.337860107421875e-06]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 7.0, 15.0, 0.0, 12.0, 24.0, 20.0, 44.0, 55.0, 76.0, 0.0, 84.0, 108.0, 119.0, 112.0, 89.0, 65.0, 0.0, 58.0, 25.0, 24.0, 20.0, 10.0, 11.0, 0.0, 8.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5581026673316956e-06, -1.5068799257278442e-06, -1.455657184123993e-06, -1.4044344425201416e-06, -1.3532117009162903e-06, -1.301988959312439e-06, -1.2507662177085876e-06, -1.1995434761047363e-06, -1.148320734500885e-06, -1.0970979928970337e-06, -1.0458752512931824e-06, -9.94652509689331e-07, -9.434297680854797e-07, -8.922070264816284e-07, -8.409842848777771e-07, -7.897615432739258e-07, -7.385388016700745e-07, -6.873160600662231e-07, -6.360933184623718e-07, -5.848705768585205e-07, -5.336478352546692e-07, -4.824250936508179e-07, -4.3120235204696655e-07, -3.7997961044311523e-07, -3.287568688392639e-07, -2.775341272354126e-07, -2.2631138563156128e-07, -1.7508864402770996e-07, -1.2386590242385864e-07, -7.264316082000732e-08, -2.1420419216156006e-08, 2.9802322387695312e-08, 8.102506399154663e-08, 1.3224780559539795e-07, 1.8347054719924927e-07, 2.3469328880310059e-07, 2.859160304069519e-07, 3.371387720108032e-07, 3.8836151361465454e-07, 4.3958425521850586e-07, 4.908069968223572e-07, 5.420297384262085e-07, 5.932524800300598e-07, 6.444752216339111e-07, 6.956979632377625e-07, 7.469207048416138e-07, 7.981434464454651e-07, 8.493661880493164e-07, 9.005889296531677e-07, 9.51811671257019e-07, 1.0030344128608704e-06, 1.0542571544647217e-06, 1.105479896068573e-06, 1.1567026376724243e-06, 1.2079253792762756e-06, 1.259148120880127e-06, 1.3103708624839783e-06, 1.3615936040878296e-06, 1.412816345691681e-06, 1.4640390872955322e-06, 1.5152618288993835e-06, 1.5664845705032349e-06, 1.6177073121070862e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 10.0, 13.0, 17.0, 47.0, 41.0, 61.0, 103.0, 224.0, 229.0, 387.0, 632.0, 1726.0, 2266.0, 3857.0, 8024.0, 36597.0, 106715.0, 547537.0, 285793.0, 29694.0, 11567.0, 5607.0, 3826.0, 1282.0, 819.0, 510.0, 446.0, 171.0, 120.0, 67.0, 70.0, 38.0, 19.0, 17.0, 5.0, 8.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.410743713378906e-06, -4.275701940059662e-06, -4.1406601667404175e-06, -4.005618393421173e-06, -3.870576620101929e-06, -3.7355348467826843e-06, -3.60049307346344e-06, -3.4654513001441956e-06, -3.330409526824951e-06, -3.1953677535057068e-06, -3.0603259801864624e-06, -2.925284206867218e-06, -2.7902424335479736e-06, -2.6552006602287292e-06, -2.520158886909485e-06, -2.3851171135902405e-06, -2.250075340270996e-06, -2.1150335669517517e-06, -1.9799917936325073e-06, -1.844950020313263e-06, -1.7099082469940186e-06, -1.5748664736747742e-06, -1.4398247003555298e-06, -1.3047829270362854e-06, -1.169741153717041e-06, -1.0346993803977966e-06, -8.996576070785522e-07, -7.646158337593079e-07, -6.295740604400635e-07, -4.945322871208191e-07, -3.594905138015747e-07, -2.2444874048233032e-07, -8.940696716308594e-08, 4.563480615615845e-08, 1.8067657947540283e-07, 3.157183527946472e-07, 4.507601261138916e-07, 5.85801899433136e-07, 7.208436727523804e-07, 8.558854460716248e-07, 9.909272193908691e-07, 1.1259689927101135e-06, 1.261010766029358e-06, 1.3960525393486023e-06, 1.5310943126678467e-06, 1.666136085987091e-06, 1.8011778593063354e-06, 1.93621963262558e-06, 2.0712614059448242e-06, 2.2063031792640686e-06, 2.341344952583313e-06, 2.4763867259025574e-06, 2.6114284992218018e-06, 2.746470272541046e-06, 2.8815120458602905e-06, 3.016553819179535e-06, 3.1515955924987793e-06, 3.2866373658180237e-06, 3.421679139137268e-06, 3.5567209124565125e-06, 3.691762685775757e-06, 3.826804459095001e-06, 3.961846232414246e-06, 4.09688800573349e-06, 4.231929779052734e-06]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 11.0, 6.0, 7.0, 6.0, 19.0, 20.0, 39.0, 22.0, 52.0, 62.0, 125.0, 166.0, 62.0, 110.0, 56.0, 70.0, 30.0, 37.0, 12.0, 19.0, 8.0, 16.0, 5.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9802322387695312e-06, -2.88989394903183e-06, -2.7995556592941284e-06, -2.709217369556427e-06, -2.6188790798187256e-06, -2.528540790081024e-06, -2.4382025003433228e-06, -2.3478642106056213e-06, -2.25752592086792e-06, -2.1671876311302185e-06, -2.076849341392517e-06, -1.9865110516548157e-06, -1.8961727619171143e-06, -1.8058344721794128e-06, -1.7154961824417114e-06, -1.62515789270401e-06, -1.5348196029663086e-06, -1.4444813132286072e-06, -1.3541430234909058e-06, -1.2638047337532043e-06, -1.173466444015503e-06, -1.0831281542778015e-06, -9.927898645401e-07, -9.024515748023987e-07, -8.121132850646973e-07, -7.217749953269958e-07, -6.314367055892944e-07, -5.41098415851593e-07, -4.507601261138916e-07, -3.604218363761902e-07, -2.7008354663848877e-07, -1.7974525690078735e-07, -8.940696716308594e-08, 9.313225746154785e-10, 9.12696123123169e-08, 1.816079020500183e-07, 2.7194619178771973e-07, 3.6228448152542114e-07, 4.5262277126312256e-07, 5.42961061000824e-07, 6.332993507385254e-07, 7.236376404762268e-07, 8.139759302139282e-07, 9.043142199516296e-07, 9.94652509689331e-07, 1.0849907994270325e-06, 1.1753290891647339e-06, 1.2656673789024353e-06, 1.3560056686401367e-06, 1.4463439583778381e-06, 1.5366822481155396e-06, 1.627020537853241e-06, 1.7173588275909424e-06, 1.8076971173286438e-06, 1.8980354070663452e-06, 1.9883736968040466e-06, 2.078711986541748e-06, 2.1690502762794495e-06, 2.259388566017151e-06, 2.3497268557548523e-06, 2.4400651454925537e-06, 2.530403435230255e-06, 2.6207417249679565e-06, 2.711080014705658e-06, 2.8014183044433594e-06]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 10.0, 21.0, 19.0, 23.0, 34.0, 51.0, 102.0, 121.0, 178.0, 85.0, 61.0, 56.0, 37.0, 37.0, 29.0, 20.0, 20.0, 14.0, 9.0, 12.0, 7.0, 3.0, 7.0, 5.0, 8.0, 4.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.611773566575721e-05, -9.229796705767512e-05, -8.847819844959304e-05, -8.465842984151095e-05, -8.083865395747125e-05, -7.701888534938917e-05, -7.319911674130708e-05, -6.9379348133225e-05, -6.555957952514291e-05, -6.173981091706082e-05, -5.792003867099993e-05, -5.4100270062917843e-05, -5.028049781685695e-05, -4.6460729208774865e-05, -4.264096060069278e-05, -3.882119199261069e-05, -3.500141610857099e-05, -3.118164750048891e-05, -2.7361875254428014e-05, -2.354210664634593e-05, -1.972233621927444e-05, -1.590256579220295e-05, -1.2082797184120864e-05, -8.263026757049374e-06, -4.443256329977885e-06, -6.234863576537464e-07, 3.196283614670392e-06, 7.01605313224718e-06, 1.0835823559318669e-05, 1.4655593986390159e-05, 1.8475362594472244e-05, 2.2295133021543734e-05, 2.611489617265761e-05, 2.99346665997291e-05, 3.375443702680059e-05, 3.7574205634882674e-05, 4.1393977880943567e-05, 4.521374648902565e-05, 4.903351509710774e-05, 5.2853283705189824e-05, 5.667305595125072e-05, 6.04928245593328e-05, 6.43125968053937e-05, 6.813236541347578e-05, 7.195213402155787e-05, 7.577190990559757e-05, 7.959167123772204e-05, 8.341144712176174e-05, 8.723121572984383e-05, 9.105098433792591e-05, 9.4870752946008e-05, 9.869052155409008e-05, 0.00010251029743812978, 0.00010633006604621187, 0.00011014983465429395, 0.00011396960326237604, 0.00011778937187045813, 0.00012160914047854021, 0.0001254289090866223, 0.000129248684970662, 0.00013306844630278647, 0.00013688822218682617, 0.00014070799807086587, 0.00014452775940299034, 0.00014834753528703004]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 6.0, 9.0, 16.0, 13.0, 13.0, 13.0, 19.0, 24.0, 23.0, 20.0, 38.0, 34.0, 36.0, 51.0, 36.0, 50.0, 47.0, 53.0, 51.0, 33.0, 55.0, 46.0, 25.0, 45.0, 43.0, 25.0, 28.0, 23.0, 19.0, 22.0, 13.0, 13.0, 11.0, 13.0, 5.0, 7.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.285045623779297e-05, -7.992982864379883e-05, -7.700920104980469e-05, -7.408857345581055e-05, -7.11679458618164e-05, -6.824731826782227e-05, -6.532669067382812e-05, -6.240606307983398e-05, -5.9485435485839844e-05, -5.65648078918457e-05, -5.364418029785156e-05, -5.072355270385742e-05, -4.780292510986328e-05, -4.488229751586914e-05, -4.1961669921875e-05, -3.904104232788086e-05, -3.612041473388672e-05, -3.319978713989258e-05, -3.0279159545898438e-05, -2.7358531951904297e-05, -2.4437904357910156e-05, -2.1517276763916016e-05, -1.8596649169921875e-05, -1.5676021575927734e-05, -1.2755393981933594e-05, -9.834766387939453e-06, -6.9141387939453125e-06, -3.993511199951172e-06, -1.0728836059570312e-06, 1.8477439880371094e-06, 4.76837158203125e-06, 7.68899917602539e-06, 1.0609626770019531e-05, 1.3530254364013672e-05, 1.6450881958007812e-05, 1.9371509552001953e-05, 2.2292137145996094e-05, 2.5212764739990234e-05, 2.8133392333984375e-05, 3.1054019927978516e-05, 3.3974647521972656e-05, 3.68952751159668e-05, 3.981590270996094e-05, 4.273653030395508e-05, 4.565715789794922e-05, 4.857778549194336e-05, 5.14984130859375e-05, 5.441904067993164e-05, 5.733966827392578e-05, 6.026029586791992e-05, 6.318092346191406e-05, 6.61015510559082e-05, 6.902217864990234e-05, 7.194280624389648e-05, 7.486343383789062e-05, 7.778406143188477e-05, 8.07046890258789e-05, 8.362531661987305e-05, 8.654594421386719e-05, 8.946657180786133e-05, 9.238719940185547e-05, 9.530782699584961e-05, 9.822845458984375e-05, 0.00010114908218383789, 0.00010406970977783203]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 7.0, 10.0, 14.0, 16.0, 27.0, 38.0, 45.0, 71.0, 95.0, 124.0, 220.0, 308.0, 494.0, 815.0, 1304.0, 2318.0, 4123.0, 8353.0, 19141.0, 62385.0, 3325997.0, 700502.0, 38749.0, 13890.0, 6420.0, 3407.0, 1962.0, 1065.0, 724.0, 498.0, 331.0, 220.0, 198.0, 117.0, 86.0, 61.0, 37.0, 25.0, 20.0, 18.0, 13.0, 10.0, 4.0, 12.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.0617923736572266e-05, -5.871523171663284e-05, -5.681253969669342e-05, -5.4909847676754e-05, -5.3007155656814575e-05, -5.110446363687515e-05, -4.920177161693573e-05, -4.729907959699631e-05, -4.5396387577056885e-05, -4.349369555711746e-05, -4.159100353717804e-05, -3.968831151723862e-05, -3.7785619497299194e-05, -3.588292747735977e-05, -3.398023545742035e-05, -3.2077543437480927e-05, -3.0174851417541504e-05, -2.827215939760208e-05, -2.636946737766266e-05, -2.4466775357723236e-05, -2.2564083337783813e-05, -2.066139131784439e-05, -1.8758699297904968e-05, -1.6856007277965546e-05, -1.4953315258026123e-05, -1.30506232380867e-05, -1.1147931218147278e-05, -9.245239198207855e-06, -7.342547178268433e-06, -5.43985515832901e-06, -3.5371631383895874e-06, -1.6344711184501648e-06, 2.682209014892578e-07, 2.1709129214286804e-06, 4.073604941368103e-06, 5.976296961307526e-06, 7.878988981246948e-06, 9.781681001186371e-06, 1.1684373021125793e-05, 1.3587065041065216e-05, 1.548975706100464e-05, 1.739244908094406e-05, 1.9295141100883484e-05, 2.1197833120822906e-05, 2.310052514076233e-05, 2.5003217160701752e-05, 2.6905909180641174e-05, 2.8808601200580597e-05, 3.071129322052002e-05, 3.261398524045944e-05, 3.4516677260398865e-05, 3.641936928033829e-05, 3.832206130027771e-05, 4.022475332021713e-05, 4.2127445340156555e-05, 4.403013736009598e-05, 4.59328293800354e-05, 4.783552139997482e-05, 4.9738213419914246e-05, 5.164090543985367e-05, 5.354359745979309e-05, 5.5446289479732513e-05, 5.7348981499671936e-05, 5.925167351961136e-05, 6.115436553955078e-05]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 2.0, 12.0, 10.0, 12.0, 21.0, 21.0, 16.0, 36.0, 33.0, 64.0, 75.0, 80.0, 78.0, 81.0, 96.0, 63.0, 67.0, 46.0, 36.0, 40.0, 20.0, 23.0, 14.0, 10.0, 4.0, 6.0, 4.0, 6.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52587890625e-05, -1.4740973711013794e-05, -1.4223158359527588e-05, -1.3705343008041382e-05, -1.3187527656555176e-05, -1.266971230506897e-05, -1.2151896953582764e-05, -1.1634081602096558e-05, -1.1116266250610352e-05, -1.0598450899124146e-05, -1.008063554763794e-05, -9.562820196151733e-06, -9.045004844665527e-06, -8.527189493179321e-06, -8.009374141693115e-06, -7.491558790206909e-06, -6.973743438720703e-06, -6.455928087234497e-06, -5.938112735748291e-06, -5.420297384262085e-06, -4.902482032775879e-06, -4.384666681289673e-06, -3.866851329803467e-06, -3.3490359783172607e-06, -2.8312206268310547e-06, -2.3134052753448486e-06, -1.7955899238586426e-06, -1.2777745723724365e-06, -7.599592208862305e-07, -2.421438694000244e-07, 2.7567148208618164e-07, 7.934868335723877e-07, 1.3113021850585938e-06, 1.8291175365447998e-06, 2.346932888031006e-06, 2.864748239517212e-06, 3.382563591003418e-06, 3.900378942489624e-06, 4.41819429397583e-06, 4.936009645462036e-06, 5.453824996948242e-06, 5.971640348434448e-06, 6.489455699920654e-06, 7.00727105140686e-06, 7.525086402893066e-06, 8.042901754379272e-06, 8.560717105865479e-06, 9.078532457351685e-06, 9.59634780883789e-06, 1.0114163160324097e-05, 1.0631978511810303e-05, 1.1149793863296509e-05, 1.1667609214782715e-05, 1.2185424566268921e-05, 1.2703239917755127e-05, 1.3221055269241333e-05, 1.3738870620727539e-05, 1.4256685972213745e-05, 1.4774501323699951e-05, 1.5292316675186157e-05, 1.5810132026672363e-05, 1.632794737815857e-05, 1.6845762729644775e-05, 1.736357808113098e-05, 1.7881393432617188e-05]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 16.0, 23.0, 28.0, 40.0, 63.0, 117.0, 185.0, 361.0, 683.0, 1316.0, 2751.0, 6010.0, 14023.0, 34822.0, 120865.0, 3437661.0, 471676.0, 61740.0, 23331.0, 9787.0, 4351.0, 2118.0, 1070.0, 515.0, 296.0, 161.0, 88.0, 61.0, 36.0, 21.0, 21.0, 17.0, 6.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2557716369628906e-05, -4.112906754016876e-05, -3.970041871070862e-05, -3.8271769881248474e-05, -3.684312105178833e-05, -3.5414472222328186e-05, -3.398582339286804e-05, -3.25571745634079e-05, -3.1128525733947754e-05, -2.969987690448761e-05, -2.8271228075027466e-05, -2.6842579245567322e-05, -2.5413930416107178e-05, -2.3985281586647034e-05, -2.255663275718689e-05, -2.1127983927726746e-05, -1.96993350982666e-05, -1.8270686268806458e-05, -1.6842037439346313e-05, -1.541338860988617e-05, -1.3984739780426025e-05, -1.2556090950965881e-05, -1.1127442121505737e-05, -9.698793292045593e-06, -8.27014446258545e-06, -6.841495633125305e-06, -5.412846803665161e-06, -3.984197974205017e-06, -2.555549144744873e-06, -1.126900315284729e-06, 3.0174851417541504e-07, 1.730397343635559e-06, 3.159046173095703e-06, 4.587695002555847e-06, 6.016343832015991e-06, 7.444992661476135e-06, 8.87364149093628e-06, 1.0302290320396423e-05, 1.1730939149856567e-05, 1.3159587979316711e-05, 1.4588236808776855e-05, 1.6016885638237e-05, 1.7445534467697144e-05, 1.8874183297157288e-05, 2.030283212661743e-05, 2.1731480956077576e-05, 2.316012978553772e-05, 2.4588778614997864e-05, 2.6017427444458008e-05, 2.7446076273918152e-05, 2.8874725103378296e-05, 3.030337393283844e-05, 3.1732022762298584e-05, 3.316067159175873e-05, 3.458932042121887e-05, 3.6017969250679016e-05, 3.744661808013916e-05, 3.8875266909599304e-05, 4.030391573905945e-05, 4.173256456851959e-05, 4.3161213397979736e-05, 4.458986222743988e-05, 4.6018511056900024e-05, 4.744715988636017e-05, 4.887580871582031e-05]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 4.0, 4.0, 11.0, 15.0, 14.0, 19.0, 20.0, 23.0, 27.0, 36.0, 57.0, 104.0, 233.0, 640.0, 1523.0, 744.0, 246.0, 86.0, 55.0, 48.0, 32.0, 21.0, 18.0, 9.0, 20.0, 16.0, 4.0, 9.0, 7.0, 5.0, 3.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4259090423583984e-05, -2.3310072720050812e-05, -2.236105501651764e-05, -2.1412037312984467e-05, -2.0463019609451294e-05, -1.951400190591812e-05, -1.856498420238495e-05, -1.7615966498851776e-05, -1.6666948795318604e-05, -1.571793109178543e-05, -1.4768913388252258e-05, -1.3819895684719086e-05, -1.2870877981185913e-05, -1.192186027765274e-05, -1.0972842574119568e-05, -1.0023824870586395e-05, -9.074807167053223e-06, -8.12578946352005e-06, -7.1767717599868774e-06, -6.227754056453705e-06, -5.278736352920532e-06, -4.32971864938736e-06, -3.380700945854187e-06, -2.4316832423210144e-06, -1.4826655387878418e-06, -5.336478352546692e-07, 4.153698682785034e-07, 1.364387571811676e-06, 2.3134052753448486e-06, 3.2624229788780212e-06, 4.211440682411194e-06, 5.1604583859443665e-06, 6.109476089477539e-06, 7.058493793010712e-06, 8.007511496543884e-06, 8.956529200077057e-06, 9.90554690361023e-06, 1.0854564607143402e-05, 1.1803582310676575e-05, 1.2752600014209747e-05, 1.370161771774292e-05, 1.4650635421276093e-05, 1.5599653124809265e-05, 1.6548670828342438e-05, 1.749768853187561e-05, 1.8446706235408783e-05, 1.9395723938941956e-05, 2.0344741642475128e-05, 2.12937593460083e-05, 2.2242777049541473e-05, 2.3191794753074646e-05, 2.414081245660782e-05, 2.508983016014099e-05, 2.6038847863674164e-05, 2.6987865567207336e-05, 2.793688327074051e-05, 2.888590097427368e-05, 2.9834918677806854e-05, 3.078393638134003e-05, 3.17329540848732e-05, 3.268197178840637e-05, 3.3630989491939545e-05, 3.458000719547272e-05, 3.552902489900589e-05, 3.647804260253906e-05]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 10.0, 8.0, 12.0, 12.0, 23.0, 19.0, 17.0, 34.0, 60.0, 57.0, 62.0, 85.0, 109.0, 83.0, 89.0, 51.0, 38.0, 37.0, 24.0, 26.0, 26.0, 12.0, 20.0, 14.0, 14.0, 5.0, 10.0, 3.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.355880320072174e-05, -9.024501196108758e-05, -8.693122799741104e-05, -8.361743675777689e-05, -8.030364551814273e-05, -7.698986155446619e-05, -7.367607031483203e-05, -7.036227907519788e-05, -6.704848783556372e-05, -6.373469659592956e-05, -6.0420908994274214e-05, -5.7107121392618865e-05, -5.379333015298471e-05, -5.047954255132936e-05, -4.716575494967401e-05, -4.3851963710039854e-05, -4.053817974636331e-05, -3.722439214470796e-05, -3.391060090507381e-05, -3.059681330341846e-05, -2.7283023882773705e-05, -2.3969234462128952e-05, -2.0655446860473603e-05, -1.734165743982885e-05, -1.4027868019184098e-05, -1.0714078598539345e-05, -7.400290087389294e-06, -4.086501576239243e-06, -7.727121555944905e-07, 2.5410772650502622e-06, 5.854864866705611e-06, 9.168654287350364e-06, 1.2482450983952731e-05, 1.5796240404597484e-05, 1.9110029825242236e-05, 2.2423817426897585e-05, 2.5737606847542338e-05, 2.905139626818709e-05, 3.236518386984244e-05, 3.5678975109476596e-05, 3.8992762711131945e-05, 4.2306550312787294e-05, 4.562034155242145e-05, 4.89341291540768e-05, 5.224791675573215e-05, 5.5561707995366305e-05, 5.8875495597021654e-05, 6.2189283198677e-05, 6.550307443831116e-05, 6.881686567794532e-05, 7.213064964162186e-05, 7.544444088125601e-05, 7.875823212089017e-05, 8.207201608456671e-05, 8.538580732420087e-05, 8.869959856383502e-05, 9.201338980346918e-05, 9.532718104310334e-05, 9.864096500677988e-05, 0.00010195475624641404, 0.00010526854748604819, 0.00010858233144972473, 0.00011189612268935889, 0.00011520991392899305, 0.00011852369789266959]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 11.0, 3.0, 11.0, 3.0, 8.0, 7.0, 8.0, 10.0, 10.0, 15.0, 13.0, 26.0, 17.0, 27.0, 23.0, 24.0, 27.0, 40.0, 43.0, 37.0, 38.0, 36.0, 48.0, 42.0, 41.0, 29.0, 46.0, 34.0, 33.0, 40.0, 32.0, 29.0, 26.0, 20.0, 23.0, 18.0, 14.0, 25.0, 16.0, 9.0, 16.0, 10.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.341934204101562e-05, -6.139371544122696e-05, -5.9368088841438293e-05, -5.734246224164963e-05, -5.531683564186096e-05, -5.3291209042072296e-05, -5.126558244228363e-05, -4.9239955842494965e-05, -4.72143292427063e-05, -4.518870264291763e-05, -4.316307604312897e-05, -4.11374494433403e-05, -3.9111822843551636e-05, -3.708619624376297e-05, -3.5060569643974304e-05, -3.303494304418564e-05, -3.100931644439697e-05, -2.8983689844608307e-05, -2.695806324481964e-05, -2.4932436645030975e-05, -2.290681004524231e-05, -2.0881183445453644e-05, -1.8855556845664978e-05, -1.6829930245876312e-05, -1.4804303646087646e-05, -1.277867704629898e-05, -1.0753050446510315e-05, -8.72742384672165e-06, -6.701797246932983e-06, -4.676170647144318e-06, -2.650544047355652e-06, -6.249174475669861e-07, 1.4007091522216797e-06, 3.4263357520103455e-06, 5.451962351799011e-06, 7.477588951587677e-06, 9.503215551376343e-06, 1.1528842151165009e-05, 1.3554468750953674e-05, 1.558009535074234e-05, 1.7605721950531006e-05, 1.963134855031967e-05, 2.1656975150108337e-05, 2.3682601749897003e-05, 2.570822834968567e-05, 2.7733854949474335e-05, 2.9759481549263e-05, 3.1785108149051666e-05, 3.381073474884033e-05, 3.5836361348629e-05, 3.7861987948417664e-05, 3.988761454820633e-05, 4.1913241147994995e-05, 4.393886774778366e-05, 4.596449434757233e-05, 4.799012094736099e-05, 5.001574754714966e-05, 5.2041374146938324e-05, 5.406700074672699e-05, 5.6092627346515656e-05, 5.811825394630432e-05, 6.014388054609299e-05, 6.216950714588165e-05, 6.419513374567032e-05, 6.622076034545898e-05]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 9.0, 5.0, 6.0, 12.0, 11.0, 13.0, 18.0, 24.0, 28.0, 29.0, 53.0, 76.0, 145.0, 263.0, 654.0, 1438.0, 3395.0, 8550.0, 25979.0, 107971.0, 652776.0, 187824.0, 39481.0, 11651.0, 4544.0, 1884.0, 839.0, 375.0, 187.0, 96.0, 50.0, 37.0, 24.0, 20.0, 18.0, 22.0, 7.0, 10.0, 6.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00013744831085205078, -0.00013296492397785187, -0.00012848153710365295, -0.00012399815022945404, -0.00011951476335525513, -0.00011503137648105621, -0.0001105479896068573, -0.00010606460273265839, -0.00010158121585845947, -9.709782898426056e-05, -9.261444211006165e-05, -8.813105523586273e-05, -8.364766836166382e-05, -7.91642814874649e-05, -7.468089461326599e-05, -7.019750773906708e-05, -6.571412086486816e-05, -6.123073399066925e-05, -5.674734711647034e-05, -5.226396024227142e-05, -4.778057336807251e-05, -4.3297186493873596e-05, -3.881379961967468e-05, -3.433041274547577e-05, -2.9847025871276855e-05, -2.5363638997077942e-05, -2.088025212287903e-05, -1.6396865248680115e-05, -1.1913478374481201e-05, -7.430091500282288e-06, -2.946704626083374e-06, 1.5366822481155396e-06, 6.020069122314453e-06, 1.0503455996513367e-05, 1.498684287071228e-05, 1.9470229744911194e-05, 2.3953616619110107e-05, 2.843700349330902e-05, 3.2920390367507935e-05, 3.740377724170685e-05, 4.188716411590576e-05, 4.6370550990104675e-05, 5.085393786430359e-05, 5.53373247385025e-05, 5.9820711612701416e-05, 6.430409848690033e-05, 6.878748536109924e-05, 7.327087223529816e-05, 7.775425910949707e-05, 8.223764598369598e-05, 8.67210328578949e-05, 9.120441973209381e-05, 9.568780660629272e-05, 0.00010017119348049164, 0.00010465458035469055, 0.00010913796722888947, 0.00011362135410308838, 0.00011810474097728729, 0.0001225881278514862, 0.00012707151472568512, 0.00013155490159988403, 0.00013603828847408295, 0.00014052167534828186, 0.00014500506222248077, 0.0001494884490966797]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 14.0, 8.0, 10.0, 18.0, 58.0, 44.0, 92.0, 109.0, 129.0, 109.0, 110.0, 78.0, 60.0, 46.0, 41.0, 19.0, 14.0, 12.0, 7.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5795230865478516e-05, -1.5014782547950745e-05, -1.4234334230422974e-05, -1.3453885912895203e-05, -1.2673437595367432e-05, -1.189298927783966e-05, -1.111254096031189e-05, -1.0332092642784119e-05, -9.551644325256348e-06, -8.771196007728577e-06, -7.990747690200806e-06, -7.210299372673035e-06, -6.429851055145264e-06, -5.649402737617493e-06, -4.868954420089722e-06, -4.088506102561951e-06, -3.3080577850341797e-06, -2.5276094675064087e-06, -1.7471611499786377e-06, -9.667128324508667e-07, -1.862645149230957e-07, 5.941838026046753e-07, 1.3746321201324463e-06, 2.1550804376602173e-06, 2.9355287551879883e-06, 3.7159770727157593e-06, 4.49642539024353e-06, 5.276873707771301e-06, 6.057322025299072e-06, 6.837770342826843e-06, 7.618218660354614e-06, 8.398666977882385e-06, 9.179115295410156e-06, 9.959563612937927e-06, 1.0740011930465698e-05, 1.152046024799347e-05, 1.230090856552124e-05, 1.3081356883049011e-05, 1.3861805200576782e-05, 1.4642253518104553e-05, 1.5422701835632324e-05, 1.6203150153160095e-05, 1.6983598470687866e-05, 1.7764046788215637e-05, 1.8544495105743408e-05, 1.932494342327118e-05, 2.010539174079895e-05, 2.088584005832672e-05, 2.1666288375854492e-05, 2.2446736693382263e-05, 2.3227185010910034e-05, 2.4007633328437805e-05, 2.4788081645965576e-05, 2.5568529963493347e-05, 2.6348978281021118e-05, 2.712942659854889e-05, 2.790987491607666e-05, 2.869032323360443e-05, 2.9470771551132202e-05, 3.0251219868659973e-05, 3.1031668186187744e-05, 3.1812116503715515e-05, 3.2592564821243286e-05, 3.337301313877106e-05, 3.415346145629883e-05]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 6.0, 18.0, 27.0, 27.0, 43.0, 60.0, 105.0, 187.0, 281.0, 462.0, 936.0, 1477.0, 2780.0, 4718.0, 8757.0, 16687.0, 29837.0, 64536.0, 149439.0, 451320.0, 177516.0, 66801.0, 33984.0, 16925.0, 9496.0, 5417.0, 2842.0, 1651.0, 909.0, 482.0, 298.0, 183.0, 124.0, 72.0, 39.0, 45.0, 31.0, 11.0, 9.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.3451786041259766e-05, -4.2117200791835785e-05, -4.0782615542411804e-05, -3.9448030292987823e-05, -3.811344504356384e-05, -3.677885979413986e-05, -3.544427454471588e-05, -3.41096892952919e-05, -3.277510404586792e-05, -3.144051879644394e-05, -3.010593354701996e-05, -2.8771348297595978e-05, -2.7436763048171997e-05, -2.6102177798748016e-05, -2.4767592549324036e-05, -2.3433007299900055e-05, -2.2098422050476074e-05, -2.0763836801052094e-05, -1.9429251551628113e-05, -1.8094666302204132e-05, -1.676008105278015e-05, -1.542549580335617e-05, -1.409091055393219e-05, -1.275632530450821e-05, -1.1421740055084229e-05, -1.0087154805660248e-05, -8.752569556236267e-06, -7.417984306812286e-06, -6.083399057388306e-06, -4.748813807964325e-06, -3.4142285585403442e-06, -2.0796433091163635e-06, -7.450580596923828e-07, 5.895271897315979e-07, 1.9241124391555786e-06, 3.2586976885795593e-06, 4.59328293800354e-06, 5.927868187427521e-06, 7.2624534368515015e-06, 8.597038686275482e-06, 9.931623935699463e-06, 1.1266209185123444e-05, 1.2600794434547424e-05, 1.3935379683971405e-05, 1.5269964933395386e-05, 1.6604550182819366e-05, 1.7939135432243347e-05, 1.9273720681667328e-05, 2.060830593109131e-05, 2.194289118051529e-05, 2.327747642993927e-05, 2.461206167936325e-05, 2.594664692878723e-05, 2.7281232178211212e-05, 2.8615817427635193e-05, 2.9950402677059174e-05, 3.1284987926483154e-05, 3.2619573175907135e-05, 3.3954158425331116e-05, 3.5288743674755096e-05, 3.662332892417908e-05, 3.795791417360306e-05, 3.929249942302704e-05, 4.062708467245102e-05, 4.1961669921875e-05]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 11.0, 13.0, 4.0, 10.0, 10.0, 14.0, 13.0, 24.0, 22.0, 14.0, 35.0, 22.0, 31.0, 44.0, 49.0, 41.0, 42.0, 37.0, 61.0, 43.0, 46.0, 35.0, 44.0, 38.0, 38.0, 32.0, 32.0, 32.0, 22.0, 31.0, 18.0, 14.0, 11.0, 16.0, 17.0, 11.0, 14.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.1113624572753906e-05, -3.016740083694458e-05, -2.9221177101135254e-05, -2.8274953365325928e-05, -2.73287296295166e-05, -2.6382505893707275e-05, -2.543628215789795e-05, -2.4490058422088623e-05, -2.3543834686279297e-05, -2.259761095046997e-05, -2.1651387214660645e-05, -2.070516347885132e-05, -1.9758939743041992e-05, -1.8812716007232666e-05, -1.786649227142334e-05, -1.6920268535614014e-05, -1.5974044799804688e-05, -1.5027821063995361e-05, -1.4081597328186035e-05, -1.3135373592376709e-05, -1.2189149856567383e-05, -1.1242926120758057e-05, -1.029670238494873e-05, -9.350478649139404e-06, -8.404254913330078e-06, -7.458031177520752e-06, -6.511807441711426e-06, -5.5655837059021e-06, -4.6193599700927734e-06, -3.6731362342834473e-06, -2.726912498474121e-06, -1.780688762664795e-06, -8.344650268554688e-07, 1.1175870895385742e-07, 1.0579824447631836e-06, 2.0042061805725098e-06, 2.950429916381836e-06, 3.896653652191162e-06, 4.842877388000488e-06, 5.7891011238098145e-06, 6.735324859619141e-06, 7.681548595428467e-06, 8.627772331237793e-06, 9.573996067047119e-06, 1.0520219802856445e-05, 1.1466443538665771e-05, 1.2412667274475098e-05, 1.3358891010284424e-05, 1.430511474609375e-05, 1.5251338481903076e-05, 1.6197562217712402e-05, 1.714378595352173e-05, 1.8090009689331055e-05, 1.903623342514038e-05, 1.9982457160949707e-05, 2.0928680896759033e-05, 2.187490463256836e-05, 2.2821128368377686e-05, 2.3767352104187012e-05, 2.4713575839996338e-05, 2.5659799575805664e-05, 2.660602331161499e-05, 2.7552247047424316e-05, 2.8498470783233643e-05, 2.944469451904297e-05]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 21.0, 20.0, 26.0, 43.0, 101.0, 113.0, 193.0, 333.0, 485.0, 882.0, 1539.0, 2758.0, 5418.0, 11117.0, 26009.0, 71120.0, 258290.0, 464315.0, 130407.0, 41791.0, 16816.0, 7850.0, 3907.0, 2121.0, 1180.0, 882.0, 285.0, 183.0, 110.0, 63.0, 62.0, 28.0, 14.0, 20.0, 8.0, 5.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.172325134277344e-06, -4.050321877002716e-06, -3.928318619728088e-06, -3.8063153624534607e-06, -3.684312105178833e-06, -3.5623088479042053e-06, -3.4403055906295776e-06, -3.31830233335495e-06, -3.1962990760803223e-06, -3.0742958188056946e-06, -2.952292561531067e-06, -2.830289304256439e-06, -2.7082860469818115e-06, -2.586282789707184e-06, -2.464279532432556e-06, -2.3422762751579285e-06, -2.2202730178833008e-06, -2.098269760608673e-06, -1.9762665033340454e-06, -1.8542632460594177e-06, -1.73225998878479e-06, -1.6102567315101624e-06, -1.4882534742355347e-06, -1.366250216960907e-06, -1.2442469596862793e-06, -1.1222437024116516e-06, -1.000240445137024e-06, -8.782371878623962e-07, -7.562339305877686e-07, -6.342306733131409e-07, -5.122274160385132e-07, -3.902241587638855e-07, -2.682209014892578e-07, -1.4621764421463013e-07, -2.421438694000244e-08, 9.778887033462524e-08, 2.1979212760925293e-07, 3.417953848838806e-07, 4.637986421585083e-07, 5.85801899433136e-07, 7.078051567077637e-07, 8.298084139823914e-07, 9.51811671257019e-07, 1.0738149285316467e-06, 1.1958181858062744e-06, 1.317821443080902e-06, 1.4398247003555298e-06, 1.5618279576301575e-06, 1.6838312149047852e-06, 1.8058344721794128e-06, 1.9278377294540405e-06, 2.0498409867286682e-06, 2.171844244003296e-06, 2.2938475012779236e-06, 2.4158507585525513e-06, 2.537854015827179e-06, 2.6598572731018066e-06, 2.7818605303764343e-06, 2.903863787651062e-06, 3.0258670449256897e-06, 3.1478703022003174e-06, 3.269873559474945e-06, 3.3918768167495728e-06, 3.5138800740242004e-06, 3.635883331298828e-06]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 0.0, 8.0, 0.0, 15.0, 0.0, 15.0, 0.0, 24.0, 0.0, 47.0, 0.0, 59.0, 0.0, 78.0, 0.0, 82.0, 0.0, 118.0, 0.0, 123.0, 0.0, 92.0, 0.0, 96.0, 0.0, 80.0, 0.0, 57.0, 0.0, 39.0, 0.0, 27.0, 0.0, 10.0, 0.0, 12.0, 0.0, 12.0, 0.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0132789611816406e-06, -9.834766387939453e-07, -9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 8.0, 4.0, 10.0, 9.0, 23.0, 59.0, 57.0, 74.0, 120.0, 168.0, 258.0, 320.0, 1344.0, 1107.0, 1784.0, 2736.0, 4326.0, 7036.0, 11972.0, 58502.0, 74928.0, 179003.0, 362521.0, 177679.0, 74801.0, 37719.0, 32277.0, 7066.0, 4325.0, 2788.0, 1759.0, 1228.0, 826.0, 913.0, 269.0, 172.0, 130.0, 71.0, 60.0, 31.0, 29.0, 14.0, 12.0, 6.0, 5.0, 1.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0777806639671326e-06, -2.0097941160202026e-06, -1.9418075680732727e-06, -1.8738210201263428e-06, -1.8058344721794128e-06, -1.737847924232483e-06, -1.669861376285553e-06, -1.601874828338623e-06, -1.5338882803916931e-06, -1.4659017324447632e-06, -1.3979151844978333e-06, -1.3299286365509033e-06, -1.2619420886039734e-06, -1.1939555406570435e-06, -1.1259689927101135e-06, -1.0579824447631836e-06, -9.899958968162537e-07, -9.220093488693237e-07, -8.540228009223938e-07, -7.860362529754639e-07, -7.180497050285339e-07, -6.50063157081604e-07, -5.820766091346741e-07, -5.140900611877441e-07, -4.461035132408142e-07, -3.781169652938843e-07, -3.1013041734695435e-07, -2.421438694000244e-07, -1.7415732145309448e-07, -1.0617077350616455e-07, -3.818422555923462e-08, 2.9802322387695312e-08, 9.778887033462524e-08, 1.6577541828155518e-07, 2.337619662284851e-07, 3.0174851417541504e-07, 3.6973506212234497e-07, 4.377216100692749e-07, 5.057081580162048e-07, 5.736947059631348e-07, 6.416812539100647e-07, 7.096678018569946e-07, 7.776543498039246e-07, 8.456408977508545e-07, 9.136274456977844e-07, 9.816139936447144e-07, 1.0496005415916443e-06, 1.1175870895385742e-06, 1.1855736374855042e-06, 1.253560185432434e-06, 1.321546733379364e-06, 1.389533281326294e-06, 1.4575198292732239e-06, 1.5255063772201538e-06, 1.5934929251670837e-06, 1.6614794731140137e-06, 1.7294660210609436e-06, 1.7974525690078735e-06, 1.8654391169548035e-06, 1.9334256649017334e-06, 2.0014122128486633e-06, 2.0693987607955933e-06, 2.137385308742523e-06, 2.205371856689453e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 0.0, 4.0, 4.0, 15.0, 10.0, 18.0, 20.0, 0.0, 34.0, 29.0, 31.0, 36.0, 43.0, 57.0, 0.0, 65.0, 67.0, 68.0, 74.0, 61.0, 61.0, 0.0, 47.0, 38.0, 46.0, 29.0, 35.0, 21.0, 0.0, 15.0, 9.0, 14.0, 7.0, 3.0, 8.0, 0.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5581026673316956e-06, -1.5068799257278442e-06, -1.455657184123993e-06, -1.4044344425201416e-06, -1.3532117009162903e-06, -1.301988959312439e-06, -1.2507662177085876e-06, -1.1995434761047363e-06, -1.148320734500885e-06, -1.0970979928970337e-06, -1.0458752512931824e-06, -9.94652509689331e-07, -9.434297680854797e-07, -8.922070264816284e-07, -8.409842848777771e-07, -7.897615432739258e-07, -7.385388016700745e-07, -6.873160600662231e-07, -6.360933184623718e-07, -5.848705768585205e-07, -5.336478352546692e-07, -4.824250936508179e-07, -4.3120235204696655e-07, -3.7997961044311523e-07, -3.287568688392639e-07, -2.775341272354126e-07, -2.2631138563156128e-07, -1.7508864402770996e-07, -1.2386590242385864e-07, -7.264316082000732e-08, -2.1420419216156006e-08, 2.9802322387695312e-08, 8.102506399154663e-08, 1.3224780559539795e-07, 1.8347054719924927e-07, 2.3469328880310059e-07, 2.859160304069519e-07, 3.371387720108032e-07, 3.8836151361465454e-07, 4.3958425521850586e-07, 4.908069968223572e-07, 5.420297384262085e-07, 5.932524800300598e-07, 6.444752216339111e-07, 6.956979632377625e-07, 7.469207048416138e-07, 7.981434464454651e-07, 8.493661880493164e-07, 9.005889296531677e-07, 9.51811671257019e-07, 1.0030344128608704e-06, 1.0542571544647217e-06, 1.105479896068573e-06, 1.1567026376724243e-06, 1.2079253792762756e-06, 1.259148120880127e-06, 1.3103708624839783e-06, 1.3615936040878296e-06, 1.412816345691681e-06, 1.4640390872955322e-06, 1.5152618288993835e-06, 1.5664845705032349e-06, 1.6177073121070862e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 12.0, 16.0, 17.0, 34.0, 65.0, 120.0, 212.0, 139.0, 93.0, 68.0, 44.0, 29.0, 31.0, 26.0, 15.0, 17.0, 6.0, 12.0, 6.0, 8.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0002032840420724824, -0.00019788120698649436, -0.0001924783573485911, -0.00018707552226260304, -0.000181672687176615, -0.00017626983753871173, -0.00017086700245272368, -0.0001654641528148204, -0.00016006131772883236, -0.00015465848264284432, -0.00014925563300494105, -0.000143852797918953, -0.00013844994828104973, -0.00013304711319506168, -0.00012764427810907364, -0.0001222414430230856, -0.00011683859338518232, -0.00011143575102323666, -0.000106032908661291, -0.00010063007357530296, -9.52272312133573e-05, -8.982438885141164e-05, -8.44215537654236e-05, -7.901871140347794e-05, -7.361586904153228e-05, -6.821302667958662e-05, -6.281018431764096e-05, -5.7407349231652915e-05, -5.2004506869707257e-05, -4.66016645077616e-05, -4.1198825783794746e-05, -3.5795987059827894e-05, -3.0393159249797463e-05, -2.4990318706841208e-05, -1.9587478163884953e-05, -1.4184637620928697e-05, -8.781797077972442e-06, -3.3789565350161865e-06, 2.023884007940069e-06, 7.426722731906921e-06, 1.282956509385258e-05, 1.8232405636808835e-05, 2.363524617976509e-05, 2.9038086722721346e-05, 3.44409272656776e-05, 3.984376962762326e-05, 4.524660835159011e-05, 5.0649447075556964e-05, 5.605228943750262e-05, 6.145513179944828e-05, 6.685797416139394e-05, 7.226080924738199e-05, 7.766365160932764e-05, 8.30664939712733e-05, 8.846932905726135e-05, 9.3872171419207e-05, 9.927501378115267e-05, 0.00010467785614309832, 0.00011008069850504398, 0.00011548353359103203, 0.00012088637595297769, 0.00012628921831492335, 0.0001316920534009114, 0.00013709490303881466, 0.0001424977381248027]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 3.0, 5.0, 10.0, 6.0, 12.0, 8.0, 16.0, 13.0, 15.0, 14.0, 21.0, 24.0, 13.0, 25.0, 18.0, 35.0, 32.0, 26.0, 25.0, 16.0, 47.0, 39.0, 33.0, 38.0, 39.0, 30.0, 38.0, 39.0, 44.0, 35.0, 27.0, 30.0, 25.0, 32.0, 20.0, 14.0, 21.0, 23.0, 19.0, 17.0, 7.0, 10.0, 8.0, 8.0, 6.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.112192153930664e-05, -7.863808423280716e-05, -7.615424692630768e-05, -7.36704096198082e-05, -7.118657231330872e-05, -6.870273500680923e-05, -6.621889770030975e-05, -6.373506039381027e-05, -6.125122308731079e-05, -5.876738578081131e-05, -5.628354847431183e-05, -5.379971116781235e-05, -5.1315873861312866e-05, -4.8832036554813385e-05, -4.6348199248313904e-05, -4.386436194181442e-05, -4.138052463531494e-05, -3.889668732881546e-05, -3.641285002231598e-05, -3.39290127158165e-05, -3.1445175409317017e-05, -2.8961338102817535e-05, -2.6477500796318054e-05, -2.3993663489818573e-05, -2.1509826183319092e-05, -1.902598887681961e-05, -1.654215157032013e-05, -1.4058314263820648e-05, -1.1574476957321167e-05, -9.090639650821686e-06, -6.606802344322205e-06, -4.122965037822723e-06, -1.6391277313232422e-06, 8.44709575176239e-07, 3.3285468816757202e-06, 5.812384188175201e-06, 8.296221494674683e-06, 1.0780058801174164e-05, 1.3263896107673645e-05, 1.5747733414173126e-05, 1.8231570720672607e-05, 2.071540802717209e-05, 2.319924533367157e-05, 2.568308264017105e-05, 2.8166919946670532e-05, 3.0650757253170013e-05, 3.3134594559669495e-05, 3.5618431866168976e-05, 3.810226917266846e-05, 4.058610647916794e-05, 4.306994378566742e-05, 4.55537810921669e-05, 4.803761839866638e-05, 5.052145570516586e-05, 5.3005293011665344e-05, 5.5489130318164825e-05, 5.797296762466431e-05, 6.045680493116379e-05, 6.294064223766327e-05, 6.542447954416275e-05, 6.790831685066223e-05, 7.039215415716171e-05, 7.28759914636612e-05, 7.535982877016068e-05, 7.784366607666016e-05]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 4.0, 13.0, 18.0, 12.0, 19.0, 39.0, 65.0, 99.0, 144.0, 264.0, 462.0, 832.0, 1691.0, 3721.0, 9007.0, 33051.0, 2839354.0, 1260741.0, 29025.0, 8755.0, 3460.0, 1644.0, 812.0, 407.0, 240.0, 130.0, 72.0, 49.0, 32.0, 13.0, 14.0, 14.0, 10.0, 8.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.153915405273438e-05, -7.827393710613251e-05, -7.500872015953064e-05, -7.174350321292877e-05, -6.84782862663269e-05, -6.521306931972504e-05, -6.194785237312317e-05, -5.86826354265213e-05, -5.5417418479919434e-05, -5.2152201533317566e-05, -4.88869845867157e-05, -4.562176764011383e-05, -4.235655069351196e-05, -3.9091333746910095e-05, -3.582611680030823e-05, -3.256089985370636e-05, -2.9295682907104492e-05, -2.6030465960502625e-05, -2.2765249013900757e-05, -1.950003206729889e-05, -1.623481512069702e-05, -1.2969598174095154e-05, -9.704381227493286e-06, -6.4391642808914185e-06, -3.1739473342895508e-06, 9.12696123123169e-08, 3.3564865589141846e-06, 6.621703505516052e-06, 9.88692045211792e-06, 1.3152137398719788e-05, 1.6417354345321655e-05, 1.9682571291923523e-05, 2.294778823852539e-05, 2.6213005185127258e-05, 2.9478222131729126e-05, 3.2743439078330994e-05, 3.600865602493286e-05, 3.927387297153473e-05, 4.25390899181366e-05, 4.5804306864738464e-05, 4.906952381134033e-05, 5.23347407579422e-05, 5.559995770454407e-05, 5.8865174651145935e-05, 6.21303915977478e-05, 6.539560854434967e-05, 6.866082549095154e-05, 7.19260424375534e-05, 7.519125938415527e-05, 7.845647633075714e-05, 8.172169327735901e-05, 8.498691022396088e-05, 8.825212717056274e-05, 9.151734411716461e-05, 9.478256106376648e-05, 9.804777801036835e-05, 0.00010131299495697021, 0.00010457821190357208, 0.00010784342885017395, 0.00011110864579677582, 0.00011437386274337769, 0.00011763907968997955, 0.00012090429663658142, 0.0001241695135831833, 0.00012743473052978516]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 8.0, 5.0, 12.0, 14.0, 20.0, 28.0, 40.0, 77.0, 121.0, 133.0, 129.0, 125.0, 99.0, 70.0, 45.0, 26.0, 18.0, 15.0, 8.0, 4.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09808349609375e-05, -2.0121224224567413e-05, -1.9261613488197327e-05, -1.840200275182724e-05, -1.7542392015457153e-05, -1.6682781279087067e-05, -1.582317054271698e-05, -1.4963559806346893e-05, -1.4103949069976807e-05, -1.324433833360672e-05, -1.2384727597236633e-05, -1.1525116860866547e-05, -1.066550612449646e-05, -9.805895388126373e-06, -8.946284651756287e-06, -8.0866739153862e-06, -7.227063179016113e-06, -6.367452442646027e-06, -5.50784170627594e-06, -4.648230969905853e-06, -3.7886202335357666e-06, -2.92900949716568e-06, -2.0693987607955933e-06, -1.2097880244255066e-06, -3.501772880554199e-07, 5.094334483146667e-07, 1.3690441846847534e-06, 2.22865492105484e-06, 3.0882656574249268e-06, 3.9478763937950134e-06, 4.8074871301651e-06, 5.667097866535187e-06, 6.5267086029052734e-06, 7.38631933927536e-06, 8.245930075645447e-06, 9.105540812015533e-06, 9.96515154838562e-06, 1.0824762284755707e-05, 1.1684373021125793e-05, 1.254398375749588e-05, 1.3403594493865967e-05, 1.4263205230236053e-05, 1.512281596660614e-05, 1.5982426702976227e-05, 1.6842037439346313e-05, 1.77016481757164e-05, 1.8561258912086487e-05, 1.9420869648456573e-05, 2.028048038482666e-05, 2.1140091121196747e-05, 2.1999701857566833e-05, 2.285931259393692e-05, 2.3718923330307007e-05, 2.4578534066677094e-05, 2.543814480304718e-05, 2.6297755539417267e-05, 2.7157366275787354e-05, 2.801697701215744e-05, 2.8876587748527527e-05, 2.9736198484897614e-05, 3.05958092212677e-05, 3.145541995763779e-05, 3.2315030694007874e-05, 3.317464143037796e-05, 3.403425216674805e-05]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 8.0, 8.0, 25.0, 22.0, 34.0, 45.0, 65.0, 130.0, 166.0, 265.0, 402.0, 621.0, 969.0, 1524.0, 2481.0, 4291.0, 6914.0, 12182.0, 22979.0, 48154.0, 142496.0, 3195585.0, 594878.0, 86593.0, 33017.0, 16839.0, 9123.0, 5500.0, 3282.0, 2039.0, 1296.0, 842.0, 485.0, 365.0, 223.0, 140.0, 92.0, 61.0, 53.0, 34.0, 15.0, 7.0, 6.0, 7.0, 7.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.141164779663086e-05, -3.0390918254852295e-05, -2.937018871307373e-05, -2.8349459171295166e-05, -2.73287296295166e-05, -2.6308000087738037e-05, -2.5287270545959473e-05, -2.4266541004180908e-05, -2.3245811462402344e-05, -2.222508192062378e-05, -2.1204352378845215e-05, -2.018362283706665e-05, -1.9162893295288086e-05, -1.814216375350952e-05, -1.7121434211730957e-05, -1.6100704669952393e-05, -1.5079975128173828e-05, -1.4059245586395264e-05, -1.30385160446167e-05, -1.2017786502838135e-05, -1.099705696105957e-05, -9.976327419281006e-06, -8.955597877502441e-06, -7.934868335723877e-06, -6.9141387939453125e-06, -5.893409252166748e-06, -4.872679710388184e-06, -3.851950168609619e-06, -2.8312206268310547e-06, -1.8104910850524902e-06, -7.897615432739258e-07, 2.3096799850463867e-07, 1.2516975402832031e-06, 2.2724270820617676e-06, 3.293156623840332e-06, 4.3138861656188965e-06, 5.334615707397461e-06, 6.355345249176025e-06, 7.37607479095459e-06, 8.396804332733154e-06, 9.417533874511719e-06, 1.0438263416290283e-05, 1.1458992958068848e-05, 1.2479722499847412e-05, 1.3500452041625977e-05, 1.4521181583404541e-05, 1.5541911125183105e-05, 1.656264066696167e-05, 1.7583370208740234e-05, 1.86040997505188e-05, 1.9624829292297363e-05, 2.0645558834075928e-05, 2.1666288375854492e-05, 2.2687017917633057e-05, 2.370774745941162e-05, 2.4728477001190186e-05, 2.574920654296875e-05, 2.6769936084747314e-05, 2.779066562652588e-05, 2.8811395168304443e-05, 2.9832124710083008e-05, 3.085285425186157e-05, 3.187358379364014e-05, 3.28943133354187e-05, 3.3915042877197266e-05]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 4.0, 10.0, 11.0, 6.0, 21.0, 20.0, 22.0, 27.0, 34.0, 42.0, 71.0, 108.0, 355.0, 1038.0, 1406.0, 441.0, 123.0, 69.0, 52.0, 22.0, 25.0, 35.0, 20.0, 13.0, 12.0, 12.0, 12.0, 7.0, 5.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5451183319091797e-05, -2.4577602744102478e-05, -2.370402216911316e-05, -2.283044159412384e-05, -2.195686101913452e-05, -2.1083280444145203e-05, -2.0209699869155884e-05, -1.9336119294166565e-05, -1.8462538719177246e-05, -1.7588958144187927e-05, -1.671537756919861e-05, -1.584179699420929e-05, -1.496821641921997e-05, -1.4094635844230652e-05, -1.3221055269241333e-05, -1.2347474694252014e-05, -1.1473894119262695e-05, -1.0600313544273376e-05, -9.726732969284058e-06, -8.853152394294739e-06, -7.97957181930542e-06, -7.105991244316101e-06, -6.232410669326782e-06, -5.358830094337463e-06, -4.4852495193481445e-06, -3.6116689443588257e-06, -2.738088369369507e-06, -1.864507794380188e-06, -9.909272193908691e-07, -1.1734664440155029e-07, 7.562339305877686e-07, 1.6298145055770874e-06, 2.5033950805664062e-06, 3.376975655555725e-06, 4.250556230545044e-06, 5.124136805534363e-06, 5.997717380523682e-06, 6.8712979555130005e-06, 7.74487853050232e-06, 8.618459105491638e-06, 9.492039680480957e-06, 1.0365620255470276e-05, 1.1239200830459595e-05, 1.2112781405448914e-05, 1.2986361980438232e-05, 1.3859942555427551e-05, 1.473352313041687e-05, 1.560710370540619e-05, 1.6480684280395508e-05, 1.7354264855384827e-05, 1.8227845430374146e-05, 1.9101426005363464e-05, 1.9975006580352783e-05, 2.0848587155342102e-05, 2.172216773033142e-05, 2.259574830532074e-05, 2.346932888031006e-05, 2.4342909455299377e-05, 2.5216490030288696e-05, 2.6090070605278015e-05, 2.6963651180267334e-05, 2.7837231755256653e-05, 2.871081233024597e-05, 2.958439290523529e-05, 3.045797348022461e-05]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 5.0, 5.0, 12.0, 12.0, 12.0, 27.0, 25.0, 44.0, 46.0, 101.0, 112.0, 135.0, 111.0, 55.0, 64.0, 35.0, 43.0, 37.0, 25.0, 19.0, 21.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012105625501135364, -0.0001169121460407041, -0.00011276803707005456, -0.0001086239208234474, -0.00010447981185279787, -0.00010033570288214833, -9.619159391149879e-05, -9.204748494084924e-05, -8.79033759701997e-05, -8.375926699955016e-05, -7.961515802890062e-05, -7.547104905825108e-05, -7.132693281164393e-05, -6.718282384099439e-05, -6.303871487034485e-05, -5.889460589969531e-05, -5.475048965308815e-05, -5.060638068243861e-05, -4.6462268073810264e-05, -4.2318159103160724e-05, -3.8174046494532377e-05, -3.4029937523882836e-05, -2.9885828553233296e-05, -2.5741717763594352e-05, -2.1597606973955408e-05, -1.7453496184316464e-05, -1.3309386304172222e-05, -9.16527642402798e-06, -5.021165634389035e-06, -8.770548447500914e-07, 3.267054125899449e-06, 7.411164915538393e-06, 1.1555268429219723e-05, 1.5699379218858667e-05, 1.984349000849761e-05, 2.398759897914715e-05, 2.8131709768786095e-05, 3.227582055842504e-05, 3.641992952907458e-05, 4.056403849972412e-05, 4.470815110835247e-05, 4.885226007900201e-05, 5.2996372687630355e-05, 5.7140481658279896e-05, 6.128459062892944e-05, 6.542869959957898e-05, 6.957280857022852e-05, 7.371692481683567e-05, 7.786103378748521e-05, 8.200514275813475e-05, 8.614925172878429e-05, 9.029336797539145e-05, 9.443747694604099e-05, 9.858158591669053e-05, 0.00010272569488734007, 0.00010686980385798961, 0.00011101391282863915, 0.00011515802179928869, 0.00011930213076993823, 0.00012344623974058777, 0.0001275903487112373, 0.00013173447223380208, 0.0001358785666525364, 0.00014002269017510116, 0.0001441667991457507]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 8.0, 13.0, 11.0, 13.0, 16.0, 23.0, 15.0, 14.0, 23.0, 30.0, 23.0, 29.0, 41.0, 27.0, 37.0, 43.0, 36.0, 36.0, 41.0, 33.0, 32.0, 42.0, 42.0, 39.0, 46.0, 35.0, 31.0, 27.0, 25.0, 26.0, 15.0, 16.0, 15.0, 14.0, 20.0, 9.0, 8.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.896257400512695e-05, -6.688293069601059e-05, -6.480328738689423e-05, -6.272364407777786e-05, -6.06440007686615e-05, -5.8564357459545135e-05, -5.648471415042877e-05, -5.440507084131241e-05, -5.2325427532196045e-05, -5.024578422307968e-05, -4.816614091396332e-05, -4.6086497604846954e-05, -4.400685429573059e-05, -4.192721098661423e-05, -3.9847567677497864e-05, -3.77679243683815e-05, -3.568828105926514e-05, -3.360863775014877e-05, -3.152899444103241e-05, -2.9449351131916046e-05, -2.7369707822799683e-05, -2.529006451368332e-05, -2.3210421204566956e-05, -2.1130777895450592e-05, -1.905113458633423e-05, -1.6971491277217865e-05, -1.4891847968101501e-05, -1.2812204658985138e-05, -1.0732561349868774e-05, -8.652918040752411e-06, -6.573274731636047e-06, -4.493631422519684e-06, -2.4139881134033203e-06, -3.343448042869568e-07, 1.7452985048294067e-06, 3.82494181394577e-06, 5.904585123062134e-06, 7.984228432178497e-06, 1.006387174129486e-05, 1.2143515050411224e-05, 1.4223158359527588e-05, 1.630280166864395e-05, 1.8382444977760315e-05, 2.046208828687668e-05, 2.2541731595993042e-05, 2.4621374905109406e-05, 2.670101821422577e-05, 2.8780661523342133e-05, 3.0860304832458496e-05, 3.293994814157486e-05, 3.501959145069122e-05, 3.709923475980759e-05, 3.917887806892395e-05, 4.1258521378040314e-05, 4.333816468715668e-05, 4.541780799627304e-05, 4.7497451305389404e-05, 4.957709461450577e-05, 5.165673792362213e-05, 5.3736381232738495e-05, 5.581602454185486e-05, 5.789566785097122e-05, 5.9975311160087585e-05, 6.205495446920395e-05, 6.413459777832031e-05]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 8.0, 8.0, 6.0, 10.0, 8.0, 10.0, 13.0, 19.0, 36.0, 47.0, 61.0, 70.0, 123.0, 170.0, 333.0, 523.0, 1045.0, 2031.0, 4372.0, 10691.0, 31776.0, 128043.0, 667676.0, 145715.0, 34934.0, 11249.0, 4833.0, 2100.0, 1159.0, 540.0, 343.0, 161.0, 127.0, 85.0, 53.0, 47.0, 32.0, 19.0, 15.0, 17.0, 11.0, 5.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0], "bins": [-0.0001430511474609375, -0.0001390259712934494, -0.0001350007951259613, -0.0001309756189584732, -0.0001269504427909851, -0.000122925266623497, -0.00011890009045600891, -0.00011487491428852081, -0.00011084973812103271, -0.00010682456195354462, -0.00010279938578605652, -9.877420961856842e-05, -9.474903345108032e-05, -9.072385728359222e-05, -8.669868111610413e-05, -8.267350494861603e-05, -7.864832878112793e-05, -7.462315261363983e-05, -7.059797644615173e-05, -6.657280027866364e-05, -6.254762411117554e-05, -5.852244794368744e-05, -5.449727177619934e-05, -5.047209560871124e-05, -4.6446919441223145e-05, -4.2421743273735046e-05, -3.839656710624695e-05, -3.437139093875885e-05, -3.0346214771270752e-05, -2.6321038603782654e-05, -2.2295862436294556e-05, -1.8270686268806458e-05, -1.424551010131836e-05, -1.0220333933830261e-05, -6.195157766342163e-06, -2.169981598854065e-06, 1.8551945686340332e-06, 5.880370736122131e-06, 9.90554690361023e-06, 1.3930723071098328e-05, 1.7955899238586426e-05, 2.1981075406074524e-05, 2.6006251573562622e-05, 3.003142774105072e-05, 3.405660390853882e-05, 3.8081780076026917e-05, 4.2106956243515015e-05, 4.613213241100311e-05, 5.015730857849121e-05, 5.418248474597931e-05, 5.820766091346741e-05, 6.22328370809555e-05, 6.62580132484436e-05, 7.02831894159317e-05, 7.43083655834198e-05, 7.83335417509079e-05, 8.2358717918396e-05, 8.63838940858841e-05, 9.040907025337219e-05, 9.443424642086029e-05, 9.845942258834839e-05, 0.00010248459875583649, 0.00010650977492332458, 0.00011053495109081268, 0.00011456012725830078]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 11.0, 25.0, 19.0, 23.0, 74.0, 85.0, 111.0, 108.0, 130.0, 120.0, 67.0, 72.0, 40.0, 35.0, 18.0, 14.0, 10.0, 5.0, 9.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633167266845703e-05, -1.5566125512123108e-05, -1.4800578355789185e-05, -1.4035031199455261e-05, -1.3269484043121338e-05, -1.2503936886787415e-05, -1.1738389730453491e-05, -1.0972842574119568e-05, -1.0207295417785645e-05, -9.441748261451721e-06, -8.676201105117798e-06, -7.910653948783875e-06, -7.145106792449951e-06, -6.379559636116028e-06, -5.6140124797821045e-06, -4.848465323448181e-06, -4.082918167114258e-06, -3.3173710107803345e-06, -2.551823854446411e-06, -1.7862766981124878e-06, -1.0207295417785645e-06, -2.551823854446411e-07, 5.103647708892822e-07, 1.2759119272232056e-06, 2.041459083557129e-06, 2.8070062398910522e-06, 3.5725533962249756e-06, 4.338100552558899e-06, 5.103647708892822e-06, 5.869194865226746e-06, 6.634742021560669e-06, 7.400289177894592e-06, 8.165836334228516e-06, 8.931383490562439e-06, 9.696930646896362e-06, 1.0462477803230286e-05, 1.1228024959564209e-05, 1.1993572115898132e-05, 1.2759119272232056e-05, 1.3524666428565979e-05, 1.4290213584899902e-05, 1.5055760741233826e-05, 1.582130789756775e-05, 1.6586855053901672e-05, 1.7352402210235596e-05, 1.811794936656952e-05, 1.8883496522903442e-05, 1.9649043679237366e-05, 2.041459083557129e-05, 2.1180137991905212e-05, 2.1945685148239136e-05, 2.271123230457306e-05, 2.3476779460906982e-05, 2.4242326617240906e-05, 2.500787377357483e-05, 2.5773420929908752e-05, 2.6538968086242676e-05, 2.73045152425766e-05, 2.8070062398910522e-05, 2.8835609555244446e-05, 2.960115671157837e-05, 3.0366703867912292e-05, 3.1132251024246216e-05, 3.189779818058014e-05, 3.266334533691406e-05]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 15.0, 20.0, 21.0, 40.0, 55.0, 91.0, 148.0, 176.0, 279.0, 432.0, 694.0, 949.0, 1380.0, 1936.0, 2943.0, 4404.0, 6711.0, 10339.0, 16007.0, 26615.0, 44060.0, 78566.0, 163558.0, 373119.0, 138750.0, 70074.0, 40007.0, 23936.0, 14867.0, 9575.0, 6195.0, 4098.0, 2687.0, 1799.0, 1275.0, 933.0, 583.0, 403.0, 254.0, 159.0, 150.0, 80.0, 61.0, 37.0, 15.0, 24.0, 12.0, 8.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0934810638427734e-05, -2.998020499944687e-05, -2.9025599360466003e-05, -2.8070993721485138e-05, -2.7116388082504272e-05, -2.6161782443523407e-05, -2.520717680454254e-05, -2.4252571165561676e-05, -2.329796552658081e-05, -2.2343359887599945e-05, -2.138875424861908e-05, -2.0434148609638214e-05, -1.947954297065735e-05, -1.8524937331676483e-05, -1.7570331692695618e-05, -1.6615726053714752e-05, -1.5661120414733887e-05, -1.4706514775753021e-05, -1.3751909136772156e-05, -1.279730349779129e-05, -1.1842697858810425e-05, -1.088809221982956e-05, -9.933486580848694e-06, -8.978880941867828e-06, -8.024275302886963e-06, -7.069669663906097e-06, -6.115064024925232e-06, -5.1604583859443665e-06, -4.205852746963501e-06, -3.2512471079826355e-06, -2.29664146900177e-06, -1.3420358300209045e-06, -3.8743019104003906e-07, 5.671754479408264e-07, 1.521781086921692e-06, 2.4763867259025574e-06, 3.430992364883423e-06, 4.385598003864288e-06, 5.340203642845154e-06, 6.294809281826019e-06, 7.249414920806885e-06, 8.20402055978775e-06, 9.158626198768616e-06, 1.0113231837749481e-05, 1.1067837476730347e-05, 1.2022443115711212e-05, 1.2977048754692078e-05, 1.3931654393672943e-05, 1.4886260032653809e-05, 1.5840865671634674e-05, 1.679547131061554e-05, 1.7750076949596405e-05, 1.870468258857727e-05, 1.9659288227558136e-05, 2.0613893866539e-05, 2.1568499505519867e-05, 2.2523105144500732e-05, 2.3477710783481598e-05, 2.4432316422462463e-05, 2.538692206144333e-05, 2.6341527700424194e-05, 2.729613333940506e-05, 2.8250738978385925e-05, 2.920534461736679e-05, 3.0159950256347656e-05]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 3.0, 6.0, 3.0, 10.0, 10.0, 9.0, 12.0, 14.0, 20.0, 22.0, 22.0, 19.0, 27.0, 33.0, 28.0, 37.0, 27.0, 29.0, 45.0, 35.0, 44.0, 48.0, 43.0, 46.0, 30.0, 29.0, 44.0, 32.0, 33.0, 36.0, 21.0, 24.0, 24.0, 27.0, 18.0, 11.0, 8.0, 8.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.8370879590511322e-05, -2.7475878596305847e-05, -2.6580877602100372e-05, -2.5685876607894897e-05, -2.4790875613689423e-05, -2.3895874619483948e-05, -2.3000873625278473e-05, -2.2105872631072998e-05, -2.1210871636867523e-05, -2.031587064266205e-05, -1.9420869648456573e-05, -1.85258686542511e-05, -1.7630867660045624e-05, -1.673586666584015e-05, -1.5840865671634674e-05, -1.49458646774292e-05, -1.4050863683223724e-05, -1.315586268901825e-05, -1.2260861694812775e-05, -1.13658607006073e-05, -1.0470859706401825e-05, -9.57585871219635e-06, -8.680857717990875e-06, -7.7858567237854e-06, -6.8908557295799255e-06, -5.995854735374451e-06, -5.100853741168976e-06, -4.205852746963501e-06, -3.310851752758026e-06, -2.4158507585525513e-06, -1.5208497643470764e-06, -6.258487701416016e-07, 2.691522240638733e-07, 1.1641532182693481e-06, 2.059154212474823e-06, 2.954155206680298e-06, 3.849156200885773e-06, 4.7441571950912476e-06, 5.639158189296722e-06, 6.534159183502197e-06, 7.429160177707672e-06, 8.324161171913147e-06, 9.219162166118622e-06, 1.0114163160324097e-05, 1.1009164154529572e-05, 1.1904165148735046e-05, 1.2799166142940521e-05, 1.3694167137145996e-05, 1.4589168131351471e-05, 1.5484169125556946e-05, 1.637917011976242e-05, 1.7274171113967896e-05, 1.816917210817337e-05, 1.9064173102378845e-05, 1.995917409658432e-05, 2.0854175090789795e-05, 2.174917608499527e-05, 2.2644177079200745e-05, 2.353917807340622e-05, 2.4434179067611694e-05, 2.532918006181717e-05, 2.6224181056022644e-05, 2.711918205022812e-05, 2.8014183044433594e-05]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 2.0, 7.0, 3.0, 10.0, 11.0, 25.0, 22.0, 34.0, 43.0, 102.0, 91.0, 206.0, 224.0, 504.0, 543.0, 1256.0, 1570.0, 4014.0, 4996.0, 15350.0, 22524.0, 96887.0, 243548.0, 426237.0, 159677.0, 32346.0, 21011.0, 6412.0, 5077.0, 1900.0, 1665.0, 652.0, 661.0, 268.0, 252.0, 109.0, 122.0, 43.0, 52.0, 30.0, 24.0, 7.0, 13.0, 7.0, 11.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.620291292667389e-06, -4.472211003303528e-06, -4.324130713939667e-06, -4.176050424575806e-06, -4.027970135211945e-06, -3.8798898458480835e-06, -3.7318095564842224e-06, -3.5837292671203613e-06, -3.4356489777565002e-06, -3.287568688392639e-06, -3.139488399028778e-06, -2.991408109664917e-06, -2.843327820301056e-06, -2.695247530937195e-06, -2.5471672415733337e-06, -2.3990869522094727e-06, -2.2510066628456116e-06, -2.1029263734817505e-06, -1.9548460841178894e-06, -1.8067657947540283e-06, -1.6586855053901672e-06, -1.5106052160263062e-06, -1.362524926662445e-06, -1.214444637298584e-06, -1.066364347934723e-06, -9.182840585708618e-07, -7.702037692070007e-07, -6.221234798431396e-07, -4.7404319047927856e-07, -3.259629011154175e-07, -1.778826117515564e-07, -2.9802322387695312e-08, 1.1827796697616577e-07, 2.6635825634002686e-07, 4.1443854570388794e-07, 5.62518835067749e-07, 7.105991244316101e-07, 8.586794137954712e-07, 1.0067597031593323e-06, 1.1548399925231934e-06, 1.3029202818870544e-06, 1.4510005712509155e-06, 1.5990808606147766e-06, 1.7471611499786377e-06, 1.8952414393424988e-06, 2.04332172870636e-06, 2.191402018070221e-06, 2.339482307434082e-06, 2.487562596797943e-06, 2.635642886161804e-06, 2.7837231755256653e-06, 2.9318034648895264e-06, 3.0798837542533875e-06, 3.2279640436172485e-06, 3.3760443329811096e-06, 3.5241246223449707e-06, 3.6722049117088318e-06, 3.820285201072693e-06, 3.968365490436554e-06, 4.116445779800415e-06, 4.264526069164276e-06, 4.412606358528137e-06, 4.560686647891998e-06, 4.708766937255859e-06]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 7.0, 7.0, 4.0, 11.0, 6.0, 0.0, 12.0, 20.0, 36.0, 31.0, 46.0, 60.0, 87.0, 110.0, 116.0, 111.0, 92.0, 66.0, 47.0, 45.0, 22.0, 0.0, 17.0, 13.0, 12.0, 5.0, 5.0, 8.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.2649765014648438e-06, -2.209097146987915e-06, -2.1532177925109863e-06, -2.0973384380340576e-06, -2.041459083557129e-06, -1.9855797290802e-06, -1.9297003746032715e-06, -1.8738210201263428e-06, -1.817941665649414e-06, -1.7620623111724854e-06, -1.7061829566955566e-06, -1.650303602218628e-06, -1.5944242477416992e-06, -1.5385448932647705e-06, -1.4826655387878418e-06, -1.426786184310913e-06, -1.3709068298339844e-06, -1.3150274753570557e-06, -1.259148120880127e-06, -1.2032687664031982e-06, -1.1473894119262695e-06, -1.0915100574493408e-06, -1.0356307029724121e-06, -9.797513484954834e-07, -9.238719940185547e-07, -8.67992639541626e-07, -8.121132850646973e-07, -7.562339305877686e-07, -7.003545761108398e-07, -6.444752216339111e-07, -5.885958671569824e-07, -5.327165126800537e-07, -4.76837158203125e-07, -4.209578037261963e-07, -3.650784492492676e-07, -3.0919909477233887e-07, -2.5331974029541016e-07, -1.9744038581848145e-07, -1.4156103134155273e-07, -8.568167686462402e-08, -2.9802322387695312e-08, 2.60770320892334e-08, 8.195638656616211e-08, 1.3783574104309082e-07, 1.9371509552001953e-07, 2.4959444999694824e-07, 3.0547380447387695e-07, 3.6135315895080566e-07, 4.172325134277344e-07, 4.731118679046631e-07, 5.289912223815918e-07, 5.848705768585205e-07, 6.407499313354492e-07, 6.966292858123779e-07, 7.525086402893066e-07, 8.083879947662354e-07, 8.642673492431641e-07, 9.201467037200928e-07, 9.760260581970215e-07, 1.0319054126739502e-06, 1.087784767150879e-06, 1.1436641216278076e-06, 1.1995434761047363e-06, 1.255422830581665e-06, 1.3113021850585938e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 11.0, 17.0, 36.0, 30.0, 60.0, 97.0, 57.0, 200.0, 323.0, 546.0, 405.0, 1166.0, 1910.0, 3470.0, 2545.0, 8339.0, 16867.0, 38607.0, 39291.0, 243373.0, 502802.0, 73833.0, 63434.0, 25124.0, 11673.0, 3424.0, 4443.0, 2578.0, 1509.0, 530.0, 730.0, 401.0, 279.0, 83.0, 120.0, 72.0, 28.0, 53.0, 30.0, 22.0, 6.0, 13.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.337860107421875e-06, -3.234483301639557e-06, -3.1311064958572388e-06, -3.0277296900749207e-06, -2.9243528842926025e-06, -2.8209760785102844e-06, -2.7175992727279663e-06, -2.614222466945648e-06, -2.51084566116333e-06, -2.407468855381012e-06, -2.304092049598694e-06, -2.2007152438163757e-06, -2.0973384380340576e-06, -1.9939616322517395e-06, -1.8905848264694214e-06, -1.7872080206871033e-06, -1.6838312149047852e-06, -1.580454409122467e-06, -1.477077603340149e-06, -1.3737007975578308e-06, -1.2703239917755127e-06, -1.1669471859931946e-06, -1.0635703802108765e-06, -9.601935744285583e-07, -8.568167686462402e-07, -7.534399628639221e-07, -6.50063157081604e-07, -5.466863512992859e-07, -4.4330954551696777e-07, -3.3993273973464966e-07, -2.3655593395233154e-07, -1.3317912817001343e-07, -2.9802322387695312e-08, 7.35744833946228e-08, 1.7695128917694092e-07, 2.8032809495925903e-07, 3.8370490074157715e-07, 4.870817065238953e-07, 5.904585123062134e-07, 6.938353180885315e-07, 7.972121238708496e-07, 9.005889296531677e-07, 1.0039657354354858e-06, 1.107342541217804e-06, 1.210719347000122e-06, 1.3140961527824402e-06, 1.4174729585647583e-06, 1.5208497643470764e-06, 1.6242265701293945e-06, 1.7276033759117126e-06, 1.8309801816940308e-06, 1.934356987476349e-06, 2.037733793258667e-06, 2.141110599040985e-06, 2.2444874048233032e-06, 2.3478642106056213e-06, 2.4512410163879395e-06, 2.5546178221702576e-06, 2.6579946279525757e-06, 2.761371433734894e-06, 2.864748239517212e-06, 2.96812504529953e-06, 3.071501851081848e-06, 3.1748786568641663e-06, 3.2782554626464844e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 2.0, 2.0, 4.0, 10.0, 5.0, 5.0, 4.0, 11.0, 30.0, 21.0, 13.0, 18.0, 41.0, 23.0, 30.0, 34.0, 104.0, 64.0, 62.0, 74.0, 107.0, 37.0, 47.0, 35.0, 28.0, 56.0, 26.0, 12.0, 12.0, 15.0, 7.0, 6.0, 6.0, 9.0, 5.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.9529834389686584e-06, -1.8794089555740356e-06, -1.8058344721794128e-06, -1.73225998878479e-06, -1.6586855053901672e-06, -1.5851110219955444e-06, -1.5115365386009216e-06, -1.4379620552062988e-06, -1.364387571811676e-06, -1.2908130884170532e-06, -1.2172386050224304e-06, -1.1436641216278076e-06, -1.0700896382331848e-06, -9.96515154838562e-07, -9.229406714439392e-07, -8.493661880493164e-07, -7.757917046546936e-07, -7.022172212600708e-07, -6.28642737865448e-07, -5.550682544708252e-07, -4.814937710762024e-07, -4.079192876815796e-07, -3.343448042869568e-07, -2.60770320892334e-07, -1.8719583749771118e-07, -1.1362135410308838e-07, -4.0046870708465576e-08, 3.3527612686157227e-08, 1.0710209608078003e-07, 1.8067657947540283e-07, 2.5425106287002563e-07, 3.2782554626464844e-07, 4.0140002965927124e-07, 4.7497451305389404e-07, 5.485489964485168e-07, 6.221234798431396e-07, 6.956979632377625e-07, 7.692724466323853e-07, 8.428469300270081e-07, 9.164214134216309e-07, 9.899958968162537e-07, 1.0635703802108765e-06, 1.1371448636054993e-06, 1.210719347000122e-06, 1.2842938303947449e-06, 1.3578683137893677e-06, 1.4314427971839905e-06, 1.5050172805786133e-06, 1.578591763973236e-06, 1.6521662473678589e-06, 1.7257407307624817e-06, 1.7993152141571045e-06, 1.8728896975517273e-06, 1.94646418094635e-06, 2.020038664340973e-06, 2.0936131477355957e-06, 2.1671876311302185e-06, 2.2407621145248413e-06, 2.314336597919464e-06, 2.387911081314087e-06, 2.4614855647087097e-06, 2.5350600481033325e-06, 2.6086345314979553e-06, 2.682209014892578e-06]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 9.0, 17.0, 14.0, 26.0, 49.0, 115.0, 206.0, 153.0, 106.0, 62.0, 62.0, 47.0, 26.0, 23.0, 14.0, 13.0, 10.0, 7.0, 7.0, 11.0, 4.0, 2.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.647011756896973e-05, -9.062661411007866e-05, -8.47831106511876e-05, -7.893961446825415e-05, -7.309611100936309e-05, -6.725260755047202e-05, -6.140911136753857e-05, -5.556560790864751e-05, -4.9722104449756444e-05, -4.387860099086538e-05, -3.803510116995312e-05, -3.2191601349040866e-05, -2.6348097890149802e-05, -2.050459625024814e-05, -1.4661094610346481e-05, -8.817594789434224e-06, -2.9740913305431604e-06, 2.8694103093585e-06, 8.71291194926016e-06, 1.455641358916182e-05, 2.039991522906348e-05, 2.624341686896514e-05, 3.20869185088668e-05, 3.793041832977906e-05, 4.377392178867012e-05, 4.9617425247561187e-05, 5.5460925068473443e-05, 6.13044248893857e-05, 6.714792834827676e-05, 7.299143180716783e-05, 7.883492799010128e-05, 8.467843144899234e-05, 9.05219349078834e-05, 9.636543836677447e-05, 0.00010220894182566553, 0.00010805243800859898, 0.00011389594146749005, 0.00011973944492638111, 0.00012558294110931456, 0.000131426437292248, 0.0001372699480270967, 0.00014311344421003014, 0.00014895695494487882, 0.00015480045112781227, 0.00016064394731074572, 0.0001664874580455944, 0.00017233095422852784, 0.00017817446496337652, 0.00018401796114630997, 0.00018986145732924342, 0.0001957049680640921, 0.00020154846424702555, 0.00020739197498187423, 0.00021323547116480768, 0.00021907896734774113, 0.00022492246353067458, 0.00023076597426552325, 0.0002366094704484567, 0.00024245298118330538, 0.00024829647736623883, 0.0002541399735491723, 0.00025998346973210573, 0.00026582699501886964, 0.0002716704912018031, 0.00027751398738473654]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 8.0, 6.0, 8.0, 7.0, 17.0, 10.0, 16.0, 22.0, 19.0, 30.0, 17.0, 31.0, 29.0, 34.0, 30.0, 35.0, 43.0, 40.0, 47.0, 42.0, 31.0, 40.0, 52.0, 30.0, 41.0, 31.0, 37.0, 25.0, 31.0, 28.0, 27.0, 23.0, 15.0, 11.0, 18.0, 12.0, 4.0, 12.0, 4.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-9.578466415405273e-05, -9.285099804401398e-05, -8.991733193397522e-05, -8.698366582393646e-05, -8.40499997138977e-05, -8.111633360385895e-05, -7.818266749382019e-05, -7.524900138378143e-05, -7.231533527374268e-05, -6.938166916370392e-05, -6.644800305366516e-05, -6.35143369436264e-05, -6.0580670833587646e-05, -5.764700472354889e-05, -5.471333861351013e-05, -5.1779672503471375e-05, -4.884600639343262e-05, -4.591234028339386e-05, -4.29786741733551e-05, -4.0045008063316345e-05, -3.711134195327759e-05, -3.417767584323883e-05, -3.124400973320007e-05, -2.8310343623161316e-05, -2.537667751312256e-05, -2.24430114030838e-05, -1.9509345293045044e-05, -1.6575679183006287e-05, -1.364201307296753e-05, -1.0708346962928772e-05, -7.774680852890015e-06, -4.841014742851257e-06, -1.9073486328125e-06, 1.0263174772262573e-06, 3.959983587265015e-06, 6.893649697303772e-06, 9.82731580734253e-06, 1.2760981917381287e-05, 1.5694648027420044e-05, 1.86283141374588e-05, 2.156198024749756e-05, 2.4495646357536316e-05, 2.7429312467575073e-05, 3.036297857761383e-05, 3.329664468765259e-05, 3.6230310797691345e-05, 3.91639769077301e-05, 4.209764301776886e-05, 4.503130912780762e-05, 4.7964975237846375e-05, 5.089864134788513e-05, 5.383230745792389e-05, 5.6765973567962646e-05, 5.9699639678001404e-05, 6.263330578804016e-05, 6.556697189807892e-05, 6.850063800811768e-05, 7.143430411815643e-05, 7.436797022819519e-05, 7.730163633823395e-05, 8.02353024482727e-05, 8.316896855831146e-05, 8.610263466835022e-05, 8.903630077838898e-05, 9.196996688842773e-05]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 13.0, 23.0, 45.0, 66.0, 144.0, 255.0, 549.0, 966.0, 2006.0, 4693.0, 13169.0, 59508.0, 3919744.0, 161384.0, 18738.0, 6540.0, 2825.0, 1491.0, 773.0, 472.0, 266.0, 201.0, 122.0, 82.0, 47.0, 36.0, 25.0, 19.0, 18.0, 9.0, 6.0, 7.0, 8.0, 4.0, 7.0, 8.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.793571472167969e-05, -5.513150244951248e-05, -5.2327290177345276e-05, -4.952307790517807e-05, -4.6718865633010864e-05, -4.391465336084366e-05, -4.111044108867645e-05, -3.830622881650925e-05, -3.550201654434204e-05, -3.2697804272174835e-05, -2.989359200000763e-05, -2.7089379727840424e-05, -2.4285167455673218e-05, -2.1480955183506012e-05, -1.8676742911338806e-05, -1.58725306391716e-05, -1.3068318367004395e-05, -1.0264106094837189e-05, -7.459893822669983e-06, -4.655681550502777e-06, -1.8514692783355713e-06, 9.527429938316345e-07, 3.7569552659988403e-06, 6.561167538166046e-06, 9.365379810333252e-06, 1.2169592082500458e-05, 1.4973804354667664e-05, 1.777801662683487e-05, 2.0582228899002075e-05, 2.338644117116928e-05, 2.6190653443336487e-05, 2.8994865715503693e-05, 3.17990779876709e-05, 3.4603290259838104e-05, 3.740750253200531e-05, 4.0211714804172516e-05, 4.301592707633972e-05, 4.582013934850693e-05, 4.862435162067413e-05, 5.142856389284134e-05, 5.4232776165008545e-05, 5.703698843717575e-05, 5.9841200709342957e-05, 6.264541298151016e-05, 6.544962525367737e-05, 6.825383752584457e-05, 7.105804979801178e-05, 7.386226207017899e-05, 7.666647434234619e-05, 7.94706866145134e-05, 8.22748988866806e-05, 8.507911115884781e-05, 8.788332343101501e-05, 9.068753570318222e-05, 9.349174797534943e-05, 9.629596024751663e-05, 9.910017251968384e-05, 0.00010190438479185104, 0.00010470859706401825, 0.00010751280933618546, 0.00011031702160835266, 0.00011312123388051987, 0.00011592544615268707, 0.00011872965842485428, 0.00012153387069702148]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 8.0, 4.0, 8.0, 13.0, 10.0, 17.0, 22.0, 26.0, 38.0, 63.0, 76.0, 90.0, 101.0, 111.0, 90.0, 79.0, 59.0, 50.0, 38.0, 28.0, 19.0, 9.0, 9.0, 8.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0967254638671875e-05, -1.0334886610507965e-05, -9.702518582344055e-06, -9.070150554180145e-06, -8.437782526016235e-06, -7.805414497852325e-06, -7.1730464696884155e-06, -6.540678441524506e-06, -5.908310413360596e-06, -5.275942385196686e-06, -4.643574357032776e-06, -4.011206328868866e-06, -3.378838300704956e-06, -2.746470272541046e-06, -2.1141022443771362e-06, -1.4817342162132263e-06, -8.493661880493164e-07, -2.169981598854065e-07, 4.153698682785034e-07, 1.0477378964424133e-06, 1.6801059246063232e-06, 2.312473952770233e-06, 2.944841980934143e-06, 3.577210009098053e-06, 4.209578037261963e-06, 4.841946065425873e-06, 5.474314093589783e-06, 6.106682121753693e-06, 6.7390501499176025e-06, 7.3714181780815125e-06, 8.003786206245422e-06, 8.636154234409332e-06, 9.268522262573242e-06, 9.900890290737152e-06, 1.0533258318901062e-05, 1.1165626347064972e-05, 1.1797994375228882e-05, 1.2430362403392792e-05, 1.3062730431556702e-05, 1.3695098459720612e-05, 1.4327466487884521e-05, 1.4959834516048431e-05, 1.559220254421234e-05, 1.622457057237625e-05, 1.685693860054016e-05, 1.748930662870407e-05, 1.812167465686798e-05, 1.875404268503189e-05, 1.93864107131958e-05, 2.001877874135971e-05, 2.065114676952362e-05, 2.128351479768753e-05, 2.191588282585144e-05, 2.254825085401535e-05, 2.318061888217926e-05, 2.381298691034317e-05, 2.444535493850708e-05, 2.507772296667099e-05, 2.57100909948349e-05, 2.634245902299881e-05, 2.697482705116272e-05, 2.760719507932663e-05, 2.823956310749054e-05, 2.887193113565445e-05, 2.950429916381836e-05]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 9.0, 8.0, 17.0, 19.0, 34.0, 47.0, 63.0, 77.0, 149.0, 238.0, 380.0, 563.0, 936.0, 1396.0, 2370.0, 4163.0, 7748.0, 14833.0, 32386.0, 91755.0, 1090632.0, 2759018.0, 116649.0, 35596.0, 16121.0, 7995.0, 4498.0, 2489.0, 1452.0, 958.0, 626.0, 342.0, 242.0, 159.0, 107.0, 56.0, 45.0, 37.0, 17.0, 13.0, 9.0, 10.0, 7.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.522634506225586e-05, -3.4091994166374207e-05, -3.2957643270492554e-05, -3.18232923746109e-05, -3.068894147872925e-05, -2.9554590582847595e-05, -2.8420239686965942e-05, -2.728588879108429e-05, -2.6151537895202637e-05, -2.5017186999320984e-05, -2.388283610343933e-05, -2.2748485207557678e-05, -2.1614134311676025e-05, -2.0479783415794373e-05, -1.934543251991272e-05, -1.8211081624031067e-05, -1.7076730728149414e-05, -1.594237983226776e-05, -1.4808028936386108e-05, -1.3673678040504456e-05, -1.2539327144622803e-05, -1.140497624874115e-05, -1.0270625352859497e-05, -9.136274456977844e-06, -8.001923561096191e-06, -6.8675726652145386e-06, -5.733221769332886e-06, -4.598870873451233e-06, -3.46451997756958e-06, -2.3301690816879272e-06, -1.1958181858062744e-06, -6.146728992462158e-08, 1.0728836059570312e-06, 2.207234501838684e-06, 3.341585397720337e-06, 4.47593629360199e-06, 5.610287189483643e-06, 6.744638085365295e-06, 7.878988981246948e-06, 9.013339877128601e-06, 1.0147690773010254e-05, 1.1282041668891907e-05, 1.241639256477356e-05, 1.3550743460655212e-05, 1.4685094356536865e-05, 1.5819445252418518e-05, 1.695379614830017e-05, 1.8088147044181824e-05, 1.9222497940063477e-05, 2.035684883594513e-05, 2.1491199731826782e-05, 2.2625550627708435e-05, 2.3759901523590088e-05, 2.489425241947174e-05, 2.6028603315353394e-05, 2.7162954211235046e-05, 2.82973051071167e-05, 2.9431656002998352e-05, 3.0566006898880005e-05, 3.170035779476166e-05, 3.283470869064331e-05, 3.396905958652496e-05, 3.5103410482406616e-05, 3.623776137828827e-05, 3.737211227416992e-05]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 10.0, 4.0, 6.0, 7.0, 7.0, 18.0, 12.0, 17.0, 26.0, 28.0, 38.0, 54.0, 85.0, 146.0, 547.0, 1405.0, 955.0, 290.0, 133.0, 62.0, 48.0, 45.0, 25.0, 16.0, 15.0, 11.0, 16.0, 9.0, 8.0, 13.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7358531951904297e-05, -2.644117921590805e-05, -2.5523826479911804e-05, -2.4606473743915558e-05, -2.368912100791931e-05, -2.2771768271923065e-05, -2.185441553592682e-05, -2.0937062799930573e-05, -2.0019710063934326e-05, -1.910235732793808e-05, -1.8185004591941833e-05, -1.7267651855945587e-05, -1.635029911994934e-05, -1.5432946383953094e-05, -1.4515593647956848e-05, -1.3598240911960602e-05, -1.2680888175964355e-05, -1.1763535439968109e-05, -1.0846182703971863e-05, -9.928829967975616e-06, -9.01147723197937e-06, -8.094124495983124e-06, -7.1767717599868774e-06, -6.259419023990631e-06, -5.342066287994385e-06, -4.4247135519981384e-06, -3.507360816001892e-06, -2.5900080800056458e-06, -1.6726553440093994e-06, -7.553026080131531e-07, 1.6205012798309326e-07, 1.0794028639793396e-06, 1.996755599975586e-06, 2.9141083359718323e-06, 3.831461071968079e-06, 4.748813807964325e-06, 5.666166543960571e-06, 6.583519279956818e-06, 7.500872015953064e-06, 8.41822475194931e-06, 9.335577487945557e-06, 1.0252930223941803e-05, 1.117028295993805e-05, 1.2087635695934296e-05, 1.3004988431930542e-05, 1.3922341167926788e-05, 1.4839693903923035e-05, 1.575704663991928e-05, 1.6674399375915527e-05, 1.7591752111911774e-05, 1.850910484790802e-05, 1.9426457583904266e-05, 2.0343810319900513e-05, 2.126116305589676e-05, 2.2178515791893005e-05, 2.3095868527889252e-05, 2.4013221263885498e-05, 2.4930573999881744e-05, 2.584792673587799e-05, 2.6765279471874237e-05, 2.7682632207870483e-05, 2.859998494386673e-05, 2.9517337679862976e-05, 3.0434690415859222e-05, 3.135204315185547e-05]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 9.0, 8.0, 10.0, 18.0, 21.0, 22.0, 42.0, 43.0, 78.0, 102.0, 128.0, 132.0, 85.0, 67.0, 57.0, 33.0, 32.0, 24.0, 14.0, 10.0, 10.0, 12.0, 9.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012851697101723403, -0.0001244941959157586, -0.00012047141353832558, -0.00011644863843685016, -0.00011242585605941713, -0.00010840308095794171, -0.0001043803058564663, -0.00010035753075499088, -9.633474837755784e-05, -9.231197327608243e-05, -8.82891908986494e-05, -8.426641579717398e-05, -8.024364069569856e-05, -7.622085831826553e-05, -7.219808321679011e-05, -6.817530083935708e-05, -6.415252573788166e-05, -6.0129746998427436e-05, -5.610696825897321e-05, -5.2084193157497793e-05, -4.806141441804357e-05, -4.4038635678589344e-05, -4.0015860577113926e-05, -3.59930818376597e-05, -3.197030309820548e-05, -2.7947524358751252e-05, -2.392474743828643e-05, -1.990197051782161e-05, -1.5879191778367385e-05, -1.185641303891316e-05, -7.83363611844834e-06, -3.8108591979835182e-06, 2.1191954147070646e-07, 4.234697371430229e-06, 8.257475201389752e-06, 1.2280253031349275e-05, 1.6303030861308798e-05, 2.0325809600763023e-05, 2.4348586521227844e-05, 2.8371363441692665e-05, 3.239414218114689e-05, 3.6416920920601115e-05, 4.043969966005534e-05, 4.446247476153076e-05, 4.848525350098498e-05, 5.2508032240439206e-05, 5.6530807341914624e-05, 6.055358608136885e-05, 6.457636482082307e-05, 6.859913992229849e-05, 7.262192229973152e-05, 7.664469740120694e-05, 8.066747977863997e-05, 8.469025488011539e-05, 8.871302998159081e-05, 9.273580508306623e-05, 9.675858746049926e-05, 0.00010078136256197467, 0.0001048041449394077, 0.00010882692004088312, 0.00011284969514235854, 0.00011687247751979157, 0.00012089525262126699, 0.00012491803499870002, 0.00012894081010017544]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 8.0, 5.0, 5.0, 4.0, 9.0, 16.0, 19.0, 26.0, 20.0, 21.0, 29.0, 33.0, 40.0, 48.0, 39.0, 44.0, 52.0, 59.0, 45.0, 45.0, 35.0, 51.0, 39.0, 49.0, 42.0, 32.0, 32.0, 25.0, 25.0, 27.0, 13.0, 14.0, 17.0, 6.0, 8.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.586313247680664e-05, -6.340816617012024e-05, -6.095319986343384e-05, -5.8498233556747437e-05, -5.6043267250061035e-05, -5.3588300943374634e-05, -5.113333463668823e-05, -4.867836833000183e-05, -4.622340202331543e-05, -4.376843571662903e-05, -4.131346940994263e-05, -3.8858503103256226e-05, -3.6403536796569824e-05, -3.394857048988342e-05, -3.149360418319702e-05, -2.903863787651062e-05, -2.658367156982422e-05, -2.4128705263137817e-05, -2.1673738956451416e-05, -1.9218772649765015e-05, -1.6763806343078613e-05, -1.4308840036392212e-05, -1.185387372970581e-05, -9.39890742301941e-06, -6.943941116333008e-06, -4.4889748096466064e-06, -2.034008502960205e-06, 4.209578037261963e-07, 2.8759241104125977e-06, 5.330890417098999e-06, 7.7858567237854e-06, 1.0240823030471802e-05, 1.2695789337158203e-05, 1.5150755643844604e-05, 1.7605721950531006e-05, 2.0060688257217407e-05, 2.251565456390381e-05, 2.497062087059021e-05, 2.742558717727661e-05, 2.9880553483963013e-05, 3.2335519790649414e-05, 3.4790486097335815e-05, 3.724545240402222e-05, 3.970041871070862e-05, 4.215538501739502e-05, 4.461035132408142e-05, 4.706531763076782e-05, 4.9520283937454224e-05, 5.1975250244140625e-05, 5.4430216550827026e-05, 5.688518285751343e-05, 5.934014916419983e-05, 6.179511547088623e-05, 6.425008177757263e-05, 6.670504808425903e-05, 6.916001439094543e-05, 7.161498069763184e-05, 7.406994700431824e-05, 7.652491331100464e-05, 7.897987961769104e-05, 8.143484592437744e-05, 8.388981223106384e-05, 8.634477853775024e-05, 8.879974484443665e-05, 9.125471115112305e-05]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 10.0, 9.0, 12.0, 22.0, 28.0, 44.0, 50.0, 78.0, 130.0, 230.0, 452.0, 885.0, 1863.0, 4218.0, 10506.0, 31957.0, 142292.0, 690704.0, 119787.0, 28229.0, 9609.0, 3906.0, 1707.0, 791.0, 418.0, 223.0, 140.0, 77.0, 46.0, 27.0, 29.0, 16.0, 12.0, 14.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00012254714965820312, -0.00011838600039482117, -0.00011422485113143921, -0.00011006370186805725, -0.00010590255260467529, -0.00010174140334129333, -9.758025407791138e-05, -9.341910481452942e-05, -8.925795555114746e-05, -8.50968062877655e-05, -8.093565702438354e-05, -7.677450776100159e-05, -7.261335849761963e-05, -6.845220923423767e-05, -6.429105997085571e-05, -6.0129910707473755e-05, -5.59687614440918e-05, -5.180761218070984e-05, -4.764646291732788e-05, -4.348531365394592e-05, -3.9324164390563965e-05, -3.516301512718201e-05, -3.100186586380005e-05, -2.684071660041809e-05, -2.2679567337036133e-05, -1.8518418073654175e-05, -1.4357268810272217e-05, -1.0196119546890259e-05, -6.034970283508301e-06, -1.8738210201263428e-06, 2.2873282432556152e-06, 6.448477506637573e-06, 1.0609626770019531e-05, 1.477077603340149e-05, 1.8931925296783447e-05, 2.3093074560165405e-05, 2.7254223823547363e-05, 3.141537308692932e-05, 3.557652235031128e-05, 3.973767161369324e-05, 4.3898820877075195e-05, 4.805997014045715e-05, 5.222111940383911e-05, 5.638226866722107e-05, 6.054341793060303e-05, 6.470456719398499e-05, 6.886571645736694e-05, 7.30268657207489e-05, 7.718801498413086e-05, 8.134916424751282e-05, 8.551031351089478e-05, 8.967146277427673e-05, 9.383261203765869e-05, 9.799376130104065e-05, 0.00010215491056442261, 0.00010631605982780457, 0.00011047720909118652, 0.00011463835835456848, 0.00011879950761795044, 0.0001229606568813324, 0.00012712180614471436, 0.0001312829554080963, 0.00013544410467147827, 0.00013960525393486023, 0.0001437664031982422]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 4.0, 10.0, 16.0, 17.0, 18.0, 39.0, 47.0, 72.0, 110.0, 95.0, 126.0, 112.0, 89.0, 63.0, 41.0, 46.0, 20.0, 26.0, 9.0, 8.0, 8.0, 5.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5437602996826172e-05, -1.4727003872394562e-05, -1.4016404747962952e-05, -1.3305805623531342e-05, -1.2595206499099731e-05, -1.1884607374668121e-05, -1.1174008250236511e-05, -1.0463409125804901e-05, -9.752810001373291e-06, -9.042210876941681e-06, -8.33161175251007e-06, -7.621012628078461e-06, -6.910413503646851e-06, -6.1998143792152405e-06, -5.48921525478363e-06, -4.77861613035202e-06, -4.06801700592041e-06, -3.3574178814888e-06, -2.64681875705719e-06, -1.93621963262558e-06, -1.2256205081939697e-06, -5.150213837623596e-07, 1.955777406692505e-07, 9.061768651008606e-07, 1.6167759895324707e-06, 2.327375113964081e-06, 3.037974238395691e-06, 3.748573362827301e-06, 4.459172487258911e-06, 5.169771611690521e-06, 5.880370736122131e-06, 6.5909698605537415e-06, 7.3015689849853516e-06, 8.012168109416962e-06, 8.722767233848572e-06, 9.433366358280182e-06, 1.0143965482711792e-05, 1.0854564607143402e-05, 1.1565163731575012e-05, 1.2275762856006622e-05, 1.2986361980438232e-05, 1.3696961104869843e-05, 1.4407560229301453e-05, 1.5118159353733063e-05, 1.5828758478164673e-05, 1.6539357602596283e-05, 1.7249956727027893e-05, 1.7960555851459503e-05, 1.8671154975891113e-05, 1.9381754100322723e-05, 2.0092353224754333e-05, 2.0802952349185944e-05, 2.1513551473617554e-05, 2.2224150598049164e-05, 2.2934749722480774e-05, 2.3645348846912384e-05, 2.4355947971343994e-05, 2.5066547095775604e-05, 2.5777146220207214e-05, 2.6487745344638824e-05, 2.7198344469070435e-05, 2.7908943593502045e-05, 2.8619542717933655e-05, 2.9330141842365265e-05, 3.0040740966796875e-05]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 16.0, 16.0, 27.0, 52.0, 85.0, 116.0, 205.0, 337.0, 470.0, 788.0, 1137.0, 1855.0, 3065.0, 5435.0, 8669.0, 14569.0, 25141.0, 45503.0, 88560.0, 220963.0, 386990.0, 114375.0, 55948.0, 30815.0, 17247.0, 9999.0, 6420.0, 3679.0, 2223.0, 1423.0, 865.0, 558.0, 364.0, 228.0, 147.0, 89.0, 49.0, 42.0, 21.0, 20.0, 12.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4809112548828125e-05, -3.372691571712494e-05, -3.264471888542175e-05, -3.156252205371857e-05, -3.048032522201538e-05, -2.9398128390312195e-05, -2.831593155860901e-05, -2.7233734726905823e-05, -2.6151537895202637e-05, -2.506934106349945e-05, -2.3987144231796265e-05, -2.290494740009308e-05, -2.1822750568389893e-05, -2.0740553736686707e-05, -1.965835690498352e-05, -1.8576160073280334e-05, -1.749396324157715e-05, -1.6411766409873962e-05, -1.5329569578170776e-05, -1.424737274646759e-05, -1.3165175914764404e-05, -1.2082979083061218e-05, -1.1000782251358032e-05, -9.918585419654846e-06, -8.83638858795166e-06, -7.754191756248474e-06, -6.671994924545288e-06, -5.589798092842102e-06, -4.507601261138916e-06, -3.42540442943573e-06, -2.343207597732544e-06, -1.261010766029358e-06, -1.7881393432617188e-07, 9.033828973770142e-07, 1.9855797290802e-06, 3.0677765607833862e-06, 4.149973392486572e-06, 5.232170224189758e-06, 6.314367055892944e-06, 7.39656388759613e-06, 8.478760719299316e-06, 9.560957551002502e-06, 1.0643154382705688e-05, 1.1725351214408875e-05, 1.280754804611206e-05, 1.3889744877815247e-05, 1.4971941709518433e-05, 1.605413854122162e-05, 1.7136335372924805e-05, 1.821853220462799e-05, 1.9300729036331177e-05, 2.0382925868034363e-05, 2.146512269973755e-05, 2.2547319531440735e-05, 2.362951636314392e-05, 2.4711713194847107e-05, 2.5793910026550293e-05, 2.687610685825348e-05, 2.7958303689956665e-05, 2.904050052165985e-05, 3.0122697353363037e-05, 3.120489418506622e-05, 3.228709101676941e-05, 3.3369287848472595e-05, 3.445148468017578e-05]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 3.0, 5.0, 12.0, 8.0, 18.0, 19.0, 19.0, 24.0, 26.0, 25.0, 28.0, 44.0, 40.0, 47.0, 40.0, 52.0, 55.0, 41.0, 65.0, 52.0, 45.0, 43.0, 32.0, 29.0, 34.0, 30.0, 21.0, 23.0, 26.0, 24.0, 22.0, 7.0, 6.0, 4.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7610530853271484e-05, -3.655627369880676e-05, -3.550201654434204e-05, -3.444775938987732e-05, -3.33935022354126e-05, -3.2339245080947876e-05, -3.1284987926483154e-05, -3.0230730772018433e-05, -2.917647361755371e-05, -2.812221646308899e-05, -2.7067959308624268e-05, -2.6013702154159546e-05, -2.4959444999694824e-05, -2.3905187845230103e-05, -2.285093069076538e-05, -2.179667353630066e-05, -2.0742416381835938e-05, -1.9688159227371216e-05, -1.8633902072906494e-05, -1.7579644918441772e-05, -1.652538776397705e-05, -1.547113060951233e-05, -1.4416873455047607e-05, -1.3362616300582886e-05, -1.2308359146118164e-05, -1.1254101991653442e-05, -1.019984483718872e-05, -9.145587682723999e-06, -8.091330528259277e-06, -7.037073373794556e-06, -5.982816219329834e-06, -4.928559064865112e-06, -3.874301910400391e-06, -2.820044755935669e-06, -1.7657876014709473e-06, -7.115304470062256e-07, 3.427267074584961e-07, 1.3969838619232178e-06, 2.4512410163879395e-06, 3.505498170852661e-06, 4.559755325317383e-06, 5.6140124797821045e-06, 6.668269634246826e-06, 7.722526788711548e-06, 8.77678394317627e-06, 9.831041097640991e-06, 1.0885298252105713e-05, 1.1939555406570435e-05, 1.2993812561035156e-05, 1.4048069715499878e-05, 1.51023268699646e-05, 1.615658402442932e-05, 1.7210841178894043e-05, 1.8265098333358765e-05, 1.9319355487823486e-05, 2.0373612642288208e-05, 2.142786979675293e-05, 2.248212695121765e-05, 2.3536384105682373e-05, 2.4590641260147095e-05, 2.5644898414611816e-05, 2.6699155569076538e-05, 2.775341272354126e-05, 2.880766987800598e-05, 2.9861927032470703e-05]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 8.0, 12.0, 22.0, 30.0, 36.0, 69.0, 86.0, 182.0, 223.0, 396.0, 950.0, 1347.0, 4034.0, 7387.0, 18827.0, 110404.0, 508337.0, 331497.0, 39828.0, 15837.0, 4297.0, 2004.0, 1308.0, 518.0, 383.0, 159.0, 112.0, 104.0, 42.0, 30.0, 18.0, 21.0, 12.0, 13.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.854534149169922e-06, -6.6515058279037476e-06, -6.448477506637573e-06, -6.245449185371399e-06, -6.042420864105225e-06, -5.83939254283905e-06, -5.636364221572876e-06, -5.433335900306702e-06, -5.230307579040527e-06, -5.027279257774353e-06, -4.824250936508179e-06, -4.621222615242004e-06, -4.41819429397583e-06, -4.215165972709656e-06, -4.0121376514434814e-06, -3.809109330177307e-06, -3.606081008911133e-06, -3.4030526876449585e-06, -3.200024366378784e-06, -2.99699604511261e-06, -2.7939677238464355e-06, -2.5909394025802612e-06, -2.387911081314087e-06, -2.1848827600479126e-06, -1.9818544387817383e-06, -1.778826117515564e-06, -1.5757977962493896e-06, -1.3727694749832153e-06, -1.169741153717041e-06, -9.667128324508667e-07, -7.636845111846924e-07, -5.606561899185181e-07, -3.5762786865234375e-07, -1.5459954738616943e-07, 4.842877388000488e-08, 2.514570951461792e-07, 4.544854164123535e-07, 6.575137376785278e-07, 8.605420589447021e-07, 1.0635703802108765e-06, 1.2665987014770508e-06, 1.469627022743225e-06, 1.6726553440093994e-06, 1.8756836652755737e-06, 2.078711986541748e-06, 2.2817403078079224e-06, 2.4847686290740967e-06, 2.687796950340271e-06, 2.8908252716064453e-06, 3.0938535928726196e-06, 3.296881914138794e-06, 3.4999102354049683e-06, 3.7029385566711426e-06, 3.905966877937317e-06, 4.108995199203491e-06, 4.3120235204696655e-06, 4.51505184173584e-06, 4.718080163002014e-06, 4.9211084842681885e-06, 5.124136805534363e-06, 5.327165126800537e-06, 5.5301934480667114e-06, 5.733221769332886e-06, 5.93625009059906e-06, 6.139278411865234e-06]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 3.0, 0.0, 9.0, 0.0, 19.0, 0.0, 27.0, 32.0, 0.0, 46.0, 0.0, 47.0, 0.0, 66.0, 0.0, 95.0, 117.0, 0.0, 103.0, 0.0, 96.0, 0.0, 94.0, 66.0, 0.0, 56.0, 0.0, 39.0, 0.0, 24.0, 0.0, 20.0, 20.0, 0.0, 10.0, 0.0, 8.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1585652828216553e-06, -1.125037670135498e-06, -1.0915100574493408e-06, -1.0579824447631836e-06, -1.0244548320770264e-06, -9.909272193908691e-07, -9.57399606704712e-07, -9.238719940185547e-07, -8.903443813323975e-07, -8.568167686462402e-07, -8.23289155960083e-07, -7.897615432739258e-07, -7.562339305877686e-07, -7.227063179016113e-07, -6.891787052154541e-07, -6.556510925292969e-07, -6.221234798431396e-07, -5.885958671569824e-07, -5.550682544708252e-07, -5.21540641784668e-07, -4.880130290985107e-07, -4.544854164123535e-07, -4.209578037261963e-07, -3.8743019104003906e-07, -3.5390257835388184e-07, -3.203749656677246e-07, -2.868473529815674e-07, -2.5331974029541016e-07, -2.1979212760925293e-07, -1.862645149230957e-07, -1.5273690223693848e-07, -1.1920928955078125e-07, -8.568167686462402e-08, -5.21540641784668e-08, -1.862645149230957e-08, 1.4901161193847656e-08, 4.842877388000488e-08, 8.195638656616211e-08, 1.1548399925231934e-07, 1.4901161193847656e-07, 1.825392246246338e-07, 2.1606683731079102e-07, 2.4959444999694824e-07, 2.8312206268310547e-07, 3.166496753692627e-07, 3.501772880554199e-07, 3.8370490074157715e-07, 4.172325134277344e-07, 4.507601261138916e-07, 4.842877388000488e-07, 5.178153514862061e-07, 5.513429641723633e-07, 5.848705768585205e-07, 6.183981895446777e-07, 6.51925802230835e-07, 6.854534149169922e-07, 7.189810276031494e-07, 7.525086402893066e-07, 7.860362529754639e-07, 8.195638656616211e-07, 8.530914783477783e-07, 8.866190910339355e-07, 9.201467037200928e-07, 9.5367431640625e-07]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 11.0, 7.0, 25.0, 10.0, 36.0, 55.0, 39.0, 105.0, 67.0, 178.0, 139.0, 426.0, 673.0, 579.0, 1767.0, 1363.0, 4743.0, 10648.0, 9654.0, 41389.0, 45141.0, 257208.0, 299216.0, 257941.0, 71023.0, 15827.0, 15867.0, 4191.0, 4809.0, 1443.0, 1674.0, 943.0, 314.0, 391.0, 128.0, 175.0, 111.0, 47.0, 65.0, 28.0, 37.0, 11.0, 22.0, 16.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.7669593691825867e-06, -2.6728957891464233e-06, -2.57883220911026e-06, -2.4847686290740967e-06, -2.3907050490379333e-06, -2.29664146900177e-06, -2.2025778889656067e-06, -2.1085143089294434e-06, -2.01445072889328e-06, -1.9203871488571167e-06, -1.8263235688209534e-06, -1.73225998878479e-06, -1.6381964087486267e-06, -1.5441328287124634e-06, -1.4500692486763e-06, -1.3560056686401367e-06, -1.2619420886039734e-06, -1.16787850856781e-06, -1.0738149285316467e-06, -9.797513484954834e-07, -8.856877684593201e-07, -7.916241884231567e-07, -6.975606083869934e-07, -6.034970283508301e-07, -5.094334483146667e-07, -4.153698682785034e-07, -3.213062882423401e-07, -2.2724270820617676e-07, -1.3317912817001343e-07, -3.91155481338501e-08, 5.494803190231323e-08, 1.4901161193847656e-07, 2.430751919746399e-07, 3.371387720108032e-07, 4.3120235204696655e-07, 5.252659320831299e-07, 6.193295121192932e-07, 7.133930921554565e-07, 8.074566721916199e-07, 9.015202522277832e-07, 9.955838322639465e-07, 1.0896474123001099e-06, 1.1837109923362732e-06, 1.2777745723724365e-06, 1.3718381524085999e-06, 1.4659017324447632e-06, 1.5599653124809265e-06, 1.6540288925170898e-06, 1.7480924725532532e-06, 1.8421560525894165e-06, 1.93621963262558e-06, 2.030283212661743e-06, 2.1243467926979065e-06, 2.21841037273407e-06, 2.312473952770233e-06, 2.4065375328063965e-06, 2.50060111284256e-06, 2.594664692878723e-06, 2.6887282729148865e-06, 2.78279185295105e-06, 2.876855432987213e-06, 2.9709190130233765e-06, 3.06498259305954e-06, 3.159046173095703e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 6.0, 5.0, 11.0, 5.0, 9.0, 15.0, 3.0, 37.0, 13.0, 38.0, 54.0, 36.0, 88.0, 46.0, 43.0, 113.0, 42.0, 136.0, 52.0, 57.0, 36.0, 26.0, 42.0, 15.0, 27.0, 9.0, 7.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7418136596679688e-06, -2.6579946279525757e-06, -2.5741755962371826e-06, -2.4903565645217896e-06, -2.4065375328063965e-06, -2.3227185010910034e-06, -2.2388994693756104e-06, -2.1550804376602173e-06, -2.0712614059448242e-06, -1.987442374229431e-06, -1.903623342514038e-06, -1.819804310798645e-06, -1.735985279083252e-06, -1.6521662473678589e-06, -1.5683472156524658e-06, -1.4845281839370728e-06, -1.4007091522216797e-06, -1.3168901205062866e-06, -1.2330710887908936e-06, -1.1492520570755005e-06, -1.0654330253601074e-06, -9.816139936447144e-07, -8.977949619293213e-07, -8.139759302139282e-07, -7.301568984985352e-07, -6.463378667831421e-07, -5.62518835067749e-07, -4.78699803352356e-07, -3.948807716369629e-07, -3.110617399215698e-07, -2.2724270820617676e-07, -1.434236764907837e-07, -5.960464477539063e-08, 2.421438694000244e-08, 1.0803341865539551e-07, 1.9185245037078857e-07, 2.7567148208618164e-07, 3.594905138015747e-07, 4.4330954551696777e-07, 5.271285772323608e-07, 6.109476089477539e-07, 6.94766640663147e-07, 7.7858567237854e-07, 8.624047040939331e-07, 9.462237358093262e-07, 1.0300427675247192e-06, 1.1138617992401123e-06, 1.1976808309555054e-06, 1.2814998626708984e-06, 1.3653188943862915e-06, 1.4491379261016846e-06, 1.5329569578170776e-06, 1.6167759895324707e-06, 1.7005950212478638e-06, 1.7844140529632568e-06, 1.86823308467865e-06, 1.952052116394043e-06, 2.035871148109436e-06, 2.119690179824829e-06, 2.203509211540222e-06, 2.2873282432556152e-06, 2.3711472749710083e-06, 2.4549663066864014e-06, 2.5387853384017944e-06, 2.6226043701171875e-06]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 8.0, 4.0, 9.0, 7.0, 4.0, 10.0, 5.0, 29.0, 26.0, 34.0, 56.0, 65.0, 117.0, 131.0, 124.0, 75.0, 65.0, 36.0, 32.0, 27.0, 25.0, 18.0, 16.0, 13.0, 13.0, 8.0, 6.0, 11.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.812255353201181e-05, -7.48077072785236e-05, -7.149286102503538e-05, -6.817802204750478e-05, -6.486317579401657e-05, -6.154832954052836e-05, -5.8233483287040144e-05, -5.491863703355193e-05, -5.160379078006372e-05, -4.8288944526575506e-05, -4.49741019110661e-05, -4.165925565757789e-05, -3.8344409404089674e-05, -3.502956678858027e-05, -3.1714720535092056e-05, -2.8399874281603843e-05, -2.5085031666094437e-05, -2.1770187231595628e-05, -1.8455340978107415e-05, -1.5140496543608606e-05, -1.1825651199615095e-05, -8.510805855621584e-06, -5.1959614211227745e-06, -1.8811151676345617e-06, 1.4337292668642476e-06, 4.748574610857759e-06, 8.06341995485127e-06, 1.1378264389350079e-05, 1.469310973334359e-05, 1.80079550773371e-05, 2.132279951183591e-05, 2.4637645765324123e-05, 2.7952490199822932e-05, 3.1267336453311145e-05, 3.458217906882055e-05, 3.7897025322308764e-05, 4.121187157579698e-05, 4.452671419130638e-05, 4.7841560444794595e-05, 5.115640669828281e-05, 5.447125295177102e-05, 5.7786099205259234e-05, 6.110094545874745e-05, 6.441578443627805e-05, 6.773063068976626e-05, 7.104547694325447e-05, 7.436032319674268e-05, 7.76751694502309e-05, 8.09900084277615e-05, 8.430485468124971e-05, 8.761970093473792e-05, 9.093453991226852e-05, 9.424938616575673e-05, 9.756423241924495e-05, 0.00010087907867273316, 0.00010419392492622137, 0.00010750877117970958, 0.0001108236174331978, 0.00011413846368668601, 0.00011745330994017422, 0.00012076814891770482, 0.00012408300244715065, 0.00012739784142468125, 0.00013071269495412707, 0.00013402753393165767]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 1.0, 9.0, 8.0, 14.0, 11.0, 9.0, 11.0, 16.0, 17.0, 17.0, 25.0, 31.0, 31.0, 27.0, 29.0, 35.0, 40.0, 33.0, 40.0, 44.0, 35.0, 44.0, 48.0, 41.0, 30.0, 34.0, 25.0, 37.0, 35.0, 36.0, 31.0, 21.0, 12.0, 20.0, 20.0, 11.0, 9.0, 18.0, 14.0, 4.0, 11.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.699562072753906e-05, -6.470177322626114e-05, -6.240792572498322e-05, -6.011407822370529e-05, -5.782023072242737e-05, -5.5526383221149445e-05, -5.323253571987152e-05, -5.09386882185936e-05, -4.8644840717315674e-05, -4.635099321603775e-05, -4.405714571475983e-05, -4.17632982134819e-05, -3.946945071220398e-05, -3.7175603210926056e-05, -3.488175570964813e-05, -3.258790820837021e-05, -3.0294060707092285e-05, -2.800021320581436e-05, -2.5706365704536438e-05, -2.3412518203258514e-05, -2.111867070198059e-05, -1.8824823200702667e-05, -1.6530975699424744e-05, -1.423712819814682e-05, -1.1943280696868896e-05, -9.649433195590973e-06, -7.355585694313049e-06, -5.061738193035126e-06, -2.767890691757202e-06, -4.7404319047927856e-07, 1.819804310798645e-06, 4.113651812076569e-06, 6.407499313354492e-06, 8.701346814632416e-06, 1.099519431591034e-05, 1.3289041817188263e-05, 1.5582889318466187e-05, 1.787673681974411e-05, 2.0170584321022034e-05, 2.2464431822299957e-05, 2.475827932357788e-05, 2.7052126824855804e-05, 2.9345974326133728e-05, 3.163982182741165e-05, 3.3933669328689575e-05, 3.62275168299675e-05, 3.852136433124542e-05, 4.0815211832523346e-05, 4.310905933380127e-05, 4.540290683507919e-05, 4.769675433635712e-05, 4.999060183763504e-05, 5.2284449338912964e-05, 5.457829684019089e-05, 5.687214434146881e-05, 5.9165991842746735e-05, 6.145983934402466e-05, 6.375368684530258e-05, 6.60475343465805e-05, 6.834138184785843e-05, 7.063522934913635e-05, 7.292907685041428e-05, 7.52229243516922e-05, 7.751677185297012e-05, 7.981061935424805e-05]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 2.0, 1.0, 5.0, 9.0, 28.0, 24.0, 59.0, 108.0, 172.0, 311.0, 633.0, 1110.0, 2147.0, 4675.0, 13447.0, 48377.0, 3266163.0, 803081.0, 34976.0, 10678.0, 4111.0, 1952.0, 986.0, 502.0, 264.0, 145.0, 91.0, 52.0, 28.0, 23.0, 19.0, 12.0, 14.0, 6.0, 7.0, 6.0, 6.0, 6.0, 5.0, 4.0, 7.0, 9.0, 3.0, 10.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.346536636352539e-05, -5.048047751188278e-05, -4.749558866024017e-05, -4.4510699808597565e-05, -4.1525810956954956e-05, -3.854092210531235e-05, -3.555603325366974e-05, -3.257114440202713e-05, -2.958625555038452e-05, -2.6601366698741913e-05, -2.3616477847099304e-05, -2.0631588995456696e-05, -1.7646700143814087e-05, -1.4661811292171478e-05, -1.167692244052887e-05, -8.692033588886261e-06, -5.707144737243652e-06, -2.7222558856010437e-06, 2.6263296604156494e-07, 3.2475218176841736e-06, 6.232410669326782e-06, 9.217299520969391e-06, 1.2202188372612e-05, 1.5187077224254608e-05, 1.8171966075897217e-05, 2.1156854927539825e-05, 2.4141743779182434e-05, 2.7126632630825043e-05, 3.011152148246765e-05, 3.309641033411026e-05, 3.608129918575287e-05, 3.906618803739548e-05, 4.2051076889038086e-05, 4.5035965740680695e-05, 4.80208545923233e-05, 5.100574344396591e-05, 5.399063229560852e-05, 5.697552114725113e-05, 5.996040999889374e-05, 6.294529885053635e-05, 6.593018770217896e-05, 6.891507655382156e-05, 7.189996540546417e-05, 7.488485425710678e-05, 7.786974310874939e-05, 8.0854631960392e-05, 8.383952081203461e-05, 8.682440966367722e-05, 8.980929851531982e-05, 9.279418736696243e-05, 9.577907621860504e-05, 9.876396507024765e-05, 0.00010174885392189026, 0.00010473374277353287, 0.00010771863162517548, 0.00011070352047681808, 0.0001136884093284607, 0.0001166732981801033, 0.00011965818703174591, 0.00012264307588338852, 0.00012562796473503113, 0.00012861285358667374, 0.00013159774243831635, 0.00013458263128995895, 0.00013756752014160156]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 5.0, 7.0, 9.0, 9.0, 11.0, 19.0, 49.0, 66.0, 95.0, 136.0, 134.0, 137.0, 103.0, 64.0, 59.0, 35.0, 19.0, 11.0, 7.0, 11.0, 11.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3887882232666016e-05, -1.3059936463832855e-05, -1.2231990694999695e-05, -1.1404044926166534e-05, -1.0576099157333374e-05, -9.748153388500214e-06, -8.920207619667053e-06, -8.092261850833893e-06, -7.264316082000732e-06, -6.436370313167572e-06, -5.608424544334412e-06, -4.780478775501251e-06, -3.952533006668091e-06, -3.1245872378349304e-06, -2.29664146900177e-06, -1.4686957001686096e-06, -6.407499313354492e-07, 1.8719583749771118e-07, 1.0151416063308716e-06, 1.843087375164032e-06, 2.6710331439971924e-06, 3.4989789128303528e-06, 4.326924681663513e-06, 5.154870450496674e-06, 5.982816219329834e-06, 6.810761988162994e-06, 7.638707756996155e-06, 8.466653525829315e-06, 9.294599294662476e-06, 1.0122545063495636e-05, 1.0950490832328796e-05, 1.1778436601161957e-05, 1.2606382369995117e-05, 1.3434328138828278e-05, 1.4262273907661438e-05, 1.5090219676494598e-05, 1.591816544532776e-05, 1.674611121416092e-05, 1.757405698299408e-05, 1.840200275182724e-05, 1.92299485206604e-05, 2.005789428949356e-05, 2.088584005832672e-05, 2.171378582715988e-05, 2.2541731595993042e-05, 2.3369677364826202e-05, 2.4197623133659363e-05, 2.5025568902492523e-05, 2.5853514671325684e-05, 2.6681460440158844e-05, 2.7509406208992004e-05, 2.8337351977825165e-05, 2.9165297746658325e-05, 2.9993243515491486e-05, 3.0821189284324646e-05, 3.1649135053157806e-05, 3.247708082199097e-05, 3.330502659082413e-05, 3.413297235965729e-05, 3.496091812849045e-05, 3.578886389732361e-05, 3.661680966615677e-05, 3.744475543498993e-05, 3.827270120382309e-05, 3.910064697265625e-05]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 11.0, 9.0, 17.0, 23.0, 25.0, 45.0, 65.0, 107.0, 144.0, 244.0, 356.0, 487.0, 794.0, 1226.0, 1967.0, 3122.0, 5056.0, 8806.0, 15515.0, 29625.0, 63471.0, 195738.0, 3260707.0, 431214.0, 90322.0, 38390.0, 19384.0, 10808.0, 6282.0, 3740.0, 2409.0, 1422.0, 909.0, 620.0, 392.0, 266.0, 176.0, 123.0, 99.0, 46.0, 33.0, 21.0, 11.0, 15.0, 7.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.141164779663086e-05, -3.0450522899627686e-05, -2.9489398002624512e-05, -2.8528273105621338e-05, -2.7567148208618164e-05, -2.660602331161499e-05, -2.5644898414611816e-05, -2.4683773517608643e-05, -2.372264862060547e-05, -2.2761523723602295e-05, -2.180039882659912e-05, -2.0839273929595947e-05, -1.9878149032592773e-05, -1.89170241355896e-05, -1.7955899238586426e-05, -1.6994774341583252e-05, -1.6033649444580078e-05, -1.5072524547576904e-05, -1.411139965057373e-05, -1.3150274753570557e-05, -1.2189149856567383e-05, -1.1228024959564209e-05, -1.0266900062561035e-05, -9.305775165557861e-06, -8.344650268554688e-06, -7.383525371551514e-06, -6.42240047454834e-06, -5.461275577545166e-06, -4.500150680541992e-06, -3.5390257835388184e-06, -2.5779008865356445e-06, -1.6167759895324707e-06, -6.556510925292969e-07, 3.0547380447387695e-07, 1.2665987014770508e-06, 2.2277235984802246e-06, 3.1888484954833984e-06, 4.149973392486572e-06, 5.111098289489746e-06, 6.07222318649292e-06, 7.033348083496094e-06, 7.994472980499268e-06, 8.955597877502441e-06, 9.916722774505615e-06, 1.0877847671508789e-05, 1.1838972568511963e-05, 1.2800097465515137e-05, 1.376122236251831e-05, 1.4722347259521484e-05, 1.5683472156524658e-05, 1.6644597053527832e-05, 1.7605721950531006e-05, 1.856684684753418e-05, 1.9527971744537354e-05, 2.0489096641540527e-05, 2.14502215385437e-05, 2.2411346435546875e-05, 2.337247133255005e-05, 2.4333596229553223e-05, 2.5294721126556396e-05, 2.625584602355957e-05, 2.7216970920562744e-05, 2.8178095817565918e-05, 2.9139220714569092e-05, 3.0100345611572266e-05]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 7.0, 6.0, 8.0, 10.0, 19.0, 15.0, 20.0, 20.0, 22.0, 23.0, 36.0, 40.0, 63.0, 83.0, 227.0, 585.0, 1242.0, 792.0, 288.0, 138.0, 73.0, 75.0, 41.0, 33.0, 34.0, 28.0, 21.0, 23.0, 12.0, 8.0, 15.0, 13.0, 9.0, 6.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.5033950805664062e-05, -2.4267472326755524e-05, -2.3500993847846985e-05, -2.2734515368938446e-05, -2.1968036890029907e-05, -2.120155841112137e-05, -2.043507993221283e-05, -1.966860145330429e-05, -1.8902122974395752e-05, -1.8135644495487213e-05, -1.7369166016578674e-05, -1.6602687537670135e-05, -1.5836209058761597e-05, -1.5069730579853058e-05, -1.4303252100944519e-05, -1.353677362203598e-05, -1.2770295143127441e-05, -1.2003816664218903e-05, -1.1237338185310364e-05, -1.0470859706401825e-05, -9.704381227493286e-06, -8.937902748584747e-06, -8.171424269676208e-06, -7.40494579076767e-06, -6.638467311859131e-06, -5.871988832950592e-06, -5.105510354042053e-06, -4.339031875133514e-06, -3.5725533962249756e-06, -2.8060749173164368e-06, -2.039596438407898e-06, -1.2731179594993591e-06, -5.066394805908203e-07, 2.598389983177185e-07, 1.0263174772262573e-06, 1.7927959561347961e-06, 2.559274435043335e-06, 3.3257529139518738e-06, 4.092231392860413e-06, 4.858709871768951e-06, 5.62518835067749e-06, 6.391666829586029e-06, 7.158145308494568e-06, 7.924623787403107e-06, 8.691102266311646e-06, 9.457580745220184e-06, 1.0224059224128723e-05, 1.0990537703037262e-05, 1.17570161819458e-05, 1.252349466085434e-05, 1.3289973139762878e-05, 1.4056451618671417e-05, 1.4822930097579956e-05, 1.5589408576488495e-05, 1.6355887055397034e-05, 1.7122365534305573e-05, 1.788884401321411e-05, 1.865532249212265e-05, 1.942180097103119e-05, 2.0188279449939728e-05, 2.0954757928848267e-05, 2.1721236407756805e-05, 2.2487714886665344e-05, 2.3254193365573883e-05, 2.4020671844482422e-05]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 8.0, 20.0, 18.0, 30.0, 51.0, 73.0, 92.0, 127.0, 127.0, 97.0, 84.0, 57.0, 36.0, 32.0, 23.0, 15.0, 18.0, 13.0, 12.0, 7.0, 10.0, 8.0, 5.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017429336730856448, -0.00016915309242904186, -0.00016401281754951924, -0.00015887254266999662, -0.000153732267790474, -0.00014859199291095138, -0.00014345171803142875, -0.00013831144315190613, -0.0001331711682723835, -0.0001280308933928609, -0.00012289061851333827, -0.00011775034363381565, -0.00011261006875429302, -0.0001074697938747704, -0.00010232951899524778, -9.718924411572516e-05, -9.204897651216015e-05, -8.690870163263753e-05, -8.176842675311491e-05, -7.662815187359229e-05, -7.148787699406967e-05, -6.634760211454704e-05, -6.120733451098204e-05, -5.606705599348061e-05, -5.0926781113957986e-05, -4.5786506234435365e-05, -4.064623135491274e-05, -3.550596011336893e-05, -3.0365683414856903e-05, -2.522540853533428e-05, -2.0085135474801064e-05, -1.4944860595278442e-05, -9.80458571575582e-06, -4.6643112909805495e-06, 4.759631337947212e-07, 5.616237103822641e-06, 1.0756511983345263e-05, 1.5896786862867884e-05, 2.1037059923401102e-05, 2.6177334802923724e-05, 3.1317609682446346e-05, 3.645788456196897e-05, 4.159815944149159e-05, 4.6738430683035403e-05, 5.1878705562558025e-05, 5.701898044208065e-05, 6.215925532160327e-05, 6.729953020112589e-05, 7.243980508064851e-05, 7.758007996017113e-05, 8.272035483969375e-05, 8.786062971921638e-05, 9.3000904598739e-05, 9.814117947826162e-05, 0.00010328144708182663, 0.00010842172196134925, 0.00011356199684087187, 0.00011870227172039449, 0.00012384254659991711, 0.00012898282147943974, 0.00013412309635896236, 0.00013926337123848498, 0.0001444036461180076, 0.00014954392099753022, 0.00015468419587705284]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 6.0, 4.0, 7.0, 6.0, 10.0, 3.0, 16.0, 16.0, 18.0, 14.0, 14.0, 18.0, 25.0, 28.0, 31.0, 39.0, 37.0, 32.0, 35.0, 35.0, 44.0, 41.0, 36.0, 54.0, 38.0, 40.0, 32.0, 40.0, 32.0, 30.0, 37.0, 33.0, 23.0, 21.0, 18.0, 18.0, 8.0, 12.0, 10.0, 10.0, 5.0, 6.0, 5.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.08970832824707e-05, -8.826423436403275e-05, -8.563138544559479e-05, -8.299853652715683e-05, -8.036568760871887e-05, -7.773283869028091e-05, -7.509998977184296e-05, -7.2467140853405e-05, -6.983429193496704e-05, -6.720144301652908e-05, -6.456859409809113e-05, -6.193574517965317e-05, -5.930289626121521e-05, -5.667004734277725e-05, -5.4037198424339294e-05, -5.140434950590134e-05, -4.877150058746338e-05, -4.613865166902542e-05, -4.350580275058746e-05, -4.0872953832149506e-05, -3.824010491371155e-05, -3.560725599527359e-05, -3.297440707683563e-05, -3.0341558158397675e-05, -2.7708709239959717e-05, -2.507586032152176e-05, -2.24430114030838e-05, -1.9810162484645844e-05, -1.7177313566207886e-05, -1.4544464647769928e-05, -1.191161572933197e-05, -9.278766810894012e-06, -6.645917892456055e-06, -4.013068974018097e-06, -1.3802200555801392e-06, 1.2526288628578186e-06, 3.885477781295776e-06, 6.518326699733734e-06, 9.151175618171692e-06, 1.178402453660965e-05, 1.4416873455047607e-05, 1.7049722373485565e-05, 1.9682571291923523e-05, 2.231542021036148e-05, 2.494826912879944e-05, 2.7581118047237396e-05, 3.0213966965675354e-05, 3.284681588411331e-05, 3.547966480255127e-05, 3.811251372098923e-05, 4.0745362639427185e-05, 4.337821155786514e-05, 4.60110604763031e-05, 4.864390939474106e-05, 5.1276758313179016e-05, 5.3909607231616974e-05, 5.654245615005493e-05, 5.917530506849289e-05, 6.180815398693085e-05, 6.44410029053688e-05, 6.707385182380676e-05, 6.970670074224472e-05, 7.233954966068268e-05, 7.497239857912064e-05, 7.76052474975586e-05]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 2.0, 8.0, 14.0, 10.0, 14.0, 16.0, 17.0, 21.0, 23.0, 40.0, 55.0, 115.0, 217.0, 527.0, 1280.0, 3407.0, 9713.0, 34200.0, 200724.0, 690355.0, 79738.0, 18421.0, 5910.0, 2121.0, 787.0, 362.0, 155.0, 73.0, 41.0, 42.0, 27.0, 21.0, 19.0, 13.0, 11.0, 16.0, 9.0, 6.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001342296600341797, -0.00012979470193386078, -0.00012535974383354187, -0.00012092478573322296, -0.00011648982763290405, -0.00011205486953258514, -0.00010761991143226624, -0.00010318495333194733, -9.874999523162842e-05, -9.431503713130951e-05, -8.98800790309906e-05, -8.544512093067169e-05, -8.101016283035278e-05, -7.657520473003387e-05, -7.214024662971497e-05, -6.770528852939606e-05, -6.327033042907715e-05, -5.883537232875824e-05, -5.440041422843933e-05, -4.996545612812042e-05, -4.5530498027801514e-05, -4.1095539927482605e-05, -3.6660581827163696e-05, -3.222562372684479e-05, -2.779066562652588e-05, -2.335570752620697e-05, -1.892074942588806e-05, -1.4485791325569153e-05, -1.0050833225250244e-05, -5.6158751249313354e-06, -1.1809170246124268e-06, 3.254041075706482e-06, 7.68899917602539e-06, 1.21239572763443e-05, 1.6558915376663208e-05, 2.0993873476982117e-05, 2.5428831577301025e-05, 2.9863789677619934e-05, 3.429874777793884e-05, 3.873370587825775e-05, 4.316866397857666e-05, 4.760362207889557e-05, 5.203858017921448e-05, 5.6473538279533386e-05, 6.0908496379852295e-05, 6.53434544801712e-05, 6.977841258049011e-05, 7.421337068080902e-05, 7.864832878112793e-05, 8.308328688144684e-05, 8.751824498176575e-05, 9.195320308208466e-05, 9.638816118240356e-05, 0.00010082311928272247, 0.00010525807738304138, 0.00010969303548336029, 0.0001141279935836792, 0.00011856295168399811, 0.00012299790978431702, 0.00012743286788463593, 0.00013186782598495483, 0.00013630278408527374, 0.00014073774218559265, 0.00014517270028591156, 0.00014960765838623047]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 12.0, 17.0, 40.0, 57.0, 84.0, 91.0, 143.0, 143.0, 113.0, 75.0, 64.0, 52.0, 23.0, 19.0, 12.0, 15.0, 8.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.5201978385448456e-05, -1.4370307326316833e-05, -1.3538636267185211e-05, -1.2706965208053589e-05, -1.1875294148921967e-05, -1.1043623089790344e-05, -1.0211952030658722e-05, -9.3802809715271e-06, -8.548609912395477e-06, -7.716938853263855e-06, -6.885267794132233e-06, -6.05359673500061e-06, -5.221925675868988e-06, -4.390254616737366e-06, -3.5585835576057434e-06, -2.726912498474121e-06, -1.8952414393424988e-06, -1.0635703802108765e-06, -2.3189932107925415e-07, 5.997717380523682e-07, 1.4314427971839905e-06, 2.263113856315613e-06, 3.094784915447235e-06, 3.926455974578857e-06, 4.75812703371048e-06, 5.589798092842102e-06, 6.421469151973724e-06, 7.253140211105347e-06, 8.084811270236969e-06, 8.916482329368591e-06, 9.748153388500214e-06, 1.0579824447631836e-05, 1.1411495506763458e-05, 1.224316656589508e-05, 1.3074837625026703e-05, 1.3906508684158325e-05, 1.4738179743289948e-05, 1.556985080242157e-05, 1.6401521861553192e-05, 1.7233192920684814e-05, 1.8064863979816437e-05, 1.889653503894806e-05, 1.972820609807968e-05, 2.0559877157211304e-05, 2.1391548216342926e-05, 2.222321927547455e-05, 2.305489033460617e-05, 2.3886561393737793e-05, 2.4718232452869415e-05, 2.5549903512001038e-05, 2.638157457113266e-05, 2.7213245630264282e-05, 2.8044916689395905e-05, 2.8876587748527527e-05, 2.970825880765915e-05, 3.053992986679077e-05, 3.1371600925922394e-05, 3.2203271985054016e-05, 3.303494304418564e-05, 3.386661410331726e-05, 3.469828516244888e-05, 3.5529956221580505e-05, 3.636162728071213e-05, 3.719329833984375e-05]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 9.0, 11.0, 22.0, 28.0, 39.0, 54.0, 78.0, 112.0, 143.0, 228.0, 386.0, 516.0, 811.0, 1148.0, 1891.0, 2849.0, 4621.0, 7406.0, 12195.0, 18571.0, 34623.0, 64559.0, 135647.0, 384554.0, 183379.0, 86543.0, 44589.0, 24960.0, 14509.0, 8822.0, 5087.0, 3555.0, 2290.0, 1446.0, 958.0, 603.0, 384.0, 317.0, 183.0, 148.0, 86.0, 54.0, 46.0, 29.0, 16.0, 16.0, 8.0, 16.0, 4.0, 6.0, 0.0, 3.0, 3.0, 3.0], "bins": [-2.777576446533203e-05, -2.6951543986797333e-05, -2.6127323508262634e-05, -2.5303103029727936e-05, -2.4478882551193237e-05, -2.365466207265854e-05, -2.283044159412384e-05, -2.2006221115589142e-05, -2.1182000637054443e-05, -2.0357780158519745e-05, -1.9533559679985046e-05, -1.8709339201450348e-05, -1.788511872291565e-05, -1.706089824438095e-05, -1.6236677765846252e-05, -1.5412457287311554e-05, -1.4588236808776855e-05, -1.3764016330242157e-05, -1.2939795851707458e-05, -1.211557537317276e-05, -1.1291354894638062e-05, -1.0467134416103363e-05, -9.642913937568665e-06, -8.818693459033966e-06, -7.994472980499268e-06, -7.170252501964569e-06, -6.346032023429871e-06, -5.521811544895172e-06, -4.697591066360474e-06, -3.873370587825775e-06, -3.0491501092910767e-06, -2.224929630756378e-06, -1.4007091522216797e-06, -5.764886736869812e-07, 2.477318048477173e-07, 1.0719522833824158e-06, 1.8961727619171143e-06, 2.7203932404518127e-06, 3.5446137189865112e-06, 4.36883419752121e-06, 5.193054676055908e-06, 6.017275154590607e-06, 6.841495633125305e-06, 7.665716111660004e-06, 8.489936590194702e-06, 9.3141570687294e-06, 1.0138377547264099e-05, 1.0962598025798798e-05, 1.1786818504333496e-05, 1.2611038982868195e-05, 1.3435259461402893e-05, 1.4259479939937592e-05, 1.508370041847229e-05, 1.590792089700699e-05, 1.6732141375541687e-05, 1.7556361854076385e-05, 1.8380582332611084e-05, 1.9204802811145782e-05, 2.002902328968048e-05, 2.085324376821518e-05, 2.1677464246749878e-05, 2.2501684725284576e-05, 2.3325905203819275e-05, 2.4150125682353973e-05, 2.4974346160888672e-05]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 4.0, 9.0, 15.0, 13.0, 13.0, 18.0, 24.0, 17.0, 22.0, 32.0, 29.0, 42.0, 33.0, 44.0, 43.0, 44.0, 35.0, 37.0, 37.0, 50.0, 48.0, 33.0, 43.0, 42.0, 40.0, 33.0, 21.0, 24.0, 25.0, 29.0, 11.0, 10.0, 10.0, 12.0, 14.0, 8.0, 6.0, 4.0, 7.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5987625122070312e-05, -2.511683851480484e-05, -2.4246051907539368e-05, -2.3375265300273895e-05, -2.2504478693008423e-05, -2.163369208574295e-05, -2.0762905478477478e-05, -1.9892118871212006e-05, -1.9021332263946533e-05, -1.815054565668106e-05, -1.727975904941559e-05, -1.6408972442150116e-05, -1.5538185834884644e-05, -1.4667399227619171e-05, -1.3796612620353699e-05, -1.2925826013088226e-05, -1.2055039405822754e-05, -1.1184252798557281e-05, -1.0313466191291809e-05, -9.442679584026337e-06, -8.571892976760864e-06, -7.701106369495392e-06, -6.8303197622299194e-06, -5.959533154964447e-06, -5.088746547698975e-06, -4.217959940433502e-06, -3.3471733331680298e-06, -2.4763867259025574e-06, -1.605600118637085e-06, -7.348135113716125e-07, 1.3597309589385986e-07, 1.0067597031593323e-06, 1.8775463104248047e-06, 2.748332917690277e-06, 3.6191195249557495e-06, 4.489906132221222e-06, 5.360692739486694e-06, 6.231479346752167e-06, 7.102265954017639e-06, 7.973052561283112e-06, 8.843839168548584e-06, 9.714625775814056e-06, 1.0585412383079529e-05, 1.1456198990345001e-05, 1.2326985597610474e-05, 1.3197772204875946e-05, 1.4068558812141418e-05, 1.4939345419406891e-05, 1.5810132026672363e-05, 1.6680918633937836e-05, 1.7551705241203308e-05, 1.842249184846878e-05, 1.9293278455734253e-05, 2.0164065062999725e-05, 2.1034851670265198e-05, 2.190563827753067e-05, 2.2776424884796143e-05, 2.3647211492061615e-05, 2.4517998099327087e-05, 2.538878470659256e-05, 2.6259571313858032e-05, 2.7130357921123505e-05, 2.8001144528388977e-05, 2.887193113565445e-05, 2.9742717742919922e-05]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 11.0, 12.0, 19.0, 20.0, 41.0, 60.0, 73.0, 123.0, 186.0, 343.0, 573.0, 1033.0, 2002.0, 5491.0, 21881.0, 342889.0, 633471.0, 28989.0, 6247.0, 2410.0, 1023.0, 634.0, 359.0, 214.0, 145.0, 103.0, 56.0, 51.0, 25.0, 27.0, 10.0, 12.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1265277862548828e-05, -1.0849907994270325e-05, -1.0434538125991821e-05, -1.0019168257713318e-05, -9.603798389434814e-06, -9.188428521156311e-06, -8.773058652877808e-06, -8.357688784599304e-06, -7.9423189163208e-06, -7.526949048042297e-06, -7.111579179763794e-06, -6.6962093114852905e-06, -6.280839443206787e-06, -5.865469574928284e-06, -5.45009970664978e-06, -5.034729838371277e-06, -4.6193599700927734e-06, -4.20399010181427e-06, -3.7886202335357666e-06, -3.373250365257263e-06, -2.9578804969787598e-06, -2.5425106287002563e-06, -2.127140760421753e-06, -1.7117708921432495e-06, -1.296401023864746e-06, -8.810311555862427e-07, -4.6566128730773926e-07, -5.029141902923584e-08, 3.650784492492676e-07, 7.80448317527771e-07, 1.1958181858062744e-06, 1.6111880540847778e-06, 2.0265579223632812e-06, 2.4419277906417847e-06, 2.857297658920288e-06, 3.2726675271987915e-06, 3.688037395477295e-06, 4.103407263755798e-06, 4.518777132034302e-06, 4.934147000312805e-06, 5.349516868591309e-06, 5.764886736869812e-06, 6.1802566051483154e-06, 6.595626473426819e-06, 7.010996341705322e-06, 7.426366209983826e-06, 7.841736078262329e-06, 8.257105946540833e-06, 8.672475814819336e-06, 9.08784568309784e-06, 9.503215551376343e-06, 9.918585419654846e-06, 1.033395528793335e-05, 1.0749325156211853e-05, 1.1164695024490356e-05, 1.158006489276886e-05, 1.1995434761047363e-05, 1.2410804629325867e-05, 1.282617449760437e-05, 1.3241544365882874e-05, 1.3656914234161377e-05, 1.407228410243988e-05, 1.4487653970718384e-05, 1.4903023838996887e-05, 1.531839370727539e-05]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 7.0, 18.0, 0.0, 11.0, 17.0, 0.0, 30.0, 40.0, 0.0, 50.0, 70.0, 0.0, 88.0, 108.0, 0.0, 105.0, 90.0, 0.0, 91.0, 74.0, 0.0, 52.0, 46.0, 0.0, 31.0, 22.0, 0.0, 25.0, 8.0, 0.0, 10.0, 4.0, 0.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3308599591255188e-06, -1.2908130884170532e-06, -1.2507662177085876e-06, -1.210719347000122e-06, -1.1706724762916565e-06, -1.130625605583191e-06, -1.0905787348747253e-06, -1.0505318641662598e-06, -1.0104849934577942e-06, -9.704381227493286e-07, -9.30391252040863e-07, -8.903443813323975e-07, -8.502975106239319e-07, -8.102506399154663e-07, -7.702037692070007e-07, -7.301568984985352e-07, -6.901100277900696e-07, -6.50063157081604e-07, -6.100162863731384e-07, -5.699694156646729e-07, -5.299225449562073e-07, -4.898756742477417e-07, -4.498288035392761e-07, -4.0978193283081055e-07, -3.6973506212234497e-07, -3.296881914138794e-07, -2.896413207054138e-07, -2.4959444999694824e-07, -2.0954757928848267e-07, -1.695007085800171e-07, -1.2945383787155151e-07, -8.940696716308594e-08, -4.936009645462036e-08, -9.313225746154785e-09, 3.073364496231079e-08, 7.078051567077637e-08, 1.1082738637924194e-07, 1.5087425708770752e-07, 1.909211277961731e-07, 2.3096799850463867e-07, 2.7101486921310425e-07, 3.110617399215698e-07, 3.511086106300354e-07, 3.91155481338501e-07, 4.3120235204696655e-07, 4.7124922275543213e-07, 5.112960934638977e-07, 5.513429641723633e-07, 5.913898348808289e-07, 6.314367055892944e-07, 6.7148357629776e-07, 7.115304470062256e-07, 7.515773177146912e-07, 7.916241884231567e-07, 8.316710591316223e-07, 8.717179298400879e-07, 9.117648005485535e-07, 9.51811671257019e-07, 9.918585419654846e-07, 1.0319054126739502e-06, 1.0719522833824158e-06, 1.1119991540908813e-06, 1.152046024799347e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 3.0, 8.0, 19.0, 11.0, 29.0, 15.0, 58.0, 61.0, 40.0, 142.0, 195.0, 129.0, 379.0, 545.0, 394.0, 1208.0, 2084.0, 1613.0, 5185.0, 4327.0, 15285.0, 37371.0, 39393.0, 240778.0, 517278.0, 73595.0, 62168.0, 23567.0, 6336.0, 7276.0, 2165.0, 2760.0, 1541.0, 503.0, 729.0, 475.0, 143.0, 260.0, 168.0, 49.0, 85.0, 52.0, 25.0, 31.0, 6.0, 17.0, 15.0, 8.0, 14.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-3.159046173095703e-06, -3.061257302761078e-06, -2.9634684324264526e-06, -2.8656795620918274e-06, -2.767890691757202e-06, -2.670101821422577e-06, -2.5723129510879517e-06, -2.4745240807533264e-06, -2.376735210418701e-06, -2.278946340084076e-06, -2.1811574697494507e-06, -2.0833685994148254e-06, -1.9855797290802e-06, -1.887790858745575e-06, -1.7900019884109497e-06, -1.6922131180763245e-06, -1.5944242477416992e-06, -1.496635377407074e-06, -1.3988465070724487e-06, -1.3010576367378235e-06, -1.2032687664031982e-06, -1.105479896068573e-06, -1.0076910257339478e-06, -9.099021553993225e-07, -8.121132850646973e-07, -7.14324414730072e-07, -6.165355443954468e-07, -5.187466740608215e-07, -4.209578037261963e-07, -3.2316893339157104e-07, -2.253800630569458e-07, -1.2759119272232056e-07, -2.9802322387695312e-08, 6.798654794692993e-08, 1.6577541828155518e-07, 2.635642886161804e-07, 3.6135315895080566e-07, 4.591420292854309e-07, 5.569308996200562e-07, 6.547197699546814e-07, 7.525086402893066e-07, 8.502975106239319e-07, 9.480863809585571e-07, 1.0458752512931824e-06, 1.1436641216278076e-06, 1.2414529919624329e-06, 1.339241862297058e-06, 1.4370307326316833e-06, 1.5348196029663086e-06, 1.6326084733009338e-06, 1.730397343635559e-06, 1.8281862139701843e-06, 1.9259750843048096e-06, 2.023763954639435e-06, 2.12155282497406e-06, 2.2193416953086853e-06, 2.3171305656433105e-06, 2.414919435977936e-06, 2.512708306312561e-06, 2.6104971766471863e-06, 2.7082860469818115e-06, 2.8060749173164368e-06, 2.903863787651062e-06, 3.0016526579856873e-06, 3.0994415283203125e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 7.0, 4.0, 3.0, 13.0, 12.0, 11.0, 23.0, 26.0, 14.0, 42.0, 51.0, 34.0, 76.0, 97.0, 60.0, 113.0, 57.0, 72.0, 72.0, 28.0, 52.0, 34.0, 11.0, 22.0, 22.0, 4.0, 10.0, 8.0, 2.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-06, -2.8815120458602905e-06, -2.78279185295105e-06, -2.684071660041809e-06, -2.5853514671325684e-06, -2.4866312742233276e-06, -2.387911081314087e-06, -2.289190888404846e-06, -2.1904706954956055e-06, -2.0917505025863647e-06, -1.993030309677124e-06, -1.8943101167678833e-06, -1.7955899238586426e-06, -1.6968697309494019e-06, -1.5981495380401611e-06, -1.4994293451309204e-06, -1.4007091522216797e-06, -1.301988959312439e-06, -1.2032687664031982e-06, -1.1045485734939575e-06, -1.0058283805847168e-06, -9.071081876754761e-07, -8.083879947662354e-07, -7.096678018569946e-07, -6.109476089477539e-07, -5.122274160385132e-07, -4.1350722312927246e-07, -3.1478703022003174e-07, -2.1606683731079102e-07, -1.1734664440155029e-07, -1.862645149230957e-08, 8.009374141693115e-08, 1.7881393432617188e-07, 2.775341272354126e-07, 3.762543201446533e-07, 4.7497451305389404e-07, 5.736947059631348e-07, 6.724148988723755e-07, 7.711350917816162e-07, 8.698552846908569e-07, 9.685754776000977e-07, 1.0672956705093384e-06, 1.166015863418579e-06, 1.2647360563278198e-06, 1.3634562492370605e-06, 1.4621764421463013e-06, 1.560896635055542e-06, 1.6596168279647827e-06, 1.7583370208740234e-06, 1.8570572137832642e-06, 1.955777406692505e-06, 2.0544975996017456e-06, 2.1532177925109863e-06, 2.251937985420227e-06, 2.3506581783294678e-06, 2.4493783712387085e-06, 2.5480985641479492e-06, 2.64681875705719e-06, 2.7455389499664307e-06, 2.8442591428756714e-06, 2.942979335784912e-06, 3.041699528694153e-06, 3.1404197216033936e-06, 3.2391399145126343e-06, 3.337860107421875e-06]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 4.0, 9.0, 8.0, 10.0, 14.0, 21.0, 24.0, 31.0, 50.0, 42.0, 109.0, 119.0, 156.0, 97.0, 69.0, 57.0, 42.0, 34.0, 23.0, 13.0, 12.0, 13.0, 7.0, 5.0, 3.0, 2.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011754751903936267, -0.00011379676288925111, -0.00011004601401509717, -0.00010629525786498562, -0.00010254450899083167, -9.879375284072012e-05, -9.504299669060856e-05, -9.1292240540497e-05, -8.754149166634306e-05, -8.379073551623151e-05, -8.003998664207757e-05, -7.628923049196601e-05, -7.253847434185445e-05, -6.878772546770051e-05, -6.503696931758896e-05, -6.128622044343501e-05, -5.753546429332346e-05, -5.378471178119071e-05, -5.003395926905796e-05, -4.62832031189464e-05, -4.2532450606813654e-05, -3.8781698094680905e-05, -3.503094194456935e-05, -3.12801894324366e-05, -2.752943692030385e-05, -2.3778684408171102e-05, -2.002793007704895e-05, -1.6277175745926797e-05, -1.2526423233794048e-05, -8.7756707216613e-06, -5.024916390539147e-06, -1.2741620594169945e-06, 2.4765904527157545e-06, 6.227343874343205e-06, 9.978097295970656e-06, 1.3728850717598107e-05, 1.7479604139225557e-05, 2.1230356651358306e-05, 2.498111098248046e-05, 2.873186531360261e-05, 3.248261782573536e-05, 3.623337033786811e-05, 3.998412285000086e-05, 4.3734879000112414e-05, 4.748563151224516e-05, 5.123638402437791e-05, 5.498714017448947e-05, 5.873789268662222e-05, 6.248864519875497e-05, 6.623940134886652e-05, 6.999015022302046e-05, 7.374090637313202e-05, 7.749165524728596e-05, 8.124241139739752e-05, 8.499316754750907e-05, 8.874392369762063e-05, 9.249467257177457e-05, 9.624542872188613e-05, 9.999617759604007e-05, 0.00010374693374615163, 0.00010749768989626318, 0.00011124843877041712, 0.00011499919492052868, 0.00011874994379468262, 0.00012250069994479418]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 6.0, 10.0, 16.0, 13.0, 24.0, 17.0, 29.0, 31.0, 34.0, 56.0, 39.0, 62.0, 51.0, 53.0, 48.0, 52.0, 52.0, 55.0, 55.0, 43.0, 36.0, 36.0, 22.0, 30.0, 22.0, 17.0, 21.0, 8.0, 6.0, 17.0, 6.0, 8.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.225440979003906e-05, -7.950793951749802e-05, -7.676146924495697e-05, -7.401499897241592e-05, -7.126852869987488e-05, -6.852205842733383e-05, -6.577558815479279e-05, -6.302911788225174e-05, -6.028264760971069e-05, -5.753617733716965e-05, -5.47897070646286e-05, -5.2043236792087555e-05, -4.929676651954651e-05, -4.655029624700546e-05, -4.3803825974464417e-05, -4.105735570192337e-05, -3.8310885429382324e-05, -3.556441515684128e-05, -3.281794488430023e-05, -3.0071474611759186e-05, -2.732500433921814e-05, -2.4578534066677094e-05, -2.1832063794136047e-05, -1.9085593521595e-05, -1.6339123249053955e-05, -1.3592652976512909e-05, -1.0846182703971863e-05, -8.099712431430817e-06, -5.3532421588897705e-06, -2.6067718863487244e-06, 1.3969838619232178e-07, 2.886168658733368e-06, 5.632638931274414e-06, 8.37910920381546e-06, 1.1125579476356506e-05, 1.3872049748897552e-05, 1.66185200214386e-05, 1.9364990293979645e-05, 2.211146056652069e-05, 2.4857930839061737e-05, 2.7604401111602783e-05, 3.035087138414383e-05, 3.3097341656684875e-05, 3.584381192922592e-05, 3.859028220176697e-05, 4.1336752474308014e-05, 4.408322274684906e-05, 4.6829693019390106e-05, 4.957616329193115e-05, 5.23226335644722e-05, 5.5069103837013245e-05, 5.781557410955429e-05, 6.056204438209534e-05, 6.330851465463638e-05, 6.605498492717743e-05, 6.880145519971848e-05, 7.154792547225952e-05, 7.429439574480057e-05, 7.704086601734161e-05, 7.978733628988266e-05, 8.25338065624237e-05, 8.528027683496475e-05, 8.80267471075058e-05, 9.077321738004684e-05, 9.351968765258789e-05]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 16.0, 15.0, 22.0, 42.0, 58.0, 73.0, 144.0, 221.0, 341.0, 518.0, 872.0, 1401.0, 2773.0, 6048.0, 14903.0, 55269.0, 3534785.0, 523412.0, 31058.0, 11338.0, 5032.0, 2415.0, 1339.0, 738.0, 454.0, 327.0, 208.0, 119.0, 84.0, 66.0, 50.0, 36.0, 19.0, 17.0, 17.0, 10.0, 9.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4001808166503906e-05, -5.173590034246445e-05, -4.946999251842499e-05, -4.720408469438553e-05, -4.493817687034607e-05, -4.267226904630661e-05, -4.040636122226715e-05, -3.814045339822769e-05, -3.587454557418823e-05, -3.360863775014877e-05, -3.1342729926109314e-05, -2.9076822102069855e-05, -2.6810914278030396e-05, -2.4545006453990936e-05, -2.2279098629951477e-05, -2.0013190805912018e-05, -1.774728298187256e-05, -1.54813751578331e-05, -1.321546733379364e-05, -1.0949559509754181e-05, -8.683651685714722e-06, -6.4177438616752625e-06, -4.151836037635803e-06, -1.885928213596344e-06, 3.7997961044311523e-07, 2.6458874344825745e-06, 4.911795258522034e-06, 7.177703082561493e-06, 9.443610906600952e-06, 1.1709518730640411e-05, 1.397542655467987e-05, 1.624133437871933e-05, 1.850724220275879e-05, 2.0773150026798248e-05, 2.3039057850837708e-05, 2.5304965674877167e-05, 2.7570873498916626e-05, 2.9836781322956085e-05, 3.2102689146995544e-05, 3.4368596971035004e-05, 3.663450479507446e-05, 3.890041261911392e-05, 4.116632044315338e-05, 4.343222826719284e-05, 4.56981360912323e-05, 4.796404391527176e-05, 5.022995173931122e-05, 5.249585956335068e-05, 5.476176738739014e-05, 5.7027675211429596e-05, 5.9293583035469055e-05, 6.155949085950851e-05, 6.382539868354797e-05, 6.609130650758743e-05, 6.835721433162689e-05, 7.062312215566635e-05, 7.288902997970581e-05, 7.515493780374527e-05, 7.742084562778473e-05, 7.968675345182419e-05, 8.195266127586365e-05, 8.42185690999031e-05, 8.648447692394257e-05, 8.875038474798203e-05, 9.101629257202148e-05]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 9.0, 3.0, 5.0, 3.0, 7.0, 9.0, 12.0, 13.0, 21.0, 42.0, 41.0, 58.0, 75.0, 116.0, 90.0, 112.0, 81.0, 76.0, 53.0, 46.0, 40.0, 26.0, 13.0, 17.0, 10.0, 5.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4007091522216797e-05, -1.3397075235843658e-05, -1.278705894947052e-05, -1.2177042663097382e-05, -1.1567026376724243e-05, -1.0957010090351105e-05, -1.0346993803977966e-05, -9.736977517604828e-06, -9.12696123123169e-06, -8.516944944858551e-06, -7.906928658485413e-06, -7.296912372112274e-06, -6.686896085739136e-06, -6.076879799365997e-06, -5.466863512992859e-06, -4.8568472266197205e-06, -4.246830940246582e-06, -3.6368146538734436e-06, -3.026798367500305e-06, -2.4167820811271667e-06, -1.8067657947540283e-06, -1.1967495083808899e-06, -5.867332220077515e-07, 2.3283064365386963e-08, 6.332993507385254e-07, 1.2433156371116638e-06, 1.8533319234848022e-06, 2.4633482098579407e-06, 3.073364496231079e-06, 3.6833807826042175e-06, 4.293397068977356e-06, 4.903413355350494e-06, 5.513429641723633e-06, 6.123445928096771e-06, 6.73346221446991e-06, 7.343478500843048e-06, 7.953494787216187e-06, 8.563511073589325e-06, 9.173527359962463e-06, 9.783543646335602e-06, 1.039355993270874e-05, 1.1003576219081879e-05, 1.1613592505455017e-05, 1.2223608791828156e-05, 1.2833625078201294e-05, 1.3443641364574432e-05, 1.405365765094757e-05, 1.466367393732071e-05, 1.5273690223693848e-05, 1.5883706510066986e-05, 1.6493722796440125e-05, 1.7103739082813263e-05, 1.77137553691864e-05, 1.832377165555954e-05, 1.8933787941932678e-05, 1.9543804228305817e-05, 2.0153820514678955e-05, 2.0763836801052094e-05, 2.1373853087425232e-05, 2.198386937379837e-05, 2.259388566017151e-05, 2.3203901946544647e-05, 2.3813918232917786e-05, 2.4423934519290924e-05, 2.5033950805664062e-05]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 13.0, 7.0, 15.0, 22.0, 39.0, 41.0, 85.0, 120.0, 164.0, 221.0, 377.0, 545.0, 902.0, 1496.0, 2403.0, 3979.0, 7039.0, 14363.0, 28122.0, 65918.0, 325488.0, 3429587.0, 205487.0, 54973.0, 24311.0, 12137.0, 6582.0, 3879.0, 2179.0, 1344.0, 817.0, 530.0, 335.0, 253.0, 155.0, 104.0, 75.0, 52.0, 30.0, 20.0, 19.0, 19.0, 7.0, 8.0, 9.0, 1.0, 4.0, 1.0, 5.0], "bins": [-3.4928321838378906e-05, -3.396905958652496e-05, -3.300979733467102e-05, -3.205053508281708e-05, -3.1091272830963135e-05, -3.0132010579109192e-05, -2.917274832725525e-05, -2.8213486075401306e-05, -2.7254223823547363e-05, -2.629496157169342e-05, -2.5335699319839478e-05, -2.4376437067985535e-05, -2.3417174816131592e-05, -2.245791256427765e-05, -2.1498650312423706e-05, -2.0539388060569763e-05, -1.958012580871582e-05, -1.8620863556861877e-05, -1.7661601305007935e-05, -1.6702339053153992e-05, -1.574307680130005e-05, -1.4783814549446106e-05, -1.3824552297592163e-05, -1.286529004573822e-05, -1.1906027793884277e-05, -1.0946765542030334e-05, -9.987503290176392e-06, -9.028241038322449e-06, -8.068978786468506e-06, -7.109716534614563e-06, -6.15045428276062e-06, -5.191192030906677e-06, -4.231929779052734e-06, -3.2726675271987915e-06, -2.3134052753448486e-06, -1.3541430234909058e-06, -3.948807716369629e-07, 5.6438148021698e-07, 1.5236437320709229e-06, 2.4829059839248657e-06, 3.4421682357788086e-06, 4.4014304876327515e-06, 5.360692739486694e-06, 6.319954991340637e-06, 7.27921724319458e-06, 8.238479495048523e-06, 9.197741746902466e-06, 1.0157003998756409e-05, 1.1116266250610352e-05, 1.2075528502464294e-05, 1.3034790754318237e-05, 1.399405300617218e-05, 1.4953315258026123e-05, 1.5912577509880066e-05, 1.687183976173401e-05, 1.783110201358795e-05, 1.8790364265441895e-05, 1.9749626517295837e-05, 2.070888876914978e-05, 2.1668151021003723e-05, 2.2627413272857666e-05, 2.358667552471161e-05, 2.4545937776565552e-05, 2.5505200028419495e-05, 2.6464462280273438e-05]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 7.0, 15.0, 18.0, 11.0, 9.0, 17.0, 31.0, 35.0, 33.0, 47.0, 84.0, 171.0, 464.0, 1218.0, 973.0, 457.0, 141.0, 63.0, 43.0, 34.0, 42.0, 18.0, 24.0, 13.0, 16.0, 6.0, 17.0, 5.0, 7.0, 7.0, 9.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.7179718017578125e-05, -2.6377849280834198e-05, -2.557598054409027e-05, -2.4774111807346344e-05, -2.3972243070602417e-05, -2.317037433385849e-05, -2.2368505597114563e-05, -2.1566636860370636e-05, -2.076476812362671e-05, -1.9962899386882782e-05, -1.9161030650138855e-05, -1.8359161913394928e-05, -1.7557293176651e-05, -1.6755424439907074e-05, -1.5953555703163147e-05, -1.515168696641922e-05, -1.4349818229675293e-05, -1.3547949492931366e-05, -1.2746080756187439e-05, -1.1944212019443512e-05, -1.1142343282699585e-05, -1.0340474545955658e-05, -9.538605809211731e-06, -8.736737072467804e-06, -7.934868335723877e-06, -7.13299959897995e-06, -6.331130862236023e-06, -5.529262125492096e-06, -4.727393388748169e-06, -3.925524652004242e-06, -3.123655915260315e-06, -2.321787178516388e-06, -1.519918441772461e-06, -7.180497050285339e-07, 8.381903171539307e-08, 8.856877684593201e-07, 1.687556505203247e-06, 2.489425241947174e-06, 3.291293978691101e-06, 4.093162715435028e-06, 4.895031452178955e-06, 5.696900188922882e-06, 6.498768925666809e-06, 7.300637662410736e-06, 8.102506399154663e-06, 8.90437513589859e-06, 9.706243872642517e-06, 1.0508112609386444e-05, 1.1309981346130371e-05, 1.2111850082874298e-05, 1.2913718819618225e-05, 1.3715587556362152e-05, 1.4517456293106079e-05, 1.5319325029850006e-05, 1.6121193766593933e-05, 1.692306250333786e-05, 1.7724931240081787e-05, 1.8526799976825714e-05, 1.932866871356964e-05, 2.0130537450313568e-05, 2.0932406187057495e-05, 2.1734274923801422e-05, 2.253614366054535e-05, 2.3338012397289276e-05, 2.4139881134033203e-05]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 13.0, 16.0, 23.0, 34.0, 38.0, 52.0, 76.0, 130.0, 176.0, 135.0, 92.0, 49.0, 36.0, 33.0, 22.0, 23.0, 13.0, 5.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015494637773372233, -0.00014970886695664376, -0.0001444713561795652, -0.0001392338308505714, -0.00013399632007349283, -0.00012875880929641426, -0.0001235212985193357, -0.00011828378774225712, -0.00011304626968922094, -0.00010780875891214237, -0.00010257124085910618, -9.733373008202761e-05, -9.209621930494905e-05, -8.685870125191286e-05, -8.162119047483429e-05, -7.638367242179811e-05, -7.114616164471954e-05, -6.590865086764097e-05, -6.067113281460479e-05, -5.543362203752622e-05, -5.0196107622468844e-05, -4.495859320741147e-05, -3.97210824303329e-05, -3.448356801527552e-05, -2.9246053600218147e-05, -2.400853918516077e-05, -1.87710265890928e-05, -1.3533513993024826e-05, -8.29599957796745e-06, -3.058485162910074e-06, 2.179025614168495e-06, 7.416540029225871e-06, 1.2654054444283247e-05, 1.7891568859340623e-05, 2.3129081455408596e-05, 2.8366594051476568e-05, 3.3604108466533944e-05, 3.884162288159132e-05, 4.407913365866989e-05, 4.9316648073727265e-05, 5.455416248878464e-05, 5.979167690384202e-05, 6.502919131889939e-05, 7.026670209597796e-05, 7.550421287305653e-05, 8.074173092609271e-05, 8.597924170317128e-05, 9.121675975620747e-05, 9.645427053328604e-05, 0.0001016917813103646, 0.00010692929936340079, 0.00011216681014047936, 0.00011740432819351554, 0.0001226418389705941, 0.00012787934974767268, 0.00013311686052475125, 0.00013835437130182981, 0.00014359188207890838, 0.00014882939285598695, 0.00015406691818498075, 0.00015930442896205932, 0.0001645419397391379, 0.00016977945051621646, 0.00017501696129329503, 0.00018025448662228882]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 2.0, 14.0, 13.0, 13.0, 12.0, 21.0, 35.0, 41.0, 33.0, 28.0, 46.0, 45.0, 51.0, 56.0, 66.0, 64.0, 57.0, 54.0, 52.0, 41.0, 51.0, 27.0, 33.0, 34.0, 28.0, 25.0, 14.0, 20.0, 5.0, 1.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.916854858398438e-05, -8.638110011816025e-05, -8.359365165233612e-05, -8.0806203186512e-05, -7.801875472068787e-05, -7.523130625486374e-05, -7.244385778903961e-05, -6.965640932321548e-05, -6.686896085739136e-05, -6.408151239156723e-05, -6.12940639257431e-05, -5.8506615459918976e-05, -5.571916699409485e-05, -5.293171852827072e-05, -5.0144270062446594e-05, -4.735682159662247e-05, -4.456937313079834e-05, -4.178192466497421e-05, -3.8994476199150085e-05, -3.620702773332596e-05, -3.341957926750183e-05, -3.0632130801677704e-05, -2.7844682335853577e-05, -2.505723387002945e-05, -2.2269785404205322e-05, -1.9482336938381195e-05, -1.6694888472557068e-05, -1.390744000673294e-05, -1.1119991540908813e-05, -8.332543075084686e-06, -5.545094609260559e-06, -2.757646143436432e-06, 2.9802322387695312e-08, 2.8172507882118225e-06, 5.60469925403595e-06, 8.392147719860077e-06, 1.1179596185684204e-05, 1.3967044651508331e-05, 1.675449311733246e-05, 1.9541941583156586e-05, 2.2329390048980713e-05, 2.511683851480484e-05, 2.7904286980628967e-05, 3.0691735446453094e-05, 3.347918391227722e-05, 3.626663237810135e-05, 3.9054080843925476e-05, 4.18415293097496e-05, 4.462897777557373e-05, 4.741642624139786e-05, 5.0203874707221985e-05, 5.299132317304611e-05, 5.577877163887024e-05, 5.8566220104694366e-05, 6.13536685705185e-05, 6.414111703634262e-05, 6.692856550216675e-05, 6.971601396799088e-05, 7.2503462433815e-05, 7.529091089963913e-05, 7.807835936546326e-05, 8.086580783128738e-05, 8.365325629711151e-05, 8.644070476293564e-05, 8.922815322875977e-05]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 8.0, 7.0, 21.0, 17.0, 13.0, 20.0, 32.0, 33.0, 56.0, 90.0, 134.0, 200.0, 299.0, 571.0, 1107.0, 2106.0, 4412.0, 10525.0, 26764.0, 82465.0, 382084.0, 408589.0, 82475.0, 26803.0, 10292.0, 4609.0, 2197.0, 1128.0, 549.0, 326.0, 192.0, 127.0, 76.0, 57.0, 37.0, 22.0, 21.0, 19.0, 13.0, 8.0, 10.0, 10.0, 10.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-9.548664093017578e-05, -9.275879710912704e-05, -9.003095328807831e-05, -8.730310946702957e-05, -8.457526564598083e-05, -8.18474218249321e-05, -7.911957800388336e-05, -7.639173418283463e-05, -7.366389036178589e-05, -7.093604654073715e-05, -6.820820271968842e-05, -6.548035889863968e-05, -6.275251507759094e-05, -6.0024671256542206e-05, -5.729682743549347e-05, -5.456898361444473e-05, -5.1841139793395996e-05, -4.911329597234726e-05, -4.638545215129852e-05, -4.3657608330249786e-05, -4.092976450920105e-05, -3.820192068815231e-05, -3.547407686710358e-05, -3.274623304605484e-05, -3.0018389225006104e-05, -2.7290545403957367e-05, -2.456270158290863e-05, -2.1834857761859894e-05, -1.9107013940811157e-05, -1.637917011976242e-05, -1.3651326298713684e-05, -1.0923482477664948e-05, -8.195638656616211e-06, -5.467794835567474e-06, -2.739951014518738e-06, -1.210719347000122e-08, 2.7157366275787354e-06, 5.443580448627472e-06, 8.171424269676208e-06, 1.0899268090724945e-05, 1.3627111911773682e-05, 1.6354955732822418e-05, 1.9082799553871155e-05, 2.181064337491989e-05, 2.4538487195968628e-05, 2.7266331017017365e-05, 2.99941748380661e-05, 3.272201865911484e-05, 3.5449862480163574e-05, 3.817770630121231e-05, 4.090555012226105e-05, 4.3633393943309784e-05, 4.636123776435852e-05, 4.908908158540726e-05, 5.1816925406455994e-05, 5.454476922750473e-05, 5.727261304855347e-05, 6.00004568696022e-05, 6.272830069065094e-05, 6.545614451169968e-05, 6.818398833274841e-05, 7.091183215379715e-05, 7.363967597484589e-05, 7.636751979589462e-05, 7.909536361694336e-05]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 12.0, 9.0, 8.0, 26.0, 32.0, 65.0, 73.0, 93.0, 91.0, 134.0, 104.0, 94.0, 78.0, 64.0, 30.0, 27.0, 19.0, 12.0, 11.0, 6.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3066997528076172e-05, -2.2291205823421478e-05, -2.1515414118766785e-05, -2.073962241411209e-05, -1.9963830709457397e-05, -1.9188039004802704e-05, -1.841224730014801e-05, -1.7636455595493317e-05, -1.6860663890838623e-05, -1.608487218618393e-05, -1.5309080481529236e-05, -1.4533288776874542e-05, -1.3757497072219849e-05, -1.2981705367565155e-05, -1.2205913662910461e-05, -1.1430121958255768e-05, -1.0654330253601074e-05, -9.87853854894638e-06, -9.102746844291687e-06, -8.326955139636993e-06, -7.5511634349823e-06, -6.775371730327606e-06, -5.999580025672913e-06, -5.223788321018219e-06, -4.447996616363525e-06, -3.6722049117088318e-06, -2.896413207054138e-06, -2.1206215023994446e-06, -1.344829797744751e-06, -5.690380930900574e-07, 2.0675361156463623e-07, 9.825453162193298e-07, 1.7583370208740234e-06, 2.534128725528717e-06, 3.3099204301834106e-06, 4.085712134838104e-06, 4.861503839492798e-06, 5.6372955441474915e-06, 6.413087248802185e-06, 7.188878953456879e-06, 7.964670658111572e-06, 8.740462362766266e-06, 9.51625406742096e-06, 1.0292045772075653e-05, 1.1067837476730347e-05, 1.184362918138504e-05, 1.2619420886039734e-05, 1.3395212590694427e-05, 1.4171004295349121e-05, 1.4946796000003815e-05, 1.5722587704658508e-05, 1.6498379409313202e-05, 1.7274171113967896e-05, 1.804996281862259e-05, 1.8825754523277283e-05, 1.9601546227931976e-05, 2.037733793258667e-05, 2.1153129637241364e-05, 2.1928921341896057e-05, 2.270471304655075e-05, 2.3480504751205444e-05, 2.4256296455860138e-05, 2.503208816051483e-05, 2.5807879865169525e-05, 2.658367156982422e-05]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 14.0, 18.0, 20.0, 33.0, 45.0, 74.0, 106.0, 141.0, 198.0, 333.0, 413.0, 675.0, 983.0, 1590.0, 2114.0, 3558.0, 5055.0, 8765.0, 12639.0, 23107.0, 36620.0, 75202.0, 154866.0, 418007.0, 141280.0, 70350.0, 34288.0, 22276.0, 12260.0, 8432.0, 4919.0, 3415.0, 2156.0, 1587.0, 942.0, 649.0, 472.0, 301.0, 188.0, 143.0, 101.0, 71.0, 40.0, 34.0, 23.0, 13.0, 11.0, 11.0, 5.0, 0.0, 3.0, 2.0, 3.0], "bins": [-2.3603439331054688e-05, -2.2917985916137695e-05, -2.2232532501220703e-05, -2.154707908630371e-05, -2.086162567138672e-05, -2.0176172256469727e-05, -1.9490718841552734e-05, -1.8805265426635742e-05, -1.811981201171875e-05, -1.7434358596801758e-05, -1.6748905181884766e-05, -1.6063451766967773e-05, -1.537799835205078e-05, -1.4692544937133789e-05, -1.4007091522216797e-05, -1.3321638107299805e-05, -1.2636184692382812e-05, -1.195073127746582e-05, -1.1265277862548828e-05, -1.0579824447631836e-05, -9.894371032714844e-06, -9.208917617797852e-06, -8.52346420288086e-06, -7.838010787963867e-06, -7.152557373046875e-06, -6.467103958129883e-06, -5.781650543212891e-06, -5.0961971282958984e-06, -4.410743713378906e-06, -3.725290298461914e-06, -3.039836883544922e-06, -2.3543834686279297e-06, -1.6689300537109375e-06, -9.834766387939453e-07, -2.980232238769531e-07, 3.8743019104003906e-07, 1.0728836059570312e-06, 1.7583370208740234e-06, 2.4437904357910156e-06, 3.129243850708008e-06, 3.814697265625e-06, 4.500150680541992e-06, 5.185604095458984e-06, 5.8710575103759766e-06, 6.556510925292969e-06, 7.241964340209961e-06, 7.927417755126953e-06, 8.612871170043945e-06, 9.298324584960938e-06, 9.98377799987793e-06, 1.0669231414794922e-05, 1.1354684829711914e-05, 1.2040138244628906e-05, 1.2725591659545898e-05, 1.341104507446289e-05, 1.4096498489379883e-05, 1.4781951904296875e-05, 1.5467405319213867e-05, 1.615285873413086e-05, 1.683831214904785e-05, 1.7523765563964844e-05, 1.8209218978881836e-05, 1.8894672393798828e-05, 1.958012580871582e-05, 2.0265579223632812e-05]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 13.0, 7.0, 9.0, 12.0, 12.0, 14.0, 13.0, 21.0, 24.0, 24.0, 30.0, 29.0, 38.0, 47.0, 46.0, 41.0, 41.0, 41.0, 56.0, 35.0, 42.0, 36.0, 43.0, 34.0, 36.0, 31.0, 28.0, 23.0, 22.0, 21.0, 18.0, 23.0, 20.0, 12.0, 8.0, 10.0, 10.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.7477741241455078e-05, -2.667214721441269e-05, -2.58665531873703e-05, -2.506095916032791e-05, -2.4255365133285522e-05, -2.3449771106243134e-05, -2.2644177079200745e-05, -2.1838583052158356e-05, -2.1032989025115967e-05, -2.0227394998073578e-05, -1.942180097103119e-05, -1.86162069439888e-05, -1.781061291694641e-05, -1.7005018889904022e-05, -1.6199424862861633e-05, -1.5393830835819244e-05, -1.4588236808776855e-05, -1.3782642781734467e-05, -1.2977048754692078e-05, -1.2171454727649689e-05, -1.13658607006073e-05, -1.0560266673564911e-05, -9.754672646522522e-06, -8.949078619480133e-06, -8.143484592437744e-06, -7.337890565395355e-06, -6.532296538352966e-06, -5.726702511310577e-06, -4.9211084842681885e-06, -4.1155144572257996e-06, -3.3099204301834106e-06, -2.5043264031410217e-06, -1.6987323760986328e-06, -8.931383490562439e-07, -8.754432201385498e-08, 7.180497050285339e-07, 1.5236437320709229e-06, 2.3292377591133118e-06, 3.1348317861557007e-06, 3.94042581319809e-06, 4.7460198402404785e-06, 5.5516138672828674e-06, 6.357207894325256e-06, 7.162801921367645e-06, 7.968395948410034e-06, 8.773989975452423e-06, 9.579584002494812e-06, 1.0385178029537201e-05, 1.119077205657959e-05, 1.1996366083621979e-05, 1.2801960110664368e-05, 1.3607554137706757e-05, 1.4413148164749146e-05, 1.5218742191791534e-05, 1.6024336218833923e-05, 1.6829930245876312e-05, 1.76355242729187e-05, 1.844111829996109e-05, 1.924671232700348e-05, 2.0052306354045868e-05, 2.0857900381088257e-05, 2.1663494408130646e-05, 2.2469088435173035e-05, 2.3274682462215424e-05, 2.4080276489257812e-05]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 5.0, 13.0, 9.0, 32.0, 29.0, 45.0, 68.0, 113.0, 175.0, 296.0, 524.0, 1024.0, 1815.0, 4970.0, 17373.0, 195898.0, 782329.0, 31384.0, 7133.0, 2579.0, 1168.0, 616.0, 353.0, 188.0, 143.0, 73.0, 61.0, 36.0, 25.0, 18.0, 19.0, 8.0, 6.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.8125399947166443e-05, -1.759454607963562e-05, -1.7063692212104797e-05, -1.6532838344573975e-05, -1.6001984477043152e-05, -1.547113060951233e-05, -1.4940276741981506e-05, -1.4409422874450684e-05, -1.387856900691986e-05, -1.3347715139389038e-05, -1.2816861271858215e-05, -1.2286007404327393e-05, -1.175515353679657e-05, -1.1224299669265747e-05, -1.0693445801734924e-05, -1.0162591934204102e-05, -9.631738066673279e-06, -9.100884199142456e-06, -8.570030331611633e-06, -8.03917646408081e-06, -7.508322596549988e-06, -6.977468729019165e-06, -6.446614861488342e-06, -5.9157609939575195e-06, -5.384907126426697e-06, -4.854053258895874e-06, -4.323199391365051e-06, -3.7923455238342285e-06, -3.2614916563034058e-06, -2.730637788772583e-06, -2.1997839212417603e-06, -1.6689300537109375e-06, -1.1380761861801147e-06, -6.07222318649292e-07, -7.636845111846924e-08, 4.544854164123535e-07, 9.853392839431763e-07, 1.516193151473999e-06, 2.0470470190048218e-06, 2.5779008865356445e-06, 3.1087547540664673e-06, 3.63960862159729e-06, 4.170462489128113e-06, 4.7013163566589355e-06, 5.232170224189758e-06, 5.763024091720581e-06, 6.293877959251404e-06, 6.8247318267822266e-06, 7.355585694313049e-06, 7.886439561843872e-06, 8.417293429374695e-06, 8.948147296905518e-06, 9.47900116443634e-06, 1.0009855031967163e-05, 1.0540708899497986e-05, 1.1071562767028809e-05, 1.1602416634559631e-05, 1.2133270502090454e-05, 1.2664124369621277e-05, 1.31949782371521e-05, 1.3725832104682922e-05, 1.4256685972213745e-05, 1.4787539839744568e-05, 1.531839370727539e-05]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 0.0, 3.0, 0.0, 11.0, 10.0, 0.0, 15.0, 0.0, 28.0, 41.0, 0.0, 44.0, 0.0, 86.0, 84.0, 0.0, 110.0, 0.0, 123.0, 0.0, 115.0, 86.0, 0.0, 67.0, 0.0, 54.0, 40.0, 0.0, 28.0, 0.0, 17.0, 9.0, 0.0, 14.0, 0.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.037493348121643e-06, -1.0021030902862549e-06, -9.667128324508667e-07, -9.313225746154785e-07, -8.959323167800903e-07, -8.605420589447021e-07, -8.25151801109314e-07, -7.897615432739258e-07, -7.543712854385376e-07, -7.189810276031494e-07, -6.835907697677612e-07, -6.48200511932373e-07, -6.128102540969849e-07, -5.774199962615967e-07, -5.420297384262085e-07, -5.066394805908203e-07, -4.7124922275543213e-07, -4.3585896492004395e-07, -4.0046870708465576e-07, -3.650784492492676e-07, -3.296881914138794e-07, -2.942979335784912e-07, -2.5890767574310303e-07, -2.2351741790771484e-07, -1.8812716007232666e-07, -1.5273690223693848e-07, -1.1734664440155029e-07, -8.195638656616211e-08, -4.6566128730773926e-08, -1.1175870895385742e-08, 2.421438694000244e-08, 5.960464477539063e-08, 9.499490261077881e-08, 1.30385160446167e-07, 1.6577541828155518e-07, 2.0116567611694336e-07, 2.3655593395233154e-07, 2.7194619178771973e-07, 3.073364496231079e-07, 3.427267074584961e-07, 3.781169652938843e-07, 4.1350722312927246e-07, 4.4889748096466064e-07, 4.842877388000488e-07, 5.19677996635437e-07, 5.550682544708252e-07, 5.904585123062134e-07, 6.258487701416016e-07, 6.612390279769897e-07, 6.966292858123779e-07, 7.320195436477661e-07, 7.674098014831543e-07, 8.028000593185425e-07, 8.381903171539307e-07, 8.735805749893188e-07, 9.08970832824707e-07, 9.443610906600952e-07, 9.797513484954834e-07, 1.0151416063308716e-06, 1.0505318641662598e-06, 1.085922122001648e-06, 1.1213123798370361e-06, 1.1567026376724243e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 4.0, 17.0, 27.0, 29.0, 52.0, 44.0, 86.0, 150.0, 113.0, 287.0, 433.0, 330.0, 820.0, 1365.0, 966.0, 2863.0, 5171.0, 4160.0, 14711.0, 13637.0, 60393.0, 233626.0, 369953.0, 233755.0, 60404.0, 13518.0, 14822.0, 7050.0, 2172.0, 2849.0, 995.0, 1308.0, 859.0, 308.0, 452.0, 295.0, 108.0, 144.0, 98.0, 37.0, 44.0, 27.0, 10.0, 18.0, 8.0, 12.0, 12.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-06, -2.882443368434906e-06, -2.7846544981002808e-06, -2.6868656277656555e-06, -2.5890767574310303e-06, -2.491287887096405e-06, -2.3934990167617798e-06, -2.2957101464271545e-06, -2.1979212760925293e-06, -2.100132405757904e-06, -2.002343535423279e-06, -1.9045546650886536e-06, -1.8067657947540283e-06, -1.708976924419403e-06, -1.6111880540847778e-06, -1.5133991837501526e-06, -1.4156103134155273e-06, -1.317821443080902e-06, -1.2200325727462769e-06, -1.1222437024116516e-06, -1.0244548320770264e-06, -9.266659617424011e-07, -8.288770914077759e-07, -7.310882210731506e-07, -6.332993507385254e-07, -5.355104804039001e-07, -4.377216100692749e-07, -3.3993273973464966e-07, -2.421438694000244e-07, -1.4435499906539917e-07, -4.6566128730773926e-08, 5.122274160385132e-08, 1.4901161193847656e-07, 2.468004822731018e-07, 3.4458935260772705e-07, 4.423782229423523e-07, 5.401670932769775e-07, 6.379559636116028e-07, 7.35744833946228e-07, 8.335337042808533e-07, 9.313225746154785e-07, 1.0291114449501038e-06, 1.126900315284729e-06, 1.2246891856193542e-06, 1.3224780559539795e-06, 1.4202669262886047e-06, 1.51805579662323e-06, 1.6158446669578552e-06, 1.7136335372924805e-06, 1.8114224076271057e-06, 1.909211277961731e-06, 2.007000148296356e-06, 2.1047890186309814e-06, 2.2025778889656067e-06, 2.300366759300232e-06, 2.398155629634857e-06, 2.4959444999694824e-06, 2.5937333703041077e-06, 2.691522240638733e-06, 2.789311110973358e-06, 2.8870999813079834e-06, 2.9848888516426086e-06, 3.082677721977234e-06, 3.180466592311859e-06, 3.2782554626464844e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 9.0, 3.0, 9.0, 14.0, 14.0, 6.0, 20.0, 26.0, 27.0, 46.0, 62.0, 44.0, 87.0, 94.0, 109.0, 34.0, 93.0, 65.0, 25.0, 47.0, 54.0, 29.0, 10.0, 11.0, 13.0, 4.0, 9.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-06, -2.878718078136444e-06, -2.777203917503357e-06, -2.6756897568702698e-06, -2.5741755962371826e-06, -2.4726614356040955e-06, -2.3711472749710083e-06, -2.269633114337921e-06, -2.168118953704834e-06, -2.066604793071747e-06, -1.9650906324386597e-06, -1.8635764718055725e-06, -1.7620623111724854e-06, -1.6605481505393982e-06, -1.559033989906311e-06, -1.4575198292732239e-06, -1.3560056686401367e-06, -1.2544915080070496e-06, -1.1529773473739624e-06, -1.0514631867408752e-06, -9.499490261077881e-07, -8.484348654747009e-07, -7.469207048416138e-07, -6.454065442085266e-07, -5.438923835754395e-07, -4.423782229423523e-07, -3.4086406230926514e-07, -2.39349901676178e-07, -1.3783574104309082e-07, -3.632158041000366e-08, 6.51925802230835e-08, 1.6670674085617065e-07, 2.682209014892578e-07, 3.6973506212234497e-07, 4.7124922275543213e-07, 5.727633833885193e-07, 6.742775440216064e-07, 7.757917046546936e-07, 8.773058652877808e-07, 9.78820025920868e-07, 1.080334186553955e-06, 1.1818483471870422e-06, 1.2833625078201294e-06, 1.3848766684532166e-06, 1.4863908290863037e-06, 1.5879049897193909e-06, 1.689419150352478e-06, 1.7909333109855652e-06, 1.8924474716186523e-06, 1.9939616322517395e-06, 2.0954757928848267e-06, 2.196989953517914e-06, 2.298504114151001e-06, 2.400018274784088e-06, 2.5015324354171753e-06, 2.6030465960502625e-06, 2.7045607566833496e-06, 2.8060749173164368e-06, 2.907589077949524e-06, 3.009103238582611e-06, 3.1106173992156982e-06, 3.2121315598487854e-06, 3.3136457204818726e-06, 3.4151598811149597e-06, 3.516674041748047e-06]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 7.0, 20.0, 17.0, 20.0, 21.0, 40.0, 47.0, 72.0, 104.0, 124.0, 124.0, 82.0, 80.0, 48.0, 38.0, 26.0, 16.0, 21.0, 13.0, 10.0, 8.0, 6.0, 7.0, 7.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8428237834014e-05, -9.537742880638689e-05, -9.232662705471739e-05, -8.927581802709028e-05, -8.622501627542078e-05, -8.317420724779367e-05, -8.012339822016656e-05, -7.707258919253945e-05, -7.402178744086996e-05, -7.097097841324285e-05, -6.792017666157335e-05, -6.486936763394624e-05, -6.181855860631913e-05, -5.876775685464963e-05, -5.571694782702252e-05, -5.266614243737422e-05, -4.9615337047725916e-05, -4.656453165807761e-05, -4.351372626842931e-05, -4.04629172408022e-05, -3.7412111851153895e-05, -3.436130646150559e-05, -3.131049743387848e-05, -2.8259692044230178e-05, -2.5208886654581875e-05, -2.215808126493357e-05, -1.9107274056295864e-05, -1.6056466847658157e-05, -1.3005661458009854e-05, -9.954855158866849e-06, -6.904048859723844e-06, -3.853241651086137e-06, -8.024362614378333e-07, 2.248370037705172e-06, 5.299176336848177e-06, 8.349982635991182e-06, 1.1400788935134187e-05, 1.4451595234277193e-05, 1.7502401533420198e-05, 2.0553208742057905e-05, 2.3604014131706208e-05, 2.665481952135451e-05, 2.970562672999222e-05, 3.2756433938629925e-05, 3.580723932827823e-05, 3.885804471792653e-05, 4.190885374555364e-05, 4.4959659135201946e-05, 4.801046452485025e-05, 5.106126991449855e-05, 5.4112075304146856e-05, 5.7162884331773967e-05, 6.021368972142227e-05, 6.326449511107057e-05, 6.631530413869768e-05, 6.93661131663248e-05, 7.241691491799429e-05, 7.54677239456214e-05, 7.85185256972909e-05, 8.156933472491801e-05, 8.462014375254512e-05, 8.767094550421461e-05, 9.072175453184173e-05, 9.377255628351122e-05, 9.682336531113833e-05]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 11.0, 9.0, 10.0, 18.0, 16.0, 32.0, 31.0, 31.0, 34.0, 37.0, 47.0, 47.0, 55.0, 59.0, 46.0, 53.0, 60.0, 57.0, 45.0, 36.0, 40.0, 47.0, 24.0, 33.0, 25.0, 24.0, 12.0, 10.0, 13.0, 4.0, 6.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.259845733642578e-05, -7.012113928794861e-05, -6.764382123947144e-05, -6.516650319099426e-05, -6.268918514251709e-05, -6.021186709403992e-05, -5.7734549045562744e-05, -5.525723099708557e-05, -5.27799129486084e-05, -5.0302594900131226e-05, -4.782527685165405e-05, -4.534795880317688e-05, -4.287064075469971e-05, -4.0393322706222534e-05, -3.791600465774536e-05, -3.543868660926819e-05, -3.2961368560791016e-05, -3.0484050512313843e-05, -2.800673246383667e-05, -2.5529414415359497e-05, -2.3052096366882324e-05, -2.057477831840515e-05, -1.809746026992798e-05, -1.5620142221450806e-05, -1.3142824172973633e-05, -1.066550612449646e-05, -8.188188076019287e-06, -5.710870027542114e-06, -3.2335519790649414e-06, -7.562339305877686e-07, 1.7210841178894043e-06, 4.198402166366577e-06, 6.67572021484375e-06, 9.153038263320923e-06, 1.1630356311798096e-05, 1.4107674360275269e-05, 1.658499240875244e-05, 1.9062310457229614e-05, 2.1539628505706787e-05, 2.401694655418396e-05, 2.6494264602661133e-05, 2.8971582651138306e-05, 3.144890069961548e-05, 3.392621874809265e-05, 3.6403536796569824e-05, 3.8880854845047e-05, 4.135817289352417e-05, 4.383549094200134e-05, 4.6312808990478516e-05, 4.879012703895569e-05, 5.126744508743286e-05, 5.3744763135910034e-05, 5.622208118438721e-05, 5.869939923286438e-05, 6.117671728134155e-05, 6.365403532981873e-05, 6.61313533782959e-05, 6.860867142677307e-05, 7.108598947525024e-05, 7.356330752372742e-05, 7.604062557220459e-05, 7.851794362068176e-05, 8.099526166915894e-05, 8.347257971763611e-05, 8.594989776611328e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 14.0, 13.0, 16.0, 28.0, 40.0, 64.0, 100.0, 160.0, 247.0, 454.0, 734.0, 1263.0, 2409.0, 5014.0, 13724.0, 62173.0, 1516283.0, 2501259.0, 66444.0, 12606.0, 5201.0, 2467.0, 1328.0, 729.0, 477.0, 334.0, 203.0, 119.0, 102.0, 65.0, 60.0, 31.0, 28.0, 22.0, 13.0, 16.0, 9.0, 7.0, 8.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.07099723815918e-05, -3.914814442396164e-05, -3.758631646633148e-05, -3.6024488508701324e-05, -3.446266055107117e-05, -3.290083259344101e-05, -3.133900463581085e-05, -2.9777176678180695e-05, -2.8215348720550537e-05, -2.665352076292038e-05, -2.5091692805290222e-05, -2.3529864847660065e-05, -2.1968036890029907e-05, -2.040620893239975e-05, -1.8844380974769592e-05, -1.7282553017139435e-05, -1.5720725059509277e-05, -1.415889710187912e-05, -1.2597069144248962e-05, -1.1035241186618805e-05, -9.473413228988647e-06, -7.91158527135849e-06, -6.3497573137283325e-06, -4.787929356098175e-06, -3.2261013984680176e-06, -1.6642734408378601e-06, -1.0244548320770264e-07, 1.4593824744224548e-06, 3.0212104320526123e-06, 4.58303838968277e-06, 6.144866347312927e-06, 7.706694304943085e-06, 9.268522262573242e-06, 1.08303502202034e-05, 1.2392178177833557e-05, 1.3954006135463715e-05, 1.5515834093093872e-05, 1.707766205072403e-05, 1.8639490008354187e-05, 2.0201317965984344e-05, 2.1763145923614502e-05, 2.332497388124466e-05, 2.4886801838874817e-05, 2.6448629796504974e-05, 2.8010457754135132e-05, 2.957228571176529e-05, 3.113411366939545e-05, 3.2695941627025604e-05, 3.425776958465576e-05, 3.581959754228592e-05, 3.738142549991608e-05, 3.8943253457546234e-05, 4.050508141517639e-05, 4.206690937280655e-05, 4.3628737330436707e-05, 4.5190565288066864e-05, 4.675239324569702e-05, 4.831422120332718e-05, 4.9876049160957336e-05, 5.1437877118587494e-05, 5.299970507621765e-05, 5.456153303384781e-05, 5.6123360991477966e-05, 5.7685188949108124e-05, 5.924701690673828e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 14.0, 11.0, 13.0, 22.0, 28.0, 43.0, 53.0, 82.0, 81.0, 106.0, 93.0, 95.0, 84.0, 65.0, 42.0, 42.0, 26.0, 20.0, 13.0, 13.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633167266845703e-05, -1.5716999769210815e-05, -1.51023268699646e-05, -1.4487653970718384e-05, -1.3872981071472168e-05, -1.3258308172225952e-05, -1.2643635272979736e-05, -1.202896237373352e-05, -1.1414289474487305e-05, -1.0799616575241089e-05, -1.0184943675994873e-05, -9.570270776748657e-06, -8.955597877502441e-06, -8.340924978256226e-06, -7.72625207901001e-06, -7.111579179763794e-06, -6.496906280517578e-06, -5.882233381271362e-06, -5.2675604820251465e-06, -4.652887582778931e-06, -4.038214683532715e-06, -3.423541784286499e-06, -2.808868885040283e-06, -2.1941959857940674e-06, -1.5795230865478516e-06, -9.648501873016357e-07, -3.501772880554199e-07, 2.644956111907959e-07, 8.791685104370117e-07, 1.4938414096832275e-06, 2.1085143089294434e-06, 2.723187208175659e-06, 3.337860107421875e-06, 3.952533006668091e-06, 4.567205905914307e-06, 5.1818788051605225e-06, 5.796551704406738e-06, 6.411224603652954e-06, 7.02589750289917e-06, 7.640570402145386e-06, 8.255243301391602e-06, 8.869916200637817e-06, 9.484589099884033e-06, 1.0099261999130249e-05, 1.0713934898376465e-05, 1.132860779762268e-05, 1.1943280696868896e-05, 1.2557953596115112e-05, 1.3172626495361328e-05, 1.3787299394607544e-05, 1.440197229385376e-05, 1.5016645193099976e-05, 1.563131809234619e-05, 1.6245990991592407e-05, 1.6860663890838623e-05, 1.747533679008484e-05, 1.8090009689331055e-05, 1.870468258857727e-05, 1.9319355487823486e-05, 1.9934028387069702e-05, 2.0548701286315918e-05, 2.1163374185562134e-05, 2.177804708480835e-05, 2.2392719984054565e-05, 2.300739288330078e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 3.0, 9.0, 5.0, 14.0, 18.0, 14.0, 19.0, 41.0, 47.0, 89.0, 140.0, 156.0, 273.0, 382.0, 613.0, 881.0, 1446.0, 2545.0, 4430.0, 8306.0, 17092.0, 46955.0, 166852.0, 3101650.0, 694250.0, 89502.0, 29712.0, 12969.0, 7022.0, 3410.0, 1947.0, 1197.0, 765.0, 524.0, 319.0, 225.0, 119.0, 101.0, 67.0, 49.0, 35.0, 22.0, 25.0, 10.0, 7.0, 9.0, 5.0, 4.0, 3.0, 5.0], "bins": [-2.7358531951904297e-05, -2.663489431142807e-05, -2.5911256670951843e-05, -2.5187619030475616e-05, -2.446398138999939e-05, -2.3740343749523163e-05, -2.3016706109046936e-05, -2.229306846857071e-05, -2.1569430828094482e-05, -2.0845793187618256e-05, -2.012215554714203e-05, -1.9398517906665802e-05, -1.8674880266189575e-05, -1.795124262571335e-05, -1.722760498523712e-05, -1.6503967344760895e-05, -1.5780329704284668e-05, -1.5056692063808441e-05, -1.4333054423332214e-05, -1.3609416782855988e-05, -1.288577914237976e-05, -1.2162141501903534e-05, -1.1438503861427307e-05, -1.071486622095108e-05, -9.991228580474854e-06, -9.267590939998627e-06, -8.5439532995224e-06, -7.820315659046173e-06, -7.096678018569946e-06, -6.3730403780937195e-06, -5.649402737617493e-06, -4.925765097141266e-06, -4.202127456665039e-06, -3.4784898161888123e-06, -2.7548521757125854e-06, -2.0312145352363586e-06, -1.3075768947601318e-06, -5.83939254283905e-07, 1.3969838619232178e-07, 8.633360266685486e-07, 1.5869736671447754e-06, 2.310611307621002e-06, 3.034248948097229e-06, 3.757886588573456e-06, 4.481524229049683e-06, 5.2051618695259094e-06, 5.928799510002136e-06, 6.652437150478363e-06, 7.37607479095459e-06, 8.099712431430817e-06, 8.823350071907043e-06, 9.54698771238327e-06, 1.0270625352859497e-05, 1.0994262993335724e-05, 1.171790063381195e-05, 1.2441538274288177e-05, 1.3165175914764404e-05, 1.3888813555240631e-05, 1.4612451195716858e-05, 1.5336088836193085e-05, 1.605972647666931e-05, 1.678336411714554e-05, 1.7507001757621765e-05, 1.8230639398097992e-05, 1.895427703857422e-05]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 7.0, 10.0, 7.0, 12.0, 14.0, 16.0, 34.0, 36.0, 57.0, 63.0, 79.0, 188.0, 402.0, 766.0, 1061.0, 592.0, 271.0, 136.0, 83.0, 64.0, 41.0, 23.0, 23.0, 25.0, 14.0, 9.0, 9.0, 6.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2411346435546875e-05, -2.1556392312049866e-05, -2.0701438188552856e-05, -1.9846484065055847e-05, -1.8991529941558838e-05, -1.813657581806183e-05, -1.728162169456482e-05, -1.642666757106781e-05, -1.55717134475708e-05, -1.4716759324073792e-05, -1.3861805200576782e-05, -1.3006851077079773e-05, -1.2151896953582764e-05, -1.1296942830085754e-05, -1.0441988706588745e-05, -9.587034583091736e-06, -8.732080459594727e-06, -7.877126336097717e-06, -7.022172212600708e-06, -6.167218089103699e-06, -5.3122639656066895e-06, -4.45730984210968e-06, -3.602355718612671e-06, -2.7474015951156616e-06, -1.8924474716186523e-06, -1.037493348121643e-06, -1.825392246246338e-07, 6.724148988723755e-07, 1.5273690223693848e-06, 2.382323145866394e-06, 3.2372772693634033e-06, 4.092231392860413e-06, 4.947185516357422e-06, 5.802139639854431e-06, 6.6570937633514404e-06, 7.51204788684845e-06, 8.367002010345459e-06, 9.221956133842468e-06, 1.0076910257339478e-05, 1.0931864380836487e-05, 1.1786818504333496e-05, 1.2641772627830505e-05, 1.3496726751327515e-05, 1.4351680874824524e-05, 1.5206634998321533e-05, 1.6061589121818542e-05, 1.6916543245315552e-05, 1.777149736881256e-05, 1.862645149230957e-05, 1.948140561580658e-05, 2.033635973930359e-05, 2.1191313862800598e-05, 2.2046267986297607e-05, 2.2901222109794617e-05, 2.3756176233291626e-05, 2.4611130356788635e-05, 2.5466084480285645e-05, 2.6321038603782654e-05, 2.7175992727279663e-05, 2.8030946850776672e-05, 2.888590097427368e-05, 2.974085509777069e-05, 3.05958092212677e-05, 3.145076334476471e-05, 3.230571746826172e-05]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 2.0, 6.0, 8.0, 12.0, 9.0, 16.0, 31.0, 42.0, 55.0, 108.0, 130.0, 131.0, 103.0, 84.0, 55.0, 46.0, 31.0, 26.0, 24.0, 19.0, 14.0, 9.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011551639181561768, -0.00010982259846059605, -0.00010412880510557443, -9.84350117505528e-05, -9.274121839553118e-05, -8.704742504050955e-05, -8.135363168548793e-05, -7.565984560642391e-05, -6.996604497544467e-05, -6.427225162042305e-05, -5.857845826540142e-05, -5.28846649103798e-05, -4.719087155535817e-05, -4.1497078200336546e-05, -3.580328848329373e-05, -3.01094951282721e-05, -2.4415705411229283e-05, -1.8721912056207657e-05, -1.3028119610680733e-05, -7.334327165153809e-06, -1.6405338101321831e-06, 4.053259544889443e-06, 9.747051080921665e-06, 1.544084443594329e-05, 2.1134637790964916e-05, 2.6828431145986542e-05, 3.252222450100817e-05, 3.8216014218050987e-05, 4.390980757307261e-05, 4.960360092809424e-05, 5.5297394283115864e-05, 6.099118763813749e-05, 6.668498099315912e-05, 7.237877434818074e-05, 7.807256770320237e-05, 8.376636105822399e-05, 8.946015441324562e-05, 9.515394776826724e-05, 0.00010084774112328887, 0.00010654152720235288, 0.00011223532783333212, 0.00011792912118835375, 0.00012362291454337537, 0.00012931670062243938, 0.00013501050125341862, 0.00014070428733248264, 0.00014639808796346188, 0.0001520918740425259, 0.0001577856601215899, 0.0001634794462006539, 0.00016917324683163315, 0.00017486703291069716, 0.0001805608335416764, 0.00018625461962074041, 0.00019194842025171965, 0.00019764220633078367, 0.0002033360069617629, 0.00020902979304082692, 0.00021472359367180616, 0.00022041737975087017, 0.0002261111803818494, 0.00023180496646091342, 0.00023749876709189266, 0.00024319255317095667, 0.0002488863538019359]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 6.0, 10.0, 8.0, 6.0, 19.0, 10.0, 24.0, 27.0, 25.0, 28.0, 37.0, 23.0, 42.0, 37.0, 40.0, 46.0, 51.0, 42.0, 46.0, 58.0, 52.0, 44.0, 35.0, 31.0, 20.0, 46.0, 26.0, 19.0, 22.0, 26.0, 22.0, 12.0, 16.0, 12.0, 4.0, 6.0, 6.0, 6.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.088350296020508e-05, -7.843878120183945e-05, -7.599405944347382e-05, -7.354933768510818e-05, -7.110461592674255e-05, -6.865989416837692e-05, -6.621517241001129e-05, -6.377045065164566e-05, -6.132572889328003e-05, -5.88810071349144e-05, -5.643628537654877e-05, -5.3991563618183136e-05, -5.1546841859817505e-05, -4.9102120101451874e-05, -4.665739834308624e-05, -4.421267658472061e-05, -4.176795482635498e-05, -3.932323306798935e-05, -3.687851130962372e-05, -3.443378955125809e-05, -3.1989067792892456e-05, -2.9544346034526825e-05, -2.7099624276161194e-05, -2.4654902517795563e-05, -2.221018075942993e-05, -1.97654590010643e-05, -1.732073724269867e-05, -1.4876015484333038e-05, -1.2431293725967407e-05, -9.986571967601776e-06, -7.541850209236145e-06, -5.097128450870514e-06, -2.652406692504883e-06, -2.076849341392517e-07, 2.2370368242263794e-06, 4.6817585825920105e-06, 7.126480340957642e-06, 9.571202099323273e-06, 1.2015923857688904e-05, 1.4460645616054535e-05, 1.6905367374420166e-05, 1.9350089132785797e-05, 2.1794810891151428e-05, 2.423953264951706e-05, 2.668425440788269e-05, 2.912897616624832e-05, 3.157369792461395e-05, 3.4018419682979584e-05, 3.6463141441345215e-05, 3.8907863199710846e-05, 4.135258495807648e-05, 4.379730671644211e-05, 4.624202847480774e-05, 4.868675023317337e-05, 5.1131471991539e-05, 5.357619374990463e-05, 5.6020915508270264e-05, 5.8465637266635895e-05, 6.0910359025001526e-05, 6.335508078336716e-05, 6.579980254173279e-05, 6.824452430009842e-05, 7.068924605846405e-05, 7.313396781682968e-05, 7.557868957519531e-05]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 9.0, 7.0, 9.0, 16.0, 20.0, 29.0, 37.0, 59.0, 126.0, 188.0, 352.0, 723.0, 1415.0, 3039.0, 6744.0, 18199.0, 59807.0, 340505.0, 509254.0, 72658.0, 21194.0, 7575.0, 3296.0, 1537.0, 794.0, 409.0, 223.0, 124.0, 77.0, 42.0, 28.0, 17.0, 13.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.165836334228516e-05, -7.911212742328644e-05, -7.656589150428772e-05, -7.4019655585289e-05, -7.147341966629028e-05, -6.892718374729156e-05, -6.638094782829285e-05, -6.383471190929413e-05, -6.128847599029541e-05, -5.874224007129669e-05, -5.6196004152297974e-05, -5.3649768233299255e-05, -5.110353231430054e-05, -4.855729639530182e-05, -4.60110604763031e-05, -4.346482455730438e-05, -4.0918588638305664e-05, -3.8372352719306946e-05, -3.582611680030823e-05, -3.327988088130951e-05, -3.073364496231079e-05, -2.8187409043312073e-05, -2.5641173124313354e-05, -2.3094937205314636e-05, -2.0548701286315918e-05, -1.80024653673172e-05, -1.545622944831848e-05, -1.2909993529319763e-05, -1.0363757610321045e-05, -7.817521691322327e-06, -5.271285772323608e-06, -2.72504985332489e-06, -1.7881393432617188e-07, 2.3674219846725464e-06, 4.913657903671265e-06, 7.459893822669983e-06, 1.0006129741668701e-05, 1.255236566066742e-05, 1.5098601579666138e-05, 1.7644837498664856e-05, 2.0191073417663574e-05, 2.2737309336662292e-05, 2.528354525566101e-05, 2.782978117465973e-05, 3.0376017093658447e-05, 3.2922253012657166e-05, 3.5468488931655884e-05, 3.80147248506546e-05, 4.056096076965332e-05, 4.310719668865204e-05, 4.565343260765076e-05, 4.8199668526649475e-05, 5.074590444564819e-05, 5.329214036464691e-05, 5.583837628364563e-05, 5.838461220264435e-05, 6.0930848121643066e-05, 6.347708404064178e-05, 6.60233199596405e-05, 6.856955587863922e-05, 7.111579179763794e-05, 7.366202771663666e-05, 7.620826363563538e-05, 7.87544995546341e-05, 8.130073547363281e-05]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 8.0, 16.0, 15.0, 32.0, 38.0, 50.0, 62.0, 71.0, 99.0, 129.0, 108.0, 84.0, 79.0, 47.0, 48.0, 27.0, 21.0, 8.0, 13.0, 10.0, 7.0, 5.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.3819895684719086e-05, -1.315586268901825e-05, -1.2491829693317413e-05, -1.1827796697616577e-05, -1.1163763701915741e-05, -1.0499730706214905e-05, -9.835697710514069e-06, -9.171664714813232e-06, -8.507631719112396e-06, -7.84359872341156e-06, -7.179565727710724e-06, -6.515532732009888e-06, -5.8514997363090515e-06, -5.187466740608215e-06, -4.523433744907379e-06, -3.859400749206543e-06, -3.1953677535057068e-06, -2.5313347578048706e-06, -1.8673017621040344e-06, -1.2032687664031982e-06, -5.392357707023621e-07, 1.2479722499847412e-07, 7.888302206993103e-07, 1.4528632164001465e-06, 2.1168962121009827e-06, 2.780929207801819e-06, 3.444962203502655e-06, 4.108995199203491e-06, 4.773028194904327e-06, 5.4370611906051636e-06, 6.101094186306e-06, 6.765127182006836e-06, 7.429160177707672e-06, 8.093193173408508e-06, 8.757226169109344e-06, 9.42125916481018e-06, 1.0085292160511017e-05, 1.0749325156211853e-05, 1.141335815191269e-05, 1.2077391147613525e-05, 1.2741424143314362e-05, 1.3405457139015198e-05, 1.4069490134716034e-05, 1.473352313041687e-05, 1.5397556126117706e-05, 1.6061589121818542e-05, 1.672562211751938e-05, 1.7389655113220215e-05, 1.805368810892105e-05, 1.8717721104621887e-05, 1.9381754100322723e-05, 2.004578709602356e-05, 2.0709820091724396e-05, 2.1373853087425232e-05, 2.2037886083126068e-05, 2.2701919078826904e-05, 2.336595207452774e-05, 2.4029985070228577e-05, 2.4694018065929413e-05, 2.535805106163025e-05, 2.6022084057331085e-05, 2.668611705303192e-05, 2.7350150048732758e-05, 2.8014183044433594e-05]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 10.0, 19.0, 17.0, 22.0, 35.0, 40.0, 85.0, 105.0, 153.0, 233.0, 319.0, 524.0, 798.0, 1188.0, 2043.0, 3584.0, 7869.0, 16791.0, 47358.0, 265551.0, 596248.0, 64982.0, 20628.0, 8747.0, 4458.0, 2592.0, 1394.0, 832.0, 518.0, 431.0, 251.0, 191.0, 126.0, 93.0, 99.0, 49.0, 37.0, 32.0, 23.0, 16.0, 9.0, 10.0, 10.0, 2.0, 1.0, 2.0, 3.0, 3.0], "bins": [-3.4928321838378906e-05, -3.396160900592804e-05, -3.299489617347717e-05, -3.2028183341026306e-05, -3.106147050857544e-05, -3.0094757676124573e-05, -2.9128044843673706e-05, -2.816133201122284e-05, -2.7194619178771973e-05, -2.6227906346321106e-05, -2.526119351387024e-05, -2.4294480681419373e-05, -2.3327767848968506e-05, -2.236105501651764e-05, -2.1394342184066772e-05, -2.0427629351615906e-05, -1.946091651916504e-05, -1.8494203686714172e-05, -1.7527490854263306e-05, -1.656077802181244e-05, -1.5594065189361572e-05, -1.4627352356910706e-05, -1.3660639524459839e-05, -1.2693926692008972e-05, -1.1727213859558105e-05, -1.0760501027107239e-05, -9.793788194656372e-06, -8.827075362205505e-06, -7.860362529754639e-06, -6.893649697303772e-06, -5.926936864852905e-06, -4.9602240324020386e-06, -3.993511199951172e-06, -3.026798367500305e-06, -2.0600855350494385e-06, -1.0933727025985718e-06, -1.2665987014770508e-07, 8.400529623031616e-07, 1.8067657947540283e-06, 2.773478627204895e-06, 3.7401914596557617e-06, 4.706904292106628e-06, 5.673617124557495e-06, 6.640329957008362e-06, 7.6070427894592285e-06, 8.573755621910095e-06, 9.540468454360962e-06, 1.0507181286811829e-05, 1.1473894119262695e-05, 1.2440606951713562e-05, 1.3407319784164429e-05, 1.4374032616615295e-05, 1.5340745449066162e-05, 1.630745828151703e-05, 1.7274171113967896e-05, 1.8240883946418762e-05, 1.920759677886963e-05, 2.0174309611320496e-05, 2.1141022443771362e-05, 2.210773527622223e-05, 2.3074448108673096e-05, 2.4041160941123962e-05, 2.500787377357483e-05, 2.5974586606025696e-05, 2.6941299438476562e-05]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 13.0, 8.0, 13.0, 10.0, 14.0, 22.0, 23.0, 33.0, 34.0, 54.0, 46.0, 46.0, 57.0, 56.0, 62.0, 55.0, 55.0, 57.0, 40.0, 48.0, 31.0, 42.0, 36.0, 27.0, 21.0, 16.0, 15.0, 12.0, 10.0, 5.0, 8.0, 2.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8073787689208984e-05, -2.71722674369812e-05, -2.6270747184753418e-05, -2.5369226932525635e-05, -2.446770668029785e-05, -2.356618642807007e-05, -2.2664666175842285e-05, -2.1763145923614502e-05, -2.086162567138672e-05, -1.9960105419158936e-05, -1.9058585166931152e-05, -1.815706491470337e-05, -1.7255544662475586e-05, -1.6354024410247803e-05, -1.545250415802002e-05, -1.4550983905792236e-05, -1.3649463653564453e-05, -1.274794340133667e-05, -1.1846423149108887e-05, -1.0944902896881104e-05, -1.004338264465332e-05, -9.141862392425537e-06, -8.240342140197754e-06, -7.338821887969971e-06, -6.4373016357421875e-06, -5.535781383514404e-06, -4.634261131286621e-06, -3.732740879058838e-06, -2.8312206268310547e-06, -1.9297003746032715e-06, -1.0281801223754883e-06, -1.2665987014770508e-07, 7.748603820800781e-07, 1.6763806343078613e-06, 2.5779008865356445e-06, 3.4794211387634277e-06, 4.380941390991211e-06, 5.282461643218994e-06, 6.183981895446777e-06, 7.0855021476745605e-06, 7.987022399902344e-06, 8.888542652130127e-06, 9.79006290435791e-06, 1.0691583156585693e-05, 1.1593103408813477e-05, 1.249462366104126e-05, 1.3396143913269043e-05, 1.4297664165496826e-05, 1.519918441772461e-05, 1.6100704669952393e-05, 1.7002224922180176e-05, 1.790374517440796e-05, 1.8805265426635742e-05, 1.9706785678863525e-05, 2.060830593109131e-05, 2.1509826183319092e-05, 2.2411346435546875e-05, 2.3312866687774658e-05, 2.421438694000244e-05, 2.5115907192230225e-05, 2.6017427444458008e-05, 2.691894769668579e-05, 2.7820467948913574e-05, 2.8721988201141357e-05, 2.962350845336914e-05]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 18.0, 14.0, 33.0, 62.0, 101.0, 106.0, 236.0, 415.0, 752.0, 1415.0, 3782.0, 12562.0, 61196.0, 860242.0, 87969.0, 12699.0, 3486.0, 1656.0, 803.0, 410.0, 207.0, 135.0, 91.0, 38.0, 28.0, 31.0, 17.0, 9.0, 5.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.5453435480594635e-05, -1.4992430806159973e-05, -1.4531426131725311e-05, -1.407042145729065e-05, -1.3609416782855988e-05, -1.3148412108421326e-05, -1.2687407433986664e-05, -1.2226402759552002e-05, -1.176539808511734e-05, -1.1304393410682678e-05, -1.0843388736248016e-05, -1.0382384061813354e-05, -9.921379387378693e-06, -9.46037471294403e-06, -8.999370038509369e-06, -8.538365364074707e-06, -8.077360689640045e-06, -7.616356015205383e-06, -7.1553513407707214e-06, -6.6943466663360596e-06, -6.233341991901398e-06, -5.772337317466736e-06, -5.311332643032074e-06, -4.850327968597412e-06, -4.38932329416275e-06, -3.928318619728088e-06, -3.4673139452934265e-06, -3.0063092708587646e-06, -2.5453045964241028e-06, -2.084299921989441e-06, -1.623295247554779e-06, -1.1622905731201172e-06, -7.012858986854553e-07, -2.4028122425079346e-07, 2.207234501838684e-07, 6.817281246185303e-07, 1.1427327990531921e-06, 1.603737473487854e-06, 2.064742147922516e-06, 2.5257468223571777e-06, 2.9867514967918396e-06, 3.4477561712265015e-06, 3.908760845661163e-06, 4.369765520095825e-06, 4.830770194530487e-06, 5.291774868965149e-06, 5.752779543399811e-06, 6.213784217834473e-06, 6.6747888922691345e-06, 7.135793566703796e-06, 7.596798241138458e-06, 8.05780291557312e-06, 8.518807590007782e-06, 8.979812264442444e-06, 9.440816938877106e-06, 9.901821613311768e-06, 1.036282628774643e-05, 1.0823830962181091e-05, 1.1284835636615753e-05, 1.1745840311050415e-05, 1.2206844985485077e-05, 1.2667849659919739e-05, 1.31288543343544e-05, 1.3589859008789062e-05]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 9.0, 12.0, 23.0, 0.0, 35.0, 52.0, 69.0, 78.0, 107.0, 0.0, 132.0, 128.0, 105.0, 77.0, 0.0, 60.0, 37.0, 28.0, 17.0, 8.0, 0.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4407560229301453e-06, -1.391395926475525e-06, -1.3420358300209045e-06, -1.2926757335662842e-06, -1.2433156371116638e-06, -1.1939555406570435e-06, -1.144595444202423e-06, -1.0952353477478027e-06, -1.0458752512931824e-06, -9.96515154838562e-07, -9.471550583839417e-07, -8.977949619293213e-07, -8.484348654747009e-07, -7.990747690200806e-07, -7.497146725654602e-07, -7.003545761108398e-07, -6.509944796562195e-07, -6.016343832015991e-07, -5.522742867469788e-07, -5.029141902923584e-07, -4.5355409383773804e-07, -4.041939973831177e-07, -3.548339009284973e-07, -3.0547380447387695e-07, -2.561137080192566e-07, -2.0675361156463623e-07, -1.5739351511001587e-07, -1.0803341865539551e-07, -5.8673322200775146e-08, -9.313225746154785e-09, 4.0046870708465576e-08, 8.940696716308594e-08, 1.387670636177063e-07, 1.8812716007232666e-07, 2.3748725652694702e-07, 2.868473529815674e-07, 3.3620744943618774e-07, 3.855675458908081e-07, 4.3492764234542847e-07, 4.842877388000488e-07, 5.336478352546692e-07, 5.830079317092896e-07, 6.323680281639099e-07, 6.817281246185303e-07, 7.310882210731506e-07, 7.80448317527771e-07, 8.298084139823914e-07, 8.791685104370117e-07, 9.285286068916321e-07, 9.778887033462524e-07, 1.0272487998008728e-06, 1.0766088962554932e-06, 1.1259689927101135e-06, 1.1753290891647339e-06, 1.2246891856193542e-06, 1.2740492820739746e-06, 1.323409378528595e-06, 1.3727694749832153e-06, 1.4221295714378357e-06, 1.471489667892456e-06, 1.5208497643470764e-06, 1.5702098608016968e-06, 1.6195699572563171e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 4.0, 4.0, 8.0, 8.0, 19.0, 25.0, 23.0, 41.0, 51.0, 64.0, 94.0, 167.0, 207.0, 366.0, 543.0, 1018.0, 2313.0, 4713.0, 15666.0, 183570.0, 802181.0, 25431.0, 6021.0, 2922.0, 1219.0, 602.0, 448.0, 231.0, 175.0, 124.0, 78.0, 43.0, 45.0, 36.0, 25.0, 16.0, 6.0, 13.0, 12.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.621246337890625e-05, -1.559220254421234e-05, -1.4971941709518433e-05, -1.4351680874824524e-05, -1.3731420040130615e-05, -1.3111159205436707e-05, -1.2490898370742798e-05, -1.187063753604889e-05, -1.125037670135498e-05, -1.0630115866661072e-05, -1.0009855031967163e-05, -9.389594197273254e-06, -8.769333362579346e-06, -8.149072527885437e-06, -7.528811693191528e-06, -6.90855085849762e-06, -6.288290023803711e-06, -5.668029189109802e-06, -5.0477683544158936e-06, -4.427507519721985e-06, -3.807246685028076e-06, -3.1869858503341675e-06, -2.566725015640259e-06, -1.94646418094635e-06, -1.3262033462524414e-06, -7.059425115585327e-07, -8.568167686462402e-08, 5.345791578292847e-07, 1.1548399925231934e-06, 1.775100827217102e-06, 2.3953616619110107e-06, 3.0156224966049194e-06, 3.635883331298828e-06, 4.256144165992737e-06, 4.8764050006866455e-06, 5.496665835380554e-06, 6.116926670074463e-06, 6.737187504768372e-06, 7.35744833946228e-06, 7.977709174156189e-06, 8.597970008850098e-06, 9.218230843544006e-06, 9.838491678237915e-06, 1.0458752512931824e-05, 1.1079013347625732e-05, 1.1699274182319641e-05, 1.231953501701355e-05, 1.2939795851707458e-05, 1.3560056686401367e-05, 1.4180317521095276e-05, 1.4800578355789185e-05, 1.5420839190483093e-05, 1.6041100025177002e-05, 1.666136085987091e-05, 1.728162169456482e-05, 1.7901882529258728e-05, 1.8522143363952637e-05, 1.9142404198646545e-05, 1.9762665033340454e-05, 2.0382925868034363e-05, 2.100318670272827e-05, 2.162344753742218e-05, 2.224370837211609e-05, 2.2863969206809998e-05, 2.3484230041503906e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 9.0, 22.0, 22.0, 28.0, 54.0, 87.0, 160.0, 167.0, 133.0, 103.0, 52.0, 34.0, 23.0, 15.0, 13.0, 5.0, 5.0, 3.0, 1.0, 4.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.47713851928711e-06, -9.074807167053223e-06, -8.672475814819336e-06, -8.27014446258545e-06, -7.867813110351562e-06, -7.465481758117676e-06, -7.063150405883789e-06, -6.660819053649902e-06, -6.258487701416016e-06, -5.856156349182129e-06, -5.453824996948242e-06, -5.0514936447143555e-06, -4.649162292480469e-06, -4.246830940246582e-06, -3.844499588012695e-06, -3.4421682357788086e-06, -3.039836883544922e-06, -2.637505531311035e-06, -2.2351741790771484e-06, -1.8328428268432617e-06, -1.430511474609375e-06, -1.0281801223754883e-06, -6.258487701416016e-07, -2.2351741790771484e-07, 1.7881393432617188e-07, 5.811452865600586e-07, 9.834766387939453e-07, 1.385807991027832e-06, 1.7881393432617188e-06, 2.1904706954956055e-06, 2.592802047729492e-06, 2.995133399963379e-06, 3.3974647521972656e-06, 3.7997961044311523e-06, 4.202127456665039e-06, 4.604458808898926e-06, 5.0067901611328125e-06, 5.409121513366699e-06, 5.811452865600586e-06, 6.213784217834473e-06, 6.616115570068359e-06, 7.018446922302246e-06, 7.420778274536133e-06, 7.82310962677002e-06, 8.225440979003906e-06, 8.627772331237793e-06, 9.03010368347168e-06, 9.432435035705566e-06, 9.834766387939453e-06, 1.023709774017334e-05, 1.0639429092407227e-05, 1.1041760444641113e-05, 1.1444091796875e-05, 1.1846423149108887e-05, 1.2248754501342773e-05, 1.265108585357666e-05, 1.3053417205810547e-05, 1.3455748558044434e-05, 1.385807991027832e-05, 1.4260411262512207e-05, 1.4662742614746094e-05, 1.506507396697998e-05, 1.5467405319213867e-05, 1.5869736671447754e-05, 1.627206802368164e-05]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 19.0, 32.0, 63.0, 101.0, 187.0, 206.0, 135.0, 69.0, 50.0, 25.0, 23.0, 13.0, 15.0, 8.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001914964959723875, -0.0001832297712098807, -0.00017496306099928916, -0.00016669633623678237, -0.00015842962602619082, -0.00015016290126368403, -0.00014189619105309248, -0.0001336294662905857, -0.00012536274152807891, -0.00011709602404152974, -0.00010882930655498058, -0.00010056258179247379, -9.229587158188224e-05, -8.402914681937546e-05, -7.576242933282629e-05, -6.749571184627712e-05, -5.922900163568556e-05, -5.0962284149136394e-05, -4.2695566662587225e-05, -3.442884553805925e-05, -2.616212805151008e-05, -1.7895410564960912e-05, -9.628689440432936e-06, -1.3619719538837671e-06, 6.904745532665402e-06, 1.5171463928709272e-05, 2.3438182324753143e-05, 3.1704901630291715e-05, 3.9971619116840884e-05, 4.823833660339005e-05, 5.650505772791803e-05, 6.47717752144672e-05, 7.303847814910114e-05, 8.130519563565031e-05, 8.957191312219948e-05, 9.783863788470626e-05, 0.00010610534809529781, 0.0001143720728578046, 0.00012263879762031138, 0.00013090550783090293, 0.0001391722180414945, 0.00014743894280400127, 0.00015570565301459283, 0.0001639723777770996, 0.00017223908798769116, 0.00018050581275019795, 0.00018877253751270473, 0.00019703924772329628, 0.00020530597248580307, 0.00021357269724830985, 0.0002218394074589014, 0.0002301061322214082, 0.00023837284243199974, 0.0002466395671945065, 0.0002549062774050981, 0.0002631730167195201, 0.00027143972693011165, 0.0002797064371407032, 0.0002879731764551252, 0.00029623988666571677, 0.0003045065968763083, 0.0003127733070868999, 0.0003210400464013219, 0.00032930675661191344, 0.000337573466822505]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 7.0, 5.0, 14.0, 9.0, 24.0, 16.0, 28.0, 36.0, 36.0, 41.0, 52.0, 67.0, 73.0, 95.0, 83.0, 82.0, 55.0, 48.0, 48.0, 46.0, 27.0, 26.0, 25.0, 17.0, 9.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001240372657775879, -0.00012032128870487213, -0.00011660531163215637, -0.00011288933455944061, -0.00010917335748672485, -0.0001054573804140091, -0.00010174140334129333, -9.802542626857758e-05, -9.430944919586182e-05, -9.059347212314606e-05, -8.68774950504303e-05, -8.316151797771454e-05, -7.944554090499878e-05, -7.572956383228302e-05, -7.201358675956726e-05, -6.82976096868515e-05, -6.458163261413574e-05, -6.086565554141998e-05, -5.7149678468704224e-05, -5.3433701395988464e-05, -4.9717724323272705e-05, -4.6001747250556946e-05, -4.2285770177841187e-05, -3.856979310512543e-05, -3.485381603240967e-05, -3.113783895969391e-05, -2.742186188697815e-05, -2.370588481426239e-05, -1.998990774154663e-05, -1.627393066883087e-05, -1.2557953596115112e-05, -8.841976523399353e-06, -5.125999450683594e-06, -1.4100223779678345e-06, 2.305954694747925e-06, 6.021931767463684e-06, 9.737908840179443e-06, 1.3453885912895203e-05, 1.7169862985610962e-05, 2.088584005832672e-05, 2.460181713104248e-05, 2.831779420375824e-05, 3.2033771276474e-05, 3.574974834918976e-05, 3.946572542190552e-05, 4.318170249462128e-05, 4.6897679567337036e-05, 5.0613656640052795e-05, 5.4329633712768555e-05, 5.8045610785484314e-05, 6.176158785820007e-05, 6.547756493091583e-05, 6.919354200363159e-05, 7.290951907634735e-05, 7.662549614906311e-05, 8.034147322177887e-05, 8.405745029449463e-05, 8.777342736721039e-05, 9.148940443992615e-05, 9.52053815126419e-05, 9.892135858535767e-05, 0.00010263733565807343, 0.00010635331273078918, 0.00011006928980350494, 0.0001137852668762207]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 8.0, 11.0, 13.0, 21.0, 20.0, 40.0, 54.0, 71.0, 233.0, 258.0, 81.0, 57.0, 35.0, 26.0, 19.0, 17.0, 15.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.504753112792969e-05, -3.391783684492111e-05, -3.278814256191254e-05, -3.165844827890396e-05, -3.0528753995895386e-05, -2.939905971288681e-05, -2.8269365429878235e-05, -2.713967114686966e-05, -2.6009976863861084e-05, -2.488028258085251e-05, -2.3750588297843933e-05, -2.2620894014835358e-05, -2.1491199731826782e-05, -2.0361505448818207e-05, -1.923181116580963e-05, -1.8102116882801056e-05, -1.697242259979248e-05, -1.5842728316783905e-05, -1.471303403377533e-05, -1.3583339750766754e-05, -1.2453645467758179e-05, -1.1323951184749603e-05, -1.0194256901741028e-05, -9.064562618732452e-06, -7.934868335723877e-06, -6.8051740527153015e-06, -5.675479769706726e-06, -4.545785486698151e-06, -3.416091203689575e-06, -2.2863969206809998e-06, -1.1567026376724243e-06, -2.7008354663848877e-08, 1.1026859283447266e-06, 2.232380211353302e-06, 3.3620744943618774e-06, 4.491768777370453e-06, 5.621463060379028e-06, 6.751157343387604e-06, 7.88085162639618e-06, 9.010545909404755e-06, 1.014024019241333e-05, 1.1269934475421906e-05, 1.2399628758430481e-05, 1.3529323041439056e-05, 1.4659017324447632e-05, 1.5788711607456207e-05, 1.6918405890464783e-05, 1.8048100173473358e-05, 1.9177794456481934e-05, 2.030748873949051e-05, 2.1437183022499084e-05, 2.256687730550766e-05, 2.3696571588516235e-05, 2.482626587152481e-05, 2.5955960154533386e-05, 2.708565443754196e-05, 2.8215348720550537e-05, 2.9345043003559113e-05, 3.0474737286567688e-05, 3.1604431569576263e-05, 3.273412585258484e-05, 3.3863820135593414e-05, 3.499351441860199e-05, 3.6123208701610565e-05, 3.725290298461914e-05]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 11.0, 19.0, 34.0, 41.0, 64.0, 124.0, 217.0, 515.0, 1240.0, 4259.0, 35477.0, 8319879.0, 21401.0, 3375.0, 1001.0, 430.0, 183.0, 111.0, 74.0, 32.0, 20.0, 17.0, 16.0, 6.0, 8.0, 9.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.122166036628187e-05, -7.845953950891271e-05, -7.569741137558594e-05, -7.293529051821679e-05, -7.017316966084763e-05, -6.741104880347848e-05, -6.464892067015171e-05, -6.188679981278256e-05, -5.91246789554134e-05, -5.636255446006544e-05, -5.3600433602696285e-05, -5.083830910734832e-05, -4.807618824997917e-05, -4.5314063754631206e-05, -4.2551939259283245e-05, -3.978981840191409e-05, -3.702769390656613e-05, -3.4265569411218166e-05, -3.150344855384901e-05, -2.874132405850105e-05, -2.5979203201131895e-05, -2.3217078705783933e-05, -2.0454956029425375e-05, -1.7692833353066817e-05, -1.4930710676708259e-05, -1.21685880003497e-05, -9.406465323991142e-06, -6.644341738137882e-06, -3.882219061779324e-06, -1.1200963854207657e-06, 1.6420272004324943e-06, 4.4041498767910525e-06, 7.166272553149611e-06, 9.928395229508169e-06, 1.2690517905866727e-05, 1.545264240121469e-05, 1.8214763258583844e-05, 2.0976887753931805e-05, 2.3739010430290364e-05, 2.6501133106648922e-05, 2.926325578300748e-05, 3.202537845936604e-05, 3.4787502954714e-05, 3.7549623812083155e-05, 4.031174830743112e-05, 4.307386916480027e-05, 4.583599366014823e-05, 4.859811451751739e-05, 5.136023901286535e-05, 5.412236350821331e-05, 5.6884484365582466e-05, 5.964660886093043e-05, 6.240873335627839e-05, 6.517085421364754e-05, 6.79329750710167e-05, 7.069509592838585e-05, 7.345722406171262e-05, 7.621934491908178e-05, 7.898147305240855e-05, 8.17435939097777e-05, 8.450571476714686e-05, 8.726783562451601e-05, 9.002996375784278e-05, 9.279208461521193e-05, 9.555420547258109e-05]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 18.0, 28.0, 4.0, 4.0, 9.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.00020167362526990473, -0.00019640142272692174, -0.00019112923473585397, -0.00018585703219287097, -0.0001805848442018032, -0.0001753126416588202, -0.00017004043911583722, -0.00016476825112476945, -0.00015949606313370168, -0.0001542238605907187, -0.00014895167259965092, -0.00014367947005666792, -0.00013840728206560016, -0.00013313507952261716, -0.00012786287697963417, -0.0001225906889885664, -0.0001173184864455834, -0.00011204629117855802, -0.00010677409591153264, -0.00010150189336854964, -9.622970537748188e-05, -9.095750283449888e-05, -8.56853075674735e-05, -8.041311230044812e-05, -7.514091703342274e-05, -6.986872176639736e-05, -6.459652649937198e-05, -5.932432759436779e-05, -5.4052132327342406e-05, -4.8779937060317025e-05, -4.3507738155312836e-05, -3.8235542888287455e-05, -3.29633621731773e-05, -2.769116690615192e-05, -2.2418969820137136e-05, -1.714677273412235e-05, -1.187457746709697e-05, -6.602382200071588e-06, -1.3301832950673997e-06, 3.942011971957982e-06, 9.214207238983363e-06, 1.4486403415503446e-05, 1.975859959202353e-05, 2.5030796678038314e-05, 3.0302991945063695e-05, 3.557518721208908e-05, 4.0847386117093265e-05, 4.6119581384118646e-05, 5.139177665114403e-05, 5.666397191816941e-05, 6.193616718519479e-05, 6.720836972817779e-05, 7.248055771924555e-05, 7.775276026222855e-05, 8.302495552925393e-05, 8.829715079627931e-05, 9.356934606330469e-05, 9.884154133033007e-05, 0.00010411373659735546, 0.00010938593186438084, 0.00011465813440736383, 0.0001199303223984316, 0.0001252025249414146, 0.00013047471293248236, 0.00013574691547546536]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 10.0, 12.0, 8.0, 19.0, 19.0, 26.0, 49.0, 51.0, 50.0, 95.0, 78.0, 91.0, 92.0, 73.0, 64.0, 49.0, 40.0, 33.0, 34.0, 19.0, 21.0, 15.0, 10.0, 5.0, 8.0, 3.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9981136322021484e-05, -2.9102899134159088e-05, -2.8224661946296692e-05, -2.7346424758434296e-05, -2.64681875705719e-05, -2.5589950382709503e-05, -2.4711713194847107e-05, -2.383347600698471e-05, -2.2955238819122314e-05, -2.2077001631259918e-05, -2.1198764443397522e-05, -2.0320527255535126e-05, -1.944229006767273e-05, -1.8564052879810333e-05, -1.7685815691947937e-05, -1.680757850408554e-05, -1.5929341316223145e-05, -1.5051104128360748e-05, -1.4172866940498352e-05, -1.3294629752635956e-05, -1.241639256477356e-05, -1.1538155376911163e-05, -1.0659918189048767e-05, -9.781681001186371e-06, -8.903443813323975e-06, -8.025206625461578e-06, -7.146969437599182e-06, -6.268732249736786e-06, -5.39049506187439e-06, -4.512257874011993e-06, -3.634020686149597e-06, -2.755783498287201e-06, -1.8775463104248047e-06, -9.993091225624084e-07, -1.210719347000122e-07, 7.57165253162384e-07, 1.6354024410247803e-06, 2.5136396288871765e-06, 3.3918768167495728e-06, 4.270114004611969e-06, 5.148351192474365e-06, 6.0265883803367615e-06, 6.904825568199158e-06, 7.783062756061554e-06, 8.66129994392395e-06, 9.539537131786346e-06, 1.0417774319648743e-05, 1.1296011507511139e-05, 1.2174248695373535e-05, 1.3052485883235931e-05, 1.3930723071098328e-05, 1.4808960258960724e-05, 1.568719744682312e-05, 1.6565434634685516e-05, 1.7443671822547913e-05, 1.832190901041031e-05, 1.9200146198272705e-05, 2.00783833861351e-05, 2.0956620573997498e-05, 2.1834857761859894e-05, 2.271309494972229e-05, 2.3591332137584686e-05, 2.4469569325447083e-05, 2.534780651330948e-05, 2.6226043701171875e-05]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 9.0, 10.0, 16.0, 23.0, 35.0, 88.0, 108.0, 213.0, 497.0, 1358.0, 5063.0, 25005.0, 372508.0, 103321.0, 11451.0, 2796.0, 967.0, 408.0, 159.0, 93.0, 46.0, 31.0, 22.0, 11.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021767616271972656, -0.00020609423518180847, -0.00019451230764389038, -0.0001829303801059723, -0.0001713484525680542, -0.0001597665250301361, -0.00014818459749221802, -0.00013660266995429993, -0.00012502074241638184, -0.00011343881487846375, -0.00010185688734054565, -9.027495980262756e-05, -7.869303226470947e-05, -6.711110472679138e-05, -5.552917718887329e-05, -4.39472496509552e-05, -3.236532211303711e-05, -2.078339457511902e-05, -9.201467037200928e-06, 2.380460500717163e-06, 1.3962388038635254e-05, 2.5544315576553345e-05, 3.7126243114471436e-05, 4.8708170652389526e-05, 6.029009819030762e-05, 7.187202572822571e-05, 8.34539532661438e-05, 9.503588080406189e-05, 0.00010661780834197998, 0.00011819973587989807, 0.00012978166341781616, 0.00014136359095573425, 0.00015294551849365234, 0.00016452744603157043, 0.00017610937356948853, 0.00018769130110740662, 0.0001992732286453247, 0.0002108551561832428, 0.0002224370837211609, 0.00023401901125907898, 0.00024560093879699707, 0.00025718286633491516, 0.00026876479387283325, 0.00028034672141075134, 0.00029192864894866943, 0.0003035105764865875, 0.0003150925040245056, 0.0003266744315624237, 0.0003382563591003418, 0.0003498382866382599, 0.000361420214176178, 0.00037300214171409607, 0.00038458406925201416, 0.00039616599678993225, 0.00040774792432785034, 0.00041932985186576843, 0.0004309117794036865, 0.0004424937069416046, 0.0004540756344795227, 0.0004656575620174408, 0.0004772394895553589, 0.000488821417093277, 0.0005004033446311951, 0.0005119852721691132, 0.0005235671997070312]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 15.0, 18.0, 31.0, 42.0, 56.0, 61.0, 94.0, 86.0, 86.0, 109.0, 82.0, 67.0, 75.0, 37.0, 34.0, 21.0, 14.0, 25.0, 12.0, 4.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2172927856445312e-05, -2.1198764443397522e-05, -2.022460103034973e-05, -1.925043761730194e-05, -1.827627420425415e-05, -1.730211079120636e-05, -1.632794737815857e-05, -1.535378396511078e-05, -1.4379620552062988e-05, -1.3405457139015198e-05, -1.2431293725967407e-05, -1.1457130312919617e-05, -1.0482966899871826e-05, -9.508803486824036e-06, -8.534640073776245e-06, -7.560476660728455e-06, -6.586313247680664e-06, -5.6121498346328735e-06, -4.637986421585083e-06, -3.6638230085372925e-06, -2.689659595489502e-06, -1.7154961824417114e-06, -7.413327693939209e-07, 2.3283064365386963e-07, 1.2069940567016602e-06, 2.1811574697494507e-06, 3.155320882797241e-06, 4.129484295845032e-06, 5.103647708892822e-06, 6.077811121940613e-06, 7.051974534988403e-06, 8.026137948036194e-06, 9.000301361083984e-06, 9.974464774131775e-06, 1.0948628187179565e-05, 1.1922791600227356e-05, 1.2896955013275146e-05, 1.3871118426322937e-05, 1.4845281839370728e-05, 1.5819445252418518e-05, 1.679360866546631e-05, 1.77677720785141e-05, 1.874193549156189e-05, 1.971609890460968e-05, 2.069026231765747e-05, 2.166442573070526e-05, 2.2638589143753052e-05, 2.3612752556800842e-05, 2.4586915969848633e-05, 2.5561079382896423e-05, 2.6535242795944214e-05, 2.7509406208992004e-05, 2.8483569622039795e-05, 2.9457733035087585e-05, 3.0431896448135376e-05, 3.1406059861183167e-05, 3.238022327423096e-05, 3.335438668727875e-05, 3.432855010032654e-05, 3.530271351337433e-05, 3.627687692642212e-05, 3.725104033946991e-05, 3.82252037525177e-05, 3.919936716556549e-05, 4.017353057861328e-05]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 6.0, 14.0, 7.0, 14.0, 13.0, 14.0, 24.0, 38.0, 36.0, 36.0, 41.0, 28.0, 32.0, 32.0, 28.0, 21.0, 12.0, 15.0, 9.0, 8.0, 6.0, 6.0, 9.0, 2.0, 6.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5904526410158724e-05, -2.4931645384640433e-05, -2.3958764359122142e-05, -2.298588333360385e-05, -2.201300230808556e-05, -2.1040119463577867e-05, -2.0067238438059576e-05, -1.9094357412541285e-05, -1.8121476387022994e-05, -1.7148595361504704e-05, -1.6175714335986413e-05, -1.520283240097342e-05, -1.422995137545513e-05, -1.325707034993684e-05, -1.2284188414923847e-05, -1.1311307389405556e-05, -1.0338426363887265e-05, -9.365545338368975e-06, -8.392664312850684e-06, -7.4197823778376915e-06, -6.446901352319401e-06, -5.47402032680111e-06, -4.5011388465354685e-06, -3.528257366269827e-06, -2.555376340751536e-06, -1.58249508785957e-06, -6.096138349676039e-07, 3.6326741792436223e-07, 1.3361486708163284e-06, 2.309029696334619e-06, 3.2819111766002607e-06, 4.254792656865902e-06, 5.227677320363e-06, 6.200558345881291e-06, 7.173439826146932e-06, 8.146321306412574e-06, 9.119202331930865e-06, 1.0092083357449155e-05, 1.1064965292462148e-05, 1.2037846317980438e-05, 1.301072734349873e-05, 1.398360836901702e-05, 1.495648939453531e-05, 1.59293704200536e-05, 1.6902253264561296e-05, 1.7875132471090183e-05, 1.8848015315597877e-05, 1.9820896341116168e-05, 2.0793777366634458e-05, 2.176665839215275e-05, 2.273953941767104e-05, 2.371242044318933e-05, 2.468530146870762e-05, 2.5658184313215315e-05, 2.6631065338733606e-05, 2.7603946364251897e-05, 2.8576827389770187e-05, 2.9549708415288478e-05, 3.052259125979617e-05, 3.149547046632506e-05, 3.2468353310832754e-05, 3.344123251736164e-05, 3.4414115361869335e-05, 3.538699820637703e-05, 3.6359877412905917e-05]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 8.0, 9.0, 4.0, 6.0, 14.0, 23.0, 34.0, 32.0, 44.0, 44.0, 48.0, 45.0, 30.0, 17.0, 12.0, 21.0, 9.0, 5.0, 11.0, 5.0, 7.0, 4.0, 4.0, 4.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6803226470947266e-05, -5.496758967638016e-05, -5.313195288181305e-05, -5.129631608724594e-05, -4.946067929267883e-05, -4.7625042498111725e-05, -4.578940570354462e-05, -4.395376890897751e-05, -4.21181321144104e-05, -4.028249531984329e-05, -3.8446858525276184e-05, -3.6611221730709076e-05, -3.477558493614197e-05, -3.293994814157486e-05, -3.110431134700775e-05, -2.9268674552440643e-05, -2.7433037757873535e-05, -2.5597400963306427e-05, -2.376176416873932e-05, -2.192612737417221e-05, -2.0090490579605103e-05, -1.8254853785037994e-05, -1.6419216990470886e-05, -1.4583580195903778e-05, -1.274794340133667e-05, -1.0912306606769562e-05, -9.076669812202454e-06, -7.2410330176353455e-06, -5.405396223068237e-06, -3.569759428501129e-06, -1.734122633934021e-06, 1.0151416063308716e-07, 1.9371509552001953e-06, 3.7727877497673035e-06, 5.608424544334412e-06, 7.44406133890152e-06, 9.279698133468628e-06, 1.1115334928035736e-05, 1.2950971722602844e-05, 1.4786608517169952e-05, 1.662224531173706e-05, 1.845788210630417e-05, 2.0293518900871277e-05, 2.2129155695438385e-05, 2.3964792490005493e-05, 2.58004292845726e-05, 2.763606607913971e-05, 2.9471702873706818e-05, 3.1307339668273926e-05, 3.3142976462841034e-05, 3.497861325740814e-05, 3.681425005197525e-05, 3.864988684654236e-05, 4.0485523641109467e-05, 4.2321160435676575e-05, 4.415679723024368e-05, 4.599243402481079e-05, 4.78280708193779e-05, 4.966370761394501e-05, 5.1499344408512115e-05, 5.3334981203079224e-05, 5.517061799764633e-05, 5.700625479221344e-05, 5.884189158678055e-05, 6.0677528381347656e-05]}, "eval/loss": 18.359586715698242, "eval/bleu": 0.0, "eval/runtime": 3668.9753, "eval/samples_per_second": 4.023, "eval/steps_per_second": 1.006} \ No newline at end of file