diff --git "a/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" "b/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" --- "a/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" +++ "b/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 2.7605, "train/learning_rate": 0.0002982, "train/epoch": 4.5, "train/global_step": 500, "_runtime": 11634, "_timestamp": 1648498536, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 46.0, 141.0, 262.0, 310.0, 181.0, 51.0, 15.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.353339195251465, -9.54570484161377, -8.73807144165039, -7.930437088012695, -7.122803688049316, -6.315169334411621, -5.507535457611084, -4.699901580810547, -3.8922677040100098, -3.0846338272094727, -2.2769999504089355, -1.4693658351898193, -0.6617319583892822, 0.14590215682983398, 0.9535360336303711, 1.7611699104309082, 2.5688037872314453, 3.3764376640319824, 4.1840715408325195, 4.991705894470215, 5.799339294433594, 6.606973648071289, 7.414607524871826, 8.222241401672363, 9.029874801635742, 9.837509155273438, 10.645142555236816, 11.452776908874512, 12.26041030883789, 13.068044662475586, 13.875679016113281, 14.68331241607666, 15.490945816040039, 16.298580169677734, 17.10621452331543, 17.913846969604492, 18.721481323242188, 19.529115676879883, 20.336750030517578, 21.14438247680664, 21.952016830444336, 22.75965118408203, 23.567285537719727, 24.37491798400879, 25.182552337646484, 25.99018669128418, 26.797821044921875, 27.605453491210938, 28.413089752197266, 29.22072410583496, 30.028358459472656, 30.83599090576172, 31.643625259399414, 32.45125961303711, 33.25889205932617, 34.0665283203125, 34.87416076660156, 35.681793212890625, 36.48942947387695, 37.297061920166016, 38.104698181152344, 38.912330627441406, 39.71996307373047, 40.5275993347168, 41.33523178100586]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 9.0, 17.0, 13.0, 27.0, 37.0, 41.0, 35.0, 49.0, 47.0, 62.0, 71.0, 54.0, 72.0, 58.0, 62.0, 67.0, 56.0, 44.0, 32.0, 36.0, 29.0, 24.0, 18.0, 7.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.729734420776367, -12.391545295715332, -12.053356170654297, -11.715167045593262, -11.376977920532227, -11.038788795471191, -10.700599670410156, -10.362410545349121, -10.024221420288086, -9.68603229522705, -9.347843170166016, -9.00965404510498, -8.671464920043945, -8.33327579498291, -7.995086669921875, -7.65689754486084, -7.318708419799805, -6.9805192947387695, -6.642330169677734, -6.304141044616699, -5.965951919555664, -5.627762794494629, -5.289573669433594, -4.951384544372559, -4.613195419311523, -4.275006294250488, -3.936817169189453, -3.598628044128418, -3.260438919067383, -2.9222497940063477, -2.5840606689453125, -2.2458715438842773, -1.9076824188232422, -1.569493293762207, -1.2313041687011719, -0.8931150436401367, -0.5549259185791016, -0.2167367935180664, 0.12145233154296875, 0.4596414566040039, 0.7978305816650391, 1.1360197067260742, 1.4742088317871094, 1.8123979568481445, 2.1505870819091797, 2.488776206970215, 2.82696533203125, 3.165154457092285, 3.5033435821533203, 3.8415327072143555, 4.179721832275391, 4.517910957336426, 4.856100082397461, 5.194289207458496, 5.532478332519531, 5.870667457580566, 6.208856582641602, 6.547045707702637, 6.885234832763672, 7.223423957824707, 7.561613082885742, 7.899802207946777, 8.237991333007812, 8.576180458068848, 8.914369583129883]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 11.0, 10.0, 23.0, 31.0, 59.0, 86.0, 145.0, 255.0, 464.0, 870.0, 1651.0, 3609.0, 8751.0, 23231.0, 67072.0, 209532.0, 671459.0, 1526038.0, 1095098.0, 397874.0, 123869.0, 38329.0, 14171.0, 6060.0, 2767.0, 1266.0, 694.0, 349.0, 214.0, 131.0, 59.0, 27.0, 39.0, 17.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.59375, -12.2208251953125, -11.847900390625, -11.4749755859375, -11.10205078125, -10.7291259765625, -10.356201171875, -9.9832763671875, -9.6103515625, -9.2374267578125, -8.864501953125, -8.4915771484375, -8.11865234375, -7.7457275390625, -7.372802734375, -6.9998779296875, -6.626953125, -6.2540283203125, -5.881103515625, -5.5081787109375, -5.13525390625, -4.7623291015625, -4.389404296875, -4.0164794921875, -3.6435546875, -3.2706298828125, -2.897705078125, -2.5247802734375, -2.15185546875, -1.7789306640625, -1.406005859375, -1.0330810546875, -0.66015625, -0.2872314453125, 0.085693359375, 0.4586181640625, 0.83154296875, 1.2044677734375, 1.577392578125, 1.9503173828125, 2.3232421875, 2.6961669921875, 3.069091796875, 3.4420166015625, 3.81494140625, 4.1878662109375, 4.560791015625, 4.9337158203125, 5.306640625, 5.6795654296875, 6.052490234375, 6.4254150390625, 6.79833984375, 7.1712646484375, 7.544189453125, 7.9171142578125, 8.2900390625, 8.6629638671875, 9.035888671875, 9.4088134765625, 9.78173828125, 10.1546630859375, 10.527587890625, 10.9005126953125, 11.2734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 5.0, 10.0, 14.0, 12.0, 18.0, 15.0, 27.0, 26.0, 38.0, 43.0, 54.0, 57.0, 53.0, 68.0, 63.0, 54.0, 74.0, 71.0, 49.0, 46.0, 45.0, 33.0, 29.0, 30.0, 19.0, 11.0, 9.0, 10.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-19.21875, -18.7213134765625, -18.223876953125, -17.7264404296875, -17.22900390625, -16.7315673828125, -16.234130859375, -15.7366943359375, -15.2392578125, -14.7418212890625, -14.244384765625, -13.7469482421875, -13.24951171875, -12.7520751953125, -12.254638671875, -11.7572021484375, -11.259765625, -10.7623291015625, -10.264892578125, -9.7674560546875, -9.27001953125, -8.7725830078125, -8.275146484375, -7.7777099609375, -7.2802734375, -6.7828369140625, -6.285400390625, -5.7879638671875, -5.29052734375, -4.7930908203125, -4.295654296875, -3.7982177734375, -3.30078125, -2.8033447265625, -2.305908203125, -1.8084716796875, -1.31103515625, -0.8135986328125, -0.316162109375, 0.1812744140625, 0.6787109375, 1.1761474609375, 1.673583984375, 2.1710205078125, 2.66845703125, 3.1658935546875, 3.663330078125, 4.1607666015625, 4.658203125, 5.1556396484375, 5.653076171875, 6.1505126953125, 6.64794921875, 7.1453857421875, 7.642822265625, 8.1402587890625, 8.6376953125, 9.1351318359375, 9.632568359375, 10.1300048828125, 10.62744140625, 11.1248779296875, 11.622314453125, 12.1197509765625, 12.6171875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 7.0, 15.0, 30.0, 64.0, 137.0, 283.0, 1326.0, 4189584.0, 2200.0, 345.0, 154.0, 57.0, 35.0, 16.0, 11.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-284.25, -276.029296875, -267.80859375, -259.587890625, -251.3671875, -243.146484375, -234.92578125, -226.705078125, -218.484375, -210.263671875, -202.04296875, -193.822265625, -185.6015625, -177.380859375, -169.16015625, -160.939453125, -152.71875, -144.498046875, -136.27734375, -128.056640625, -119.8359375, -111.615234375, -103.39453125, -95.173828125, -86.953125, -78.732421875, -70.51171875, -62.291015625, -54.0703125, -45.849609375, -37.62890625, -29.408203125, -21.1875, -12.966796875, -4.74609375, 3.474609375, 11.6953125, 19.916015625, 28.13671875, 36.357421875, 44.578125, 52.798828125, 61.01953125, 69.240234375, 77.4609375, 85.681640625, 93.90234375, 102.123046875, 110.34375, 118.564453125, 126.78515625, 135.005859375, 143.2265625, 151.447265625, 159.66796875, 167.888671875, 176.109375, 184.330078125, 192.55078125, 200.771484375, 208.9921875, 217.212890625, 225.43359375, 233.654296875, 241.875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 11.0, 27.0, 41.0, 97.0, 167.0, 289.0, 599.0, 1216.0, 800.0, 377.0, 204.0, 93.0, 59.0, 24.0, 28.0, 8.0, 9.0, 7.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5, -10.20556640625, -9.9111328125, -9.61669921875, -9.322265625, -9.02783203125, -8.7333984375, -8.43896484375, -8.14453125, -7.85009765625, -7.5556640625, -7.26123046875, -6.966796875, -6.67236328125, -6.3779296875, -6.08349609375, -5.7890625, -5.49462890625, -5.2001953125, -4.90576171875, -4.611328125, -4.31689453125, -4.0224609375, -3.72802734375, -3.43359375, -3.13916015625, -2.8447265625, -2.55029296875, -2.255859375, -1.96142578125, -1.6669921875, -1.37255859375, -1.078125, -0.78369140625, -0.4892578125, -0.19482421875, 0.099609375, 0.39404296875, 0.6884765625, 0.98291015625, 1.27734375, 1.57177734375, 1.8662109375, 2.16064453125, 2.455078125, 2.74951171875, 3.0439453125, 3.33837890625, 3.6328125, 3.92724609375, 4.2216796875, 4.51611328125, 4.810546875, 5.10498046875, 5.3994140625, 5.69384765625, 5.98828125, 6.28271484375, 6.5771484375, 6.87158203125, 7.166015625, 7.46044921875, 7.7548828125, 8.04931640625, 8.34375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 31.0, 56.0, 98.0, 167.0, 179.0, 174.0, 138.0, 75.0, 39.0, 24.0, 13.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.14811325073242, -54.99135208129883, -53.83458709716797, -52.677825927734375, -51.52106475830078, -50.36430358886719, -49.20753860473633, -48.050777435302734, -46.89401626586914, -45.73725509643555, -44.58049011230469, -43.423728942871094, -42.2669677734375, -41.110206604003906, -39.95344161987305, -38.79668045043945, -37.639915466308594, -36.483154296875, -35.32638931274414, -34.16962814331055, -33.01286697387695, -31.856103897094727, -30.6993408203125, -29.542579650878906, -28.385818481445312, -27.229055404663086, -26.072294235229492, -24.915531158447266, -23.758769989013672, -22.602006912231445, -21.44524383544922, -20.288482666015625, -19.131723403930664, -17.974960327148438, -16.818199157714844, -15.661436080932617, -14.504674911499023, -13.347911834716797, -12.191149711608887, -11.034387588500977, -9.877625465393066, -8.720863342285156, -7.564101219177246, -6.407338619232178, -5.250576496124268, -4.093814373016357, -2.937051773071289, -1.780289649963379, -0.6235275268554688, 0.533234715461731, 1.6899969577789307, 2.84675931930542, 4.00352144241333, 5.16028356552124, 6.317046165466309, 7.473808288574219, 8.630570411682129, 9.787332534790039, 10.94409465789795, 12.10085678100586, 13.257619857788086, 14.41438102722168, 15.571144104003906, 16.7279052734375, 17.884668350219727]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 7.0, 4.0, 8.0, 9.0, 12.0, 17.0, 15.0, 24.0, 19.0, 17.0, 26.0, 41.0, 30.0, 33.0, 44.0, 46.0, 39.0, 45.0, 43.0, 51.0, 50.0, 48.0, 46.0, 43.0, 31.0, 46.0, 33.0, 23.0, 29.0, 18.0, 18.0, 21.0, 13.0, 17.0, 7.0, 3.0, 4.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.54446792602539, -13.187993049621582, -12.831517219543457, -12.475042343139648, -12.118566513061523, -11.762091636657715, -11.405616760253906, -11.049140930175781, -10.692666053771973, -10.336191177368164, -9.979715347290039, -9.62324047088623, -9.266765594482422, -8.910289764404297, -8.553814888000488, -8.19734001159668, -7.840864181518555, -7.484388828277588, -7.127913475036621, -6.7714385986328125, -6.414963245391846, -6.058487892150879, -5.70201301574707, -5.3455376625061035, -4.989062309265137, -4.63258695602417, -4.276111602783203, -3.9196367263793945, -3.5631613731384277, -3.206686019897461, -2.8502109050750732, -2.4937357902526855, -2.1372604370117188, -1.7807852029800415, -1.4243099689483643, -1.067834734916687, -0.7113595008850098, -0.3548842668533325, 0.0015909671783447266, 0.3580660820007324, 0.7145414352416992, 1.0710166692733765, 1.4274919033050537, 1.783967137336731, 2.140442371368408, 2.496917724609375, 2.8533928394317627, 3.2098679542541504, 3.566343307495117, 3.922818660736084, 4.279294013977051, 4.635768890380859, 4.992244243621826, 5.348719596862793, 5.705194473266602, 6.061669826507568, 6.418145179748535, 6.774620532989502, 7.131095886230469, 7.487570762634277, 7.844046115875244, 8.200521469116211, 8.55699634552002, 8.913471221923828, 9.269947052001953]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 12.0, 11.0, 12.0, 24.0, 52.0, 91.0, 174.0, 269.0, 548.0, 1168.0, 2605.0, 5575.0, 12250.0, 28852.0, 65689.0, 140087.0, 242642.0, 255985.0, 157769.0, 75481.0, 32811.0, 14332.0, 6407.0, 2938.0, 1362.0, 668.0, 327.0, 152.0, 97.0, 64.0, 43.0, 23.0, 13.0, 9.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.59375, -3.48175048828125, -3.3697509765625, -3.25775146484375, -3.145751953125, -3.03375244140625, -2.9217529296875, -2.80975341796875, -2.69775390625, -2.58575439453125, -2.4737548828125, -2.36175537109375, -2.249755859375, -2.13775634765625, -2.0257568359375, -1.91375732421875, -1.8017578125, -1.68975830078125, -1.5777587890625, -1.46575927734375, -1.353759765625, -1.24176025390625, -1.1297607421875, -1.01776123046875, -0.90576171875, -0.79376220703125, -0.6817626953125, -0.56976318359375, -0.457763671875, -0.34576416015625, -0.2337646484375, -0.12176513671875, -0.009765625, 0.10223388671875, 0.2142333984375, 0.32623291015625, 0.438232421875, 0.55023193359375, 0.6622314453125, 0.77423095703125, 0.88623046875, 0.99822998046875, 1.1102294921875, 1.22222900390625, 1.334228515625, 1.44622802734375, 1.5582275390625, 1.67022705078125, 1.7822265625, 1.89422607421875, 2.0062255859375, 2.11822509765625, 2.230224609375, 2.34222412109375, 2.4542236328125, 2.56622314453125, 2.67822265625, 2.79022216796875, 2.9022216796875, 3.01422119140625, 3.126220703125, 3.23822021484375, 3.3502197265625, 3.46221923828125, 3.57421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 6.0, 11.0, 14.0, 18.0, 18.0, 27.0, 25.0, 41.0, 47.0, 42.0, 47.0, 57.0, 71.0, 70.0, 67.0, 68.0, 61.0, 56.0, 49.0, 43.0, 45.0, 37.0, 19.0, 18.0, 13.0, 11.0, 4.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.1875, -15.8004150390625, -15.413330078125, -15.0262451171875, -14.63916015625, -14.2520751953125, -13.864990234375, -13.4779052734375, -13.0908203125, -12.7037353515625, -12.316650390625, -11.9295654296875, -11.54248046875, -11.1553955078125, -10.768310546875, -10.3812255859375, -9.994140625, -9.6070556640625, -9.219970703125, -8.8328857421875, -8.44580078125, -8.0587158203125, -7.671630859375, -7.2845458984375, -6.8974609375, -6.5103759765625, -6.123291015625, -5.7362060546875, -5.34912109375, -4.9620361328125, -4.574951171875, -4.1878662109375, -3.80078125, -3.4136962890625, -3.026611328125, -2.6395263671875, -2.25244140625, -1.8653564453125, -1.478271484375, -1.0911865234375, -0.7041015625, -0.3170166015625, 0.070068359375, 0.4571533203125, 0.84423828125, 1.2313232421875, 1.618408203125, 2.0054931640625, 2.392578125, 2.7796630859375, 3.166748046875, 3.5538330078125, 3.94091796875, 4.3280029296875, 4.715087890625, 5.1021728515625, 5.4892578125, 5.8763427734375, 6.263427734375, 6.6505126953125, 7.03759765625, 7.4246826171875, 7.811767578125, 8.1988525390625, 8.5859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 4.0, 8.0, 15.0, 8.0, 23.0, 29.0, 40.0, 67.0, 88.0, 134.0, 194.0, 353.0, 582.0, 1011.0, 1984.0, 3765.0, 7474.0, 15301.0, 32067.0, 67112.0, 131391.0, 212449.0, 233093.0, 165674.0, 90506.0, 43640.0, 21081.0, 10115.0, 4842.0, 2410.0, 1324.0, 651.0, 398.0, 237.0, 148.0, 113.0, 74.0, 46.0, 31.0, 27.0, 11.0, 14.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.453125, -2.371917724609375, -2.29071044921875, -2.209503173828125, -2.1282958984375, -2.047088623046875, -1.96588134765625, -1.884674072265625, -1.803466796875, -1.722259521484375, -1.64105224609375, -1.559844970703125, -1.4786376953125, -1.397430419921875, -1.31622314453125, -1.235015869140625, -1.15380859375, -1.072601318359375, -0.99139404296875, -0.910186767578125, -0.8289794921875, -0.747772216796875, -0.66656494140625, -0.585357666015625, -0.504150390625, -0.422943115234375, -0.34173583984375, -0.260528564453125, -0.1793212890625, -0.098114013671875, -0.01690673828125, 0.064300537109375, 0.1455078125, 0.226715087890625, 0.30792236328125, 0.389129638671875, 0.4703369140625, 0.551544189453125, 0.63275146484375, 0.713958740234375, 0.795166015625, 0.876373291015625, 0.95758056640625, 1.038787841796875, 1.1199951171875, 1.201202392578125, 1.28240966796875, 1.363616943359375, 1.44482421875, 1.526031494140625, 1.60723876953125, 1.688446044921875, 1.7696533203125, 1.850860595703125, 1.93206787109375, 2.013275146484375, 2.094482421875, 2.175689697265625, 2.25689697265625, 2.338104248046875, 2.4193115234375, 2.500518798828125, 2.58172607421875, 2.662933349609375, 2.744140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 7.0, 8.0, 10.0, 10.0, 10.0, 17.0, 11.0, 19.0, 20.0, 25.0, 32.0, 30.0, 35.0, 35.0, 29.0, 46.0, 43.0, 43.0, 46.0, 55.0, 43.0, 44.0, 30.0, 40.0, 36.0, 41.0, 35.0, 22.0, 32.0, 15.0, 24.0, 18.0, 13.0, 14.0, 15.0, 11.0, 7.0, 4.0, 7.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.5625, -18.024658203125, -17.48681640625, -16.948974609375, -16.4111328125, -15.873291015625, -15.33544921875, -14.797607421875, -14.259765625, -13.721923828125, -13.18408203125, -12.646240234375, -12.1083984375, -11.570556640625, -11.03271484375, -10.494873046875, -9.95703125, -9.419189453125, -8.88134765625, -8.343505859375, -7.8056640625, -7.267822265625, -6.72998046875, -6.192138671875, -5.654296875, -5.116455078125, -4.57861328125, -4.040771484375, -3.5029296875, -2.965087890625, -2.42724609375, -1.889404296875, -1.3515625, -0.813720703125, -0.27587890625, 0.261962890625, 0.7998046875, 1.337646484375, 1.87548828125, 2.413330078125, 2.951171875, 3.489013671875, 4.02685546875, 4.564697265625, 5.1025390625, 5.640380859375, 6.17822265625, 6.716064453125, 7.25390625, 7.791748046875, 8.32958984375, 8.867431640625, 9.4052734375, 9.943115234375, 10.48095703125, 11.018798828125, 11.556640625, 12.094482421875, 12.63232421875, 13.170166015625, 13.7080078125, 14.245849609375, 14.78369140625, 15.321533203125, 15.859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 7.0, 13.0, 11.0, 17.0, 22.0, 34.0, 53.0, 67.0, 127.0, 163.0, 247.0, 404.0, 753.0, 1309.0, 2668.0, 6157.0, 15167.0, 45457.0, 182234.0, 516300.0, 199541.0, 49065.0, 16026.0, 6469.0, 2847.0, 1369.0, 768.0, 435.0, 294.0, 172.0, 104.0, 69.0, 56.0, 31.0, 24.0, 10.0, 13.0, 8.0, 11.0, 2.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5625, -1.51446533203125, -1.4664306640625, -1.41839599609375, -1.370361328125, -1.32232666015625, -1.2742919921875, -1.22625732421875, -1.17822265625, -1.13018798828125, -1.0821533203125, -1.03411865234375, -0.986083984375, -0.93804931640625, -0.8900146484375, -0.84197998046875, -0.7939453125, -0.74591064453125, -0.6978759765625, -0.64984130859375, -0.601806640625, -0.55377197265625, -0.5057373046875, -0.45770263671875, -0.40966796875, -0.36163330078125, -0.3135986328125, -0.26556396484375, -0.217529296875, -0.16949462890625, -0.1214599609375, -0.07342529296875, -0.025390625, 0.02264404296875, 0.0706787109375, 0.11871337890625, 0.166748046875, 0.21478271484375, 0.2628173828125, 0.31085205078125, 0.35888671875, 0.40692138671875, 0.4549560546875, 0.50299072265625, 0.551025390625, 0.59906005859375, 0.6470947265625, 0.69512939453125, 0.7431640625, 0.79119873046875, 0.8392333984375, 0.88726806640625, 0.935302734375, 0.98333740234375, 1.0313720703125, 1.07940673828125, 1.12744140625, 1.17547607421875, 1.2235107421875, 1.27154541015625, 1.319580078125, 1.36761474609375, 1.4156494140625, 1.46368408203125, 1.51171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 11.0, 4.0, 19.0, 25.0, 22.0, 36.0, 61.0, 67.0, 80.0, 100.0, 132.0, 96.0, 80.0, 56.0, 54.0, 22.0, 16.0, 14.0, 14.0, 13.0, 8.0, 5.0, 6.0, 5.0, 6.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009407997131347656, -0.0009115710854530334, -0.0008823424577713013, -0.0008531138300895691, -0.0008238852024078369, -0.0007946565747261047, -0.0007654279470443726, -0.0007361993193626404, -0.0007069706916809082, -0.000677742063999176, -0.0006485134363174438, -0.0006192848086357117, -0.0005900561809539795, -0.0005608275532722473, -0.0005315989255905151, -0.000502370297908783, -0.0004731416702270508, -0.0004439130425453186, -0.0004146844148635864, -0.00038545578718185425, -0.00035622715950012207, -0.0003269985318183899, -0.0002977699041366577, -0.00026854127645492554, -0.00023931264877319336, -0.00021008402109146118, -0.000180855393409729, -0.00015162676572799683, -0.00012239813804626465, -9.316951036453247e-05, -6.394088268280029e-05, -3.4712255001068115e-05, -5.4836273193359375e-06, 2.374500036239624e-05, 5.297362804412842e-05, 8.22022557258606e-05, 0.00011143088340759277, 0.00014065951108932495, 0.00016988813877105713, 0.0001991167664527893, 0.00022834539413452148, 0.00025757402181625366, 0.00028680264949798584, 0.000316031277179718, 0.0003452599048614502, 0.0003744885325431824, 0.00040371716022491455, 0.00043294578790664673, 0.0004621744155883789, 0.0004914030432701111, 0.0005206316709518433, 0.0005498602986335754, 0.0005790889263153076, 0.0006083175539970398, 0.000637546181678772, 0.0006667748093605042, 0.0006960034370422363, 0.0007252320647239685, 0.0007544606924057007, 0.0007836893200874329, 0.000812917947769165, 0.0008421465754508972, 0.0008713752031326294, 0.0009006038308143616, 0.0009298324584960938]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 2.0, 8.0, 2.0, 8.0, 8.0, 11.0, 17.0, 23.0, 51.0, 86.0, 219.0, 1330.0, 28299.0, 968264.0, 47916.0, 1739.0, 310.0, 100.0, 40.0, 38.0, 16.0, 16.0, 12.0, 12.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.61761474609375, -7.3836669921875, -7.14971923828125, -6.915771484375, -6.68182373046875, -6.4478759765625, -6.21392822265625, -5.97998046875, -5.74603271484375, -5.5120849609375, -5.27813720703125, -5.044189453125, -4.81024169921875, -4.5762939453125, -4.34234619140625, -4.1083984375, -3.87445068359375, -3.6405029296875, -3.40655517578125, -3.172607421875, -2.93865966796875, -2.7047119140625, -2.47076416015625, -2.23681640625, -2.00286865234375, -1.7689208984375, -1.53497314453125, -1.301025390625, -1.06707763671875, -0.8331298828125, -0.59918212890625, -0.365234375, -0.13128662109375, 0.1026611328125, 0.33660888671875, 0.570556640625, 0.80450439453125, 1.0384521484375, 1.27239990234375, 1.50634765625, 1.74029541015625, 1.9742431640625, 2.20819091796875, 2.442138671875, 2.67608642578125, 2.9100341796875, 3.14398193359375, 3.3779296875, 3.61187744140625, 3.8458251953125, 4.07977294921875, 4.313720703125, 4.54766845703125, 4.7816162109375, 5.01556396484375, 5.24951171875, 5.48345947265625, 5.7174072265625, 5.95135498046875, 6.185302734375, 6.41925048828125, 6.6531982421875, 6.88714599609375, 7.12109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 6.0, 3.0, 2.0, 2.0, 6.0, 11.0, 15.0, 19.0, 30.0, 38.0, 67.0, 112.0, 146.0, 151.0, 119.0, 89.0, 53.0, 32.0, 32.0, 17.0, 16.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0532073974609375, -1.021453857421875, -0.9897003173828125, -0.95794677734375, -0.9261932373046875, -0.894439697265625, -0.8626861572265625, -0.8309326171875, -0.7991790771484375, -0.767425537109375, -0.7356719970703125, -0.70391845703125, -0.6721649169921875, -0.640411376953125, -0.6086578369140625, -0.576904296875, -0.5451507568359375, -0.513397216796875, -0.4816436767578125, -0.44989013671875, -0.4181365966796875, -0.386383056640625, -0.3546295166015625, -0.3228759765625, -0.2911224365234375, -0.259368896484375, -0.2276153564453125, -0.19586181640625, -0.1641082763671875, -0.132354736328125, -0.1006011962890625, -0.06884765625, -0.0370941162109375, -0.005340576171875, 0.0264129638671875, 0.05816650390625, 0.0899200439453125, 0.121673583984375, 0.1534271240234375, 0.1851806640625, 0.2169342041015625, 0.248687744140625, 0.2804412841796875, 0.31219482421875, 0.3439483642578125, 0.375701904296875, 0.4074554443359375, 0.439208984375, 0.4709625244140625, 0.502716064453125, 0.5344696044921875, 0.56622314453125, 0.5979766845703125, 0.629730224609375, 0.6614837646484375, 0.6932373046875, 0.7249908447265625, 0.756744384765625, 0.7884979248046875, 0.82025146484375, 0.8520050048828125, 0.883758544921875, 0.9155120849609375, 0.947265625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 9.0, 60.0, 273.0, 398.0, 214.0, 49.0, 10.0, 3.0], "bins": [-115.10926818847656, -113.16902160644531, -111.22877502441406, -109.28852844238281, -107.3482894897461, -105.40804290771484, -103.4677963256836, -101.52754974365234, -99.5873031616211, -97.64705657958984, -95.7068099975586, -93.76657104492188, -91.82632446289062, -89.88607788085938, -87.94583129882812, -86.00558471679688, -84.06533813476562, -82.12509155273438, -80.18484497070312, -78.24459838867188, -76.30435943603516, -74.3641128540039, -72.42386627197266, -70.4836196899414, -68.54338073730469, -66.60313415527344, -64.66288757324219, -62.7226448059082, -60.78239822387695, -58.84215545654297, -56.90190887451172, -54.96166229248047, -53.02141571044922, -51.08116912841797, -49.140926361083984, -47.200679779052734, -45.260433197021484, -43.3201904296875, -41.37994384765625, -39.439697265625, -37.499454498291016, -35.559207916259766, -33.61896514892578, -31.67871856689453, -29.73847198486328, -27.798227310180664, -25.857982635498047, -23.917736053466797, -21.97749137878418, -20.037246704101562, -18.097000122070312, -16.156755447387695, -14.216509819030762, -12.276264190673828, -10.336019515991211, -8.395773887634277, -6.455528259277344, -4.51528263092041, -2.5750374794006348, -0.6347923278808594, 1.3054533004760742, 3.245698928833008, 5.185943603515625, 7.126189231872559, 9.066434860229492]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 10.0, 9.0, 18.0, 17.0, 30.0, 23.0, 38.0, 49.0, 64.0, 69.0, 74.0, 79.0, 75.0, 58.0, 63.0, 72.0, 69.0, 51.0, 38.0, 27.0, 19.0, 10.0, 10.0, 9.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.60319709777832, -18.151254653930664, -17.699312210083008, -17.24736976623535, -16.795425415039062, -16.343482971191406, -15.89154052734375, -15.439598083496094, -14.987655639648438, -14.535713195800781, -14.083770751953125, -13.631827354431152, -13.179884910583496, -12.72794246673584, -12.275999069213867, -11.824056625366211, -11.372114181518555, -10.920171737670898, -10.468229293823242, -10.01628589630127, -9.564343452453613, -9.112401008605957, -8.660457611083984, -8.208515167236328, -7.756572723388672, -7.304630279541016, -6.852687358856201, -6.400744438171387, -5.9488019943237305, -5.496859550476074, -5.04491662979126, -4.592973709106445, -4.141030311584473, -3.6890876293182373, -3.237144947052002, -2.7852022647857666, -2.3332595825195312, -1.881316900253296, -1.4293742179870605, -0.9774315357208252, -0.5254888534545898, -0.07354617118835449, 0.37839651107788086, 0.8303391933441162, 1.2822818756103516, 1.734224557876587, 2.1861672401428223, 2.6381099224090576, 3.090052604675293, 3.5419952869415283, 3.9939379692077637, 4.445880889892578, 4.897823333740234, 5.349765777587891, 5.801708698272705, 6.2536516189575195, 6.705594062805176, 7.157536506652832, 7.6094794273376465, 8.061422348022461, 8.513364791870117, 8.965307235717773, 9.41724967956543, 9.869193077087402, 10.321135520935059]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 10.0, 15.0, 21.0, 37.0, 41.0, 85.0, 143.0, 206.0, 450.0, 821.0, 1578.0, 3247.0, 6189.0, 12462.0, 26214.0, 54505.0, 113677.0, 209980.0, 258468.0, 181276.0, 92915.0, 43934.0, 21295.0, 10211.0, 5183.0, 2591.0, 1368.0, 720.0, 366.0, 192.0, 117.0, 85.0, 46.0, 23.0, 15.0, 12.0, 8.0, 9.0, 8.0, 3.0, 4.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.0390625, -3.9014892578125, -3.763916015625, -3.6263427734375, -3.48876953125, -3.3511962890625, -3.213623046875, -3.0760498046875, -2.9384765625, -2.8009033203125, -2.663330078125, -2.5257568359375, -2.38818359375, -2.2506103515625, -2.113037109375, -1.9754638671875, -1.837890625, -1.7003173828125, -1.562744140625, -1.4251708984375, -1.28759765625, -1.1500244140625, -1.012451171875, -0.8748779296875, -0.7373046875, -0.5997314453125, -0.462158203125, -0.3245849609375, -0.18701171875, -0.0494384765625, 0.088134765625, 0.2257080078125, 0.36328125, 0.5008544921875, 0.638427734375, 0.7760009765625, 0.91357421875, 1.0511474609375, 1.188720703125, 1.3262939453125, 1.4638671875, 1.6014404296875, 1.739013671875, 1.8765869140625, 2.01416015625, 2.1517333984375, 2.289306640625, 2.4268798828125, 2.564453125, 2.7020263671875, 2.839599609375, 2.9771728515625, 3.11474609375, 3.2523193359375, 3.389892578125, 3.5274658203125, 3.6650390625, 3.8026123046875, 3.940185546875, 4.0777587890625, 4.21533203125, 4.3529052734375, 4.490478515625, 4.6280517578125, 4.765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 12.0, 13.0, 13.0, 10.0, 20.0, 34.0, 37.0, 39.0, 36.0, 50.0, 55.0, 53.0, 62.0, 63.0, 59.0, 67.0, 67.0, 54.0, 49.0, 44.0, 34.0, 24.0, 27.0, 23.0, 15.0, 12.0, 14.0, 5.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.625, -31.825439453125, -31.02587890625, -30.226318359375, -29.4267578125, -28.627197265625, -27.82763671875, -27.028076171875, -26.228515625, -25.428955078125, -24.62939453125, -23.829833984375, -23.0302734375, -22.230712890625, -21.43115234375, -20.631591796875, -19.83203125, -19.032470703125, -18.23291015625, -17.433349609375, -16.6337890625, -15.834228515625, -15.03466796875, -14.235107421875, -13.435546875, -12.635986328125, -11.83642578125, -11.036865234375, -10.2373046875, -9.437744140625, -8.63818359375, -7.838623046875, -7.0390625, -6.239501953125, -5.43994140625, -4.640380859375, -3.8408203125, -3.041259765625, -2.24169921875, -1.442138671875, -0.642578125, 0.156982421875, 0.95654296875, 1.756103515625, 2.5556640625, 3.355224609375, 4.15478515625, 4.954345703125, 5.75390625, 6.553466796875, 7.35302734375, 8.152587890625, 8.9521484375, 9.751708984375, 10.55126953125, 11.350830078125, 12.150390625, 12.949951171875, 13.74951171875, 14.549072265625, 15.3486328125, 16.148193359375, 16.94775390625, 17.747314453125, 18.546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 3.0, 5.0, 4.0, 9.0, 7.0, 11.0, 14.0, 20.0, 26.0, 44.0, 51.0, 62.0, 113.0, 133.0, 242.0, 365.0, 894.0, 3219.0, 24303.0, 334851.0, 620582.0, 55297.0, 5744.0, 1215.0, 499.0, 278.0, 154.0, 120.0, 75.0, 55.0, 39.0, 31.0, 19.0, 16.0, 11.0, 10.0, 10.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-17.84375, -17.350341796875, -16.85693359375, -16.363525390625, -15.8701171875, -15.376708984375, -14.88330078125, -14.389892578125, -13.896484375, -13.403076171875, -12.90966796875, -12.416259765625, -11.9228515625, -11.429443359375, -10.93603515625, -10.442626953125, -9.94921875, -9.455810546875, -8.96240234375, -8.468994140625, -7.9755859375, -7.482177734375, -6.98876953125, -6.495361328125, -6.001953125, -5.508544921875, -5.01513671875, -4.521728515625, -4.0283203125, -3.534912109375, -3.04150390625, -2.548095703125, -2.0546875, -1.561279296875, -1.06787109375, -0.574462890625, -0.0810546875, 0.412353515625, 0.90576171875, 1.399169921875, 1.892578125, 2.385986328125, 2.87939453125, 3.372802734375, 3.8662109375, 4.359619140625, 4.85302734375, 5.346435546875, 5.83984375, 6.333251953125, 6.82666015625, 7.320068359375, 7.8134765625, 8.306884765625, 8.80029296875, 9.293701171875, 9.787109375, 10.280517578125, 10.77392578125, 11.267333984375, 11.7607421875, 12.254150390625, 12.74755859375, 13.240966796875, 13.734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 9.0, 11.0, 15.0, 9.0, 8.0, 16.0, 20.0, 30.0, 36.0, 38.0, 27.0, 45.0, 38.0, 44.0, 48.0, 47.0, 47.0, 24.0, 52.0, 44.0, 38.0, 51.0, 32.0, 33.0, 35.0, 28.0, 36.0, 23.0, 13.0, 29.0, 13.0, 18.0, 10.0, 4.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.7216796875, -17.115234375, -16.5087890625, -15.90234375, -15.2958984375, -14.689453125, -14.0830078125, -13.4765625, -12.8701171875, -12.263671875, -11.6572265625, -11.05078125, -10.4443359375, -9.837890625, -9.2314453125, -8.625, -8.0185546875, -7.412109375, -6.8056640625, -6.19921875, -5.5927734375, -4.986328125, -4.3798828125, -3.7734375, -3.1669921875, -2.560546875, -1.9541015625, -1.34765625, -0.7412109375, -0.134765625, 0.4716796875, 1.078125, 1.6845703125, 2.291015625, 2.8974609375, 3.50390625, 4.1103515625, 4.716796875, 5.3232421875, 5.9296875, 6.5361328125, 7.142578125, 7.7490234375, 8.35546875, 8.9619140625, 9.568359375, 10.1748046875, 10.78125, 11.3876953125, 11.994140625, 12.6005859375, 13.20703125, 13.8134765625, 14.419921875, 15.0263671875, 15.6328125, 16.2392578125, 16.845703125, 17.4521484375, 18.05859375, 18.6650390625, 19.271484375, 19.8779296875, 20.484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 10.0, 13.0, 31.0, 34.0, 65.0, 178.0, 436.0, 1413.0, 6019.0, 65001.0, 755297.0, 204179.0, 12434.0, 2296.0, 677.0, 229.0, 109.0, 45.0, 22.0, 17.0, 12.0, 8.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.719879150390625, -3.56280517578125, -3.405731201171875, -3.2486572265625, -3.091583251953125, -2.93450927734375, -2.777435302734375, -2.620361328125, -2.463287353515625, -2.30621337890625, -2.149139404296875, -1.9920654296875, -1.834991455078125, -1.67791748046875, -1.520843505859375, -1.36376953125, -1.206695556640625, -1.04962158203125, -0.892547607421875, -0.7354736328125, -0.578399658203125, -0.42132568359375, -0.264251708984375, -0.107177734375, 0.049896240234375, 0.20697021484375, 0.364044189453125, 0.5211181640625, 0.678192138671875, 0.83526611328125, 0.992340087890625, 1.1494140625, 1.306488037109375, 1.46356201171875, 1.620635986328125, 1.7777099609375, 1.934783935546875, 2.09185791015625, 2.248931884765625, 2.406005859375, 2.563079833984375, 2.72015380859375, 2.877227783203125, 3.0343017578125, 3.191375732421875, 3.34844970703125, 3.505523681640625, 3.66259765625, 3.819671630859375, 3.97674560546875, 4.133819580078125, 4.2908935546875, 4.447967529296875, 4.60504150390625, 4.762115478515625, 4.919189453125, 5.076263427734375, 5.23333740234375, 5.390411376953125, 5.5474853515625, 5.704559326171875, 5.86163330078125, 6.018707275390625, 6.17578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 4.0, 4.0, 4.0, 12.0, 12.0, 30.0, 37.0, 46.0, 69.0, 58.0, 71.0, 89.0, 83.0, 92.0, 84.0, 74.0, 57.0, 30.0, 37.0, 26.0, 18.0, 14.0, 15.0, 10.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005397796630859375, -0.0005257874727249146, -0.0005117952823638916, -0.0004978030920028687, -0.0004838109016418457, -0.00046981871128082275, -0.0004558265209197998, -0.00044183433055877686, -0.0004278421401977539, -0.00041384994983673096, -0.000399857759475708, -0.00038586556911468506, -0.0003718733787536621, -0.00035788118839263916, -0.0003438889980316162, -0.00032989680767059326, -0.0003159046173095703, -0.00030191242694854736, -0.0002879202365875244, -0.00027392804622650146, -0.0002599358558654785, -0.00024594366550445557, -0.00023195147514343262, -0.00021795928478240967, -0.00020396709442138672, -0.00018997490406036377, -0.00017598271369934082, -0.00016199052333831787, -0.00014799833297729492, -0.00013400614261627197, -0.00012001395225524902, -0.00010602176189422607, -9.202957153320312e-05, -7.803738117218018e-05, -6.404519081115723e-05, -5.005300045013428e-05, -3.606081008911133e-05, -2.206861972808838e-05, -8.07642936706543e-06, 5.9157609939575195e-06, 1.990795135498047e-05, 3.390014171600342e-05, 4.789233207702637e-05, 6.188452243804932e-05, 7.587671279907227e-05, 8.986890316009521e-05, 0.00010386109352111816, 0.00011785328388214111, 0.00013184547424316406, 0.000145837664604187, 0.00015982985496520996, 0.0001738220453262329, 0.00018781423568725586, 0.0002018064260482788, 0.00021579861640930176, 0.0002297908067703247, 0.00024378299713134766, 0.0002577751874923706, 0.00027176737785339355, 0.0002857595682144165, 0.00029975175857543945, 0.0003137439489364624, 0.00032773613929748535, 0.0003417283296585083, 0.00035572052001953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 14.0, 21.0, 24.0, 39.0, 81.0, 159.0, 276.0, 767.0, 2898.0, 18981.0, 337772.0, 639843.0, 41211.0, 4605.0, 1099.0, 369.0, 157.0, 77.0, 54.0, 37.0, 16.0, 12.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6015625, -5.44219970703125, -5.2828369140625, -5.12347412109375, -4.964111328125, -4.80474853515625, -4.6453857421875, -4.48602294921875, -4.32666015625, -4.16729736328125, -4.0079345703125, -3.84857177734375, -3.689208984375, -3.52984619140625, -3.3704833984375, -3.21112060546875, -3.0517578125, -2.89239501953125, -2.7330322265625, -2.57366943359375, -2.414306640625, -2.25494384765625, -2.0955810546875, -1.93621826171875, -1.77685546875, -1.61749267578125, -1.4581298828125, -1.29876708984375, -1.139404296875, -0.98004150390625, -0.8206787109375, -0.66131591796875, -0.501953125, -0.34259033203125, -0.1832275390625, -0.02386474609375, 0.135498046875, 0.29486083984375, 0.4542236328125, 0.61358642578125, 0.77294921875, 0.93231201171875, 1.0916748046875, 1.25103759765625, 1.410400390625, 1.56976318359375, 1.7291259765625, 1.88848876953125, 2.0478515625, 2.20721435546875, 2.3665771484375, 2.52593994140625, 2.685302734375, 2.84466552734375, 3.0040283203125, 3.16339111328125, 3.32275390625, 3.48211669921875, 3.6414794921875, 3.80084228515625, 3.960205078125, 4.11956787109375, 4.2789306640625, 4.43829345703125, 4.59765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 3.0, 11.0, 12.0, 10.0, 15.0, 21.0, 30.0, 36.0, 34.0, 50.0, 69.0, 93.0, 105.0, 93.0, 56.0, 70.0, 60.0, 46.0, 45.0, 36.0, 23.0, 23.0, 5.0, 8.0, 9.0, 10.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.2390899658203125, -1.196929931640625, -1.1547698974609375, -1.11260986328125, -1.0704498291015625, -1.028289794921875, -0.9861297607421875, -0.9439697265625, -0.9018096923828125, -0.859649658203125, -0.8174896240234375, -0.77532958984375, -0.7331695556640625, -0.691009521484375, -0.6488494873046875, -0.606689453125, -0.5645294189453125, -0.522369384765625, -0.4802093505859375, -0.43804931640625, -0.3958892822265625, -0.353729248046875, -0.3115692138671875, -0.2694091796875, -0.2272491455078125, -0.185089111328125, -0.1429290771484375, -0.10076904296875, -0.0586090087890625, -0.016448974609375, 0.0257110595703125, 0.06787109375, 0.1100311279296875, 0.152191162109375, 0.1943511962890625, 0.23651123046875, 0.2786712646484375, 0.320831298828125, 0.3629913330078125, 0.4051513671875, 0.4473114013671875, 0.489471435546875, 0.5316314697265625, 0.57379150390625, 0.6159515380859375, 0.658111572265625, 0.7002716064453125, 0.742431640625, 0.7845916748046875, 0.826751708984375, 0.8689117431640625, 0.91107177734375, 0.9532318115234375, 0.995391845703125, 1.0375518798828125, 1.0797119140625, 1.1218719482421875, 1.164031982421875, 1.2061920166015625, 1.24835205078125, 1.2905120849609375, 1.332672119140625, 1.3748321533203125, 1.4169921875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 11.0, 191.0, 605.0, 198.0, 14.0], "bins": [-308.8100280761719, -303.78314208984375, -298.75628662109375, -293.7294006347656, -288.7025451660156, -283.6756591796875, -278.6488037109375, -273.6219177246094, -268.5950622558594, -263.56817626953125, -258.54132080078125, -253.5144500732422, -248.48757934570312, -243.460693359375, -238.433837890625, -233.40695190429688, -228.38006591796875, -223.3531951904297, -218.32632446289062, -213.29945373535156, -208.2725830078125, -203.24569702148438, -198.21884155273438, -193.19195556640625, -188.16510009765625, -183.1382293701172, -178.11135864257812, -173.08448791503906, -168.0576171875, -163.03073120117188, -158.00387573242188, -152.97698974609375, -147.95013427734375, -142.9232635498047, -137.89639282226562, -132.86952209472656, -127.84264373779297, -122.8157730102539, -117.78890228271484, -112.76202392578125, -107.73515319824219, -102.70828247070312, -97.68141174316406, -92.654541015625, -87.6276626586914, -82.60079193115234, -77.57392120361328, -72.54704284667969, -67.52017211914062, -62.49330139160156, -57.466426849365234, -52.43955612182617, -47.412681579589844, -42.38581085205078, -37.35894012451172, -32.33206558227539, -27.305198669433594, -22.2783260345459, -17.251453399658203, -12.22458267211914, -7.197710037231445, -2.17083740234375, 2.8560333251953125, 7.882907867431641, 12.909778594970703]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 7.0, 7.0, 7.0, 5.0, 9.0, 13.0, 12.0, 18.0, 13.0, 19.0, 21.0, 24.0, 24.0, 36.0, 27.0, 34.0, 39.0, 43.0, 43.0, 39.0, 40.0, 46.0, 47.0, 46.0, 38.0, 30.0, 35.0, 35.0, 30.0, 27.0, 30.0, 23.0, 21.0, 22.0, 19.0, 13.0, 9.0, 10.0, 10.0, 3.0, 6.0, 1.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-30.17464256286621, -29.319936752319336, -28.46523094177246, -27.610525131225586, -26.755821228027344, -25.90111541748047, -25.046409606933594, -24.19170379638672, -23.336997985839844, -22.48229217529297, -21.627586364746094, -20.77288055419922, -19.918174743652344, -19.06346893310547, -18.208765029907227, -17.35405921936035, -16.499353408813477, -15.644647598266602, -14.789941787719727, -13.935236930847168, -13.080531120300293, -12.225825309753418, -11.37112045288086, -10.516414642333984, -9.66170883178711, -8.807003021240234, -7.952297687530518, -7.097592353820801, -6.242886543273926, -5.388180732727051, -4.533475399017334, -3.678770065307617, -2.824064254760742, -1.9693586826324463, -1.1146531105041504, -0.2599475383758545, 0.5947580337524414, 1.4494638442993164, 2.304169178009033, 3.15887451171875, 4.013580322265625, 4.8682861328125, 5.722991466522217, 6.577696800231934, 7.432402610778809, 8.287108421325684, 9.141813278198242, 9.996519088745117, 10.851224899291992, 11.705930709838867, 12.560636520385742, 13.4153413772583, 14.270047187805176, 15.12475299835205, 15.97945785522461, 16.834163665771484, 17.68886947631836, 18.543575286865234, 19.39828109741211, 20.252986907958984, 21.10769271850586, 21.962398529052734, 22.817102432250977, 23.67180824279785, 24.526514053344727]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 11.0, 12.0, 20.0, 25.0, 30.0, 58.0, 74.0, 154.0, 321.0, 766.0, 2078.0, 7237.0, 36275.0, 247456.0, 1516429.0, 1918647.0, 395292.0, 52150.0, 10497.0, 2967.0, 1418.0, 943.0, 704.0, 403.0, 170.0, 72.0, 26.0, 18.0, 8.0, 5.0, 5.0, 4.0, 1.0], "bins": [-23.25, -22.745849609375, -22.24169921875, -21.737548828125, -21.2333984375, -20.729248046875, -20.22509765625, -19.720947265625, -19.216796875, -18.712646484375, -18.20849609375, -17.704345703125, -17.2001953125, -16.696044921875, -16.19189453125, -15.687744140625, -15.18359375, -14.679443359375, -14.17529296875, -13.671142578125, -13.1669921875, -12.662841796875, -12.15869140625, -11.654541015625, -11.150390625, -10.646240234375, -10.14208984375, -9.637939453125, -9.1337890625, -8.629638671875, -8.12548828125, -7.621337890625, -7.1171875, -6.613037109375, -6.10888671875, -5.604736328125, -5.1005859375, -4.596435546875, -4.09228515625, -3.588134765625, -3.083984375, -2.579833984375, -2.07568359375, -1.571533203125, -1.0673828125, -0.563232421875, -0.05908203125, 0.445068359375, 0.94921875, 1.453369140625, 1.95751953125, 2.461669921875, 2.9658203125, 3.469970703125, 3.97412109375, 4.478271484375, 4.982421875, 5.486572265625, 5.99072265625, 6.494873046875, 6.9990234375, 7.503173828125, 8.00732421875, 8.511474609375, 9.015625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 19.0, 23.0, 29.0, 57.0, 63.0, 86.0, 100.0, 111.0, 110.0, 108.0, 108.0, 61.0, 60.0, 30.0, 16.0, 15.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-37.03125, -36.2901611328125, -35.549072265625, -34.8079833984375, -34.06689453125, -33.3258056640625, -32.584716796875, -31.8436279296875, -31.1025390625, -30.3614501953125, -29.620361328125, -28.8792724609375, -28.13818359375, -27.3970947265625, -26.656005859375, -25.9149169921875, -25.173828125, -24.4327392578125, -23.691650390625, -22.9505615234375, -22.20947265625, -21.4683837890625, -20.727294921875, -19.9862060546875, -19.2451171875, -18.5040283203125, -17.762939453125, -17.0218505859375, -16.28076171875, -15.5396728515625, -14.798583984375, -14.0574951171875, -13.31640625, -12.5753173828125, -11.834228515625, -11.0931396484375, -10.35205078125, -9.6109619140625, -8.869873046875, -8.1287841796875, -7.3876953125, -6.6466064453125, -5.905517578125, -5.1644287109375, -4.42333984375, -3.6822509765625, -2.941162109375, -2.2000732421875, -1.458984375, -0.7178955078125, 0.023193359375, 0.7642822265625, 1.50537109375, 2.2464599609375, 2.987548828125, 3.7286376953125, 4.4697265625, 5.2108154296875, 5.951904296875, 6.6929931640625, 7.43408203125, 8.1751708984375, 8.916259765625, 9.6573486328125, 10.3984375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 11.0, 28.0, 48.0, 99.0, 177.0, 536.0, 5863.0, 4134407.0, 51510.0, 1066.0, 281.0, 114.0, 52.0, 30.0, 20.0, 7.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.59375, -57.17822265625, -54.7626953125, -52.34716796875, -49.931640625, -47.51611328125, -45.1005859375, -42.68505859375, -40.26953125, -37.85400390625, -35.4384765625, -33.02294921875, -30.607421875, -28.19189453125, -25.7763671875, -23.36083984375, -20.9453125, -18.52978515625, -16.1142578125, -13.69873046875, -11.283203125, -8.86767578125, -6.4521484375, -4.03662109375, -1.62109375, 0.79443359375, 3.2099609375, 5.62548828125, 8.041015625, 10.45654296875, 12.8720703125, 15.28759765625, 17.703125, 20.11865234375, 22.5341796875, 24.94970703125, 27.365234375, 29.78076171875, 32.1962890625, 34.61181640625, 37.02734375, 39.44287109375, 41.8583984375, 44.27392578125, 46.689453125, 49.10498046875, 51.5205078125, 53.93603515625, 56.3515625, 58.76708984375, 61.1826171875, 63.59814453125, 66.013671875, 68.42919921875, 70.8447265625, 73.26025390625, 75.67578125, 78.09130859375, 80.5068359375, 82.92236328125, 85.337890625, 87.75341796875, 90.1689453125, 92.58447265625, 95.0]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 9.0, 15.0, 45.0, 73.0, 150.0, 281.0, 690.0, 1088.0, 906.0, 433.0, 210.0, 93.0, 36.0, 18.0, 6.0, 9.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.33795166015625, -6.0157470703125, -5.69354248046875, -5.371337890625, -5.04913330078125, -4.7269287109375, -4.40472412109375, -4.08251953125, -3.76031494140625, -3.4381103515625, -3.11590576171875, -2.793701171875, -2.47149658203125, -2.1492919921875, -1.82708740234375, -1.5048828125, -1.18267822265625, -0.8604736328125, -0.53826904296875, -0.216064453125, 0.10614013671875, 0.4283447265625, 0.75054931640625, 1.07275390625, 1.39495849609375, 1.7171630859375, 2.03936767578125, 2.361572265625, 2.68377685546875, 3.0059814453125, 3.32818603515625, 3.650390625, 3.97259521484375, 4.2947998046875, 4.61700439453125, 4.939208984375, 5.26141357421875, 5.5836181640625, 5.90582275390625, 6.22802734375, 6.55023193359375, 6.8724365234375, 7.19464111328125, 7.516845703125, 7.83905029296875, 8.1612548828125, 8.48345947265625, 8.8056640625, 9.12786865234375, 9.4500732421875, 9.77227783203125, 10.094482421875, 10.41668701171875, 10.7388916015625, 11.06109619140625, 11.38330078125, 11.70550537109375, 12.0277099609375, 12.34991455078125, 12.672119140625, 12.99432373046875, 13.3165283203125, 13.63873291015625, 13.9609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 17.0, 55.0, 92.0, 180.0, 215.0, 194.0, 117.0, 82.0, 34.0, 11.0, 4.0, 3.0, 0.0, 1.0], "bins": [-67.9037857055664, -66.65933990478516, -65.4148941040039, -64.17044830322266, -62.926002502441406, -61.681556701660156, -60.437110900878906, -59.19266128540039, -57.94821548461914, -56.70376968383789, -55.45932388305664, -54.21487808227539, -52.97043228149414, -51.725982666015625, -50.481536865234375, -49.237091064453125, -47.992645263671875, -46.748199462890625, -45.503753662109375, -44.259307861328125, -43.014862060546875, -41.770416259765625, -40.525970458984375, -39.28152084350586, -38.037078857421875, -36.792633056640625, -35.548187255859375, -34.303741455078125, -33.059295654296875, -31.814847946166992, -30.570402145385742, -29.32595443725586, -28.08150863647461, -26.83706283569336, -25.59261703491211, -24.34817123413086, -23.103723526000977, -21.859277725219727, -20.614831924438477, -19.370384216308594, -18.125940322875977, -16.881494522094727, -15.63704776763916, -14.39260196685791, -13.148155212402344, -11.903709411621094, -10.659263610839844, -9.414816856384277, -8.170371055603027, -6.925924777984619, -5.681478500366211, -4.437032699584961, -3.1925864219665527, -1.9481401443481445, -0.7036943435668945, 0.5407524108886719, 1.7851982116699219, 3.02964448928833, 4.274090766906738, 5.518536567687988, 6.7629828453063965, 8.007429122924805, 9.251874923706055, 10.496321678161621, 11.740767478942871]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 12.0, 12.0, 12.0, 21.0, 30.0, 39.0, 65.0, 44.0, 73.0, 69.0, 72.0, 68.0, 76.0, 61.0, 65.0, 58.0, 62.0, 44.0, 35.0, 16.0, 26.0, 13.0, 15.0, 8.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-27.55113410949707, -26.964435577392578, -26.37773895263672, -25.79104232788086, -25.204343795776367, -24.617645263671875, -24.030948638916016, -23.444252014160156, -22.857553482055664, -22.270854949951172, -21.684158325195312, -21.097461700439453, -20.51076316833496, -19.92406463623047, -19.33736801147461, -18.75067138671875, -18.163972854614258, -17.577274322509766, -16.990577697753906, -16.403881072998047, -15.817182540893555, -15.230484962463379, -14.643787384033203, -14.057089805603027, -13.470392227172852, -12.883694648742676, -12.2969970703125, -11.710299491882324, -11.123601913452148, -10.536904335021973, -9.950206756591797, -9.363509178161621, -8.776813507080078, -8.190115928649902, -7.603418350219727, -7.016720771789551, -6.430023193359375, -5.843325614929199, -5.256628036499023, -4.669930458068848, -4.083232879638672, -3.496535301208496, -2.9098377227783203, -2.3231401443481445, -1.7364425659179688, -1.149744987487793, -0.5630474090576172, 0.023650169372558594, 0.6103477478027344, 1.1970453262329102, 1.783742904663086, 2.3704404830932617, 2.9571380615234375, 3.5438356399536133, 4.130533218383789, 4.717230796813965, 5.303928375244141, 5.890625953674316, 6.477323532104492, 7.064021110534668, 7.650718688964844, 8.23741626739502, 8.824113845825195, 9.410811424255371, 9.997509002685547]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 15.0, 24.0, 25.0, 53.0, 70.0, 169.0, 342.0, 836.0, 2206.0, 7013.0, 28115.0, 132580.0, 479848.0, 309678.0, 66203.0, 14729.0, 4051.0, 1449.0, 544.0, 279.0, 126.0, 70.0, 38.0, 31.0, 11.0, 11.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.484375, -5.322021484375, -5.15966796875, -4.997314453125, -4.8349609375, -4.672607421875, -4.51025390625, -4.347900390625, -4.185546875, -4.023193359375, -3.86083984375, -3.698486328125, -3.5361328125, -3.373779296875, -3.21142578125, -3.049072265625, -2.88671875, -2.724365234375, -2.56201171875, -2.399658203125, -2.2373046875, -2.074951171875, -1.91259765625, -1.750244140625, -1.587890625, -1.425537109375, -1.26318359375, -1.100830078125, -0.9384765625, -0.776123046875, -0.61376953125, -0.451416015625, -0.2890625, -0.126708984375, 0.03564453125, 0.197998046875, 0.3603515625, 0.522705078125, 0.68505859375, 0.847412109375, 1.009765625, 1.172119140625, 1.33447265625, 1.496826171875, 1.6591796875, 1.821533203125, 1.98388671875, 2.146240234375, 2.30859375, 2.470947265625, 2.63330078125, 2.795654296875, 2.9580078125, 3.120361328125, 3.28271484375, 3.445068359375, 3.607421875, 3.769775390625, 3.93212890625, 4.094482421875, 4.2568359375, 4.419189453125, 4.58154296875, 4.743896484375, 4.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 10.0, 13.0, 16.0, 25.0, 43.0, 54.0, 63.0, 76.0, 82.0, 86.0, 80.0, 96.0, 67.0, 67.0, 60.0, 53.0, 39.0, 25.0, 22.0, 10.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-21.546875, -21.0828857421875, -20.618896484375, -20.1549072265625, -19.69091796875, -19.2269287109375, -18.762939453125, -18.2989501953125, -17.8349609375, -17.3709716796875, -16.906982421875, -16.4429931640625, -15.97900390625, -15.5150146484375, -15.051025390625, -14.5870361328125, -14.123046875, -13.6590576171875, -13.195068359375, -12.7310791015625, -12.26708984375, -11.8031005859375, -11.339111328125, -10.8751220703125, -10.4111328125, -9.9471435546875, -9.483154296875, -9.0191650390625, -8.55517578125, -8.0911865234375, -7.627197265625, -7.1632080078125, -6.69921875, -6.2352294921875, -5.771240234375, -5.3072509765625, -4.84326171875, -4.3792724609375, -3.915283203125, -3.4512939453125, -2.9873046875, -2.5233154296875, -2.059326171875, -1.5953369140625, -1.13134765625, -0.6673583984375, -0.203369140625, 0.2606201171875, 0.724609375, 1.1885986328125, 1.652587890625, 2.1165771484375, 2.58056640625, 3.0445556640625, 3.508544921875, 3.9725341796875, 4.4365234375, 4.9005126953125, 5.364501953125, 5.8284912109375, 6.29248046875, 6.7564697265625, 7.220458984375, 7.6844482421875, 8.1484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 5.0, 5.0, 11.0, 11.0, 12.0, 13.0, 13.0, 25.0, 37.0, 45.0, 72.0, 106.0, 172.0, 279.0, 444.0, 730.0, 1265.0, 2114.0, 3739.0, 6775.0, 12335.0, 22610.0, 40966.0, 74593.0, 126300.0, 184932.0, 200684.0, 153831.0, 95644.0, 53777.0, 29982.0, 16302.0, 8932.0, 4941.0, 2759.0, 1614.0, 937.0, 543.0, 335.0, 193.0, 141.0, 95.0, 61.0, 45.0, 33.0, 25.0, 13.0, 20.0, 11.0, 11.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.6318359375, -1.5827178955078125, -1.533599853515625, -1.4844818115234375, -1.43536376953125, -1.3862457275390625, -1.337127685546875, -1.2880096435546875, -1.2388916015625, -1.1897735595703125, -1.140655517578125, -1.0915374755859375, -1.04241943359375, -0.9933013916015625, -0.944183349609375, -0.8950653076171875, -0.845947265625, -0.7968292236328125, -0.747711181640625, -0.6985931396484375, -0.64947509765625, -0.6003570556640625, -0.551239013671875, -0.5021209716796875, -0.4530029296875, -0.4038848876953125, -0.354766845703125, -0.3056488037109375, -0.25653076171875, -0.2074127197265625, -0.158294677734375, -0.1091766357421875, -0.06005859375, -0.0109405517578125, 0.038177490234375, 0.0872955322265625, 0.13641357421875, 0.1855316162109375, 0.234649658203125, 0.2837677001953125, 0.3328857421875, 0.3820037841796875, 0.431121826171875, 0.4802398681640625, 0.52935791015625, 0.5784759521484375, 0.627593994140625, 0.6767120361328125, 0.725830078125, 0.7749481201171875, 0.824066162109375, 0.8731842041015625, 0.92230224609375, 0.9714202880859375, 1.020538330078125, 1.0696563720703125, 1.1187744140625, 1.1678924560546875, 1.217010498046875, 1.2661285400390625, 1.31524658203125, 1.3643646240234375, 1.413482666015625, 1.4626007080078125, 1.51171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 7.0, 6.0, 8.0, 14.0, 15.0, 15.0, 25.0, 25.0, 28.0, 29.0, 30.0, 35.0, 29.0, 26.0, 48.0, 51.0, 39.0, 38.0, 45.0, 39.0, 42.0, 45.0, 38.0, 38.0, 39.0, 30.0, 30.0, 32.0, 29.0, 27.0, 13.0, 10.0, 19.0, 12.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.21875, -13.7901611328125, -13.361572265625, -12.9329833984375, -12.50439453125, -12.0758056640625, -11.647216796875, -11.2186279296875, -10.7900390625, -10.3614501953125, -9.932861328125, -9.5042724609375, -9.07568359375, -8.6470947265625, -8.218505859375, -7.7899169921875, -7.361328125, -6.9327392578125, -6.504150390625, -6.0755615234375, -5.64697265625, -5.2183837890625, -4.789794921875, -4.3612060546875, -3.9326171875, -3.5040283203125, -3.075439453125, -2.6468505859375, -2.21826171875, -1.7896728515625, -1.361083984375, -0.9324951171875, -0.50390625, -0.0753173828125, 0.353271484375, 0.7818603515625, 1.21044921875, 1.6390380859375, 2.067626953125, 2.4962158203125, 2.9248046875, 3.3533935546875, 3.781982421875, 4.2105712890625, 4.63916015625, 5.0677490234375, 5.496337890625, 5.9249267578125, 6.353515625, 6.7821044921875, 7.210693359375, 7.6392822265625, 8.06787109375, 8.4964599609375, 8.925048828125, 9.3536376953125, 9.7822265625, 10.2108154296875, 10.639404296875, 11.0679931640625, 11.49658203125, 11.9251708984375, 12.353759765625, 12.7823486328125, 13.2109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 9.0, 17.0, 14.0, 25.0, 32.0, 39.0, 78.0, 108.0, 161.0, 237.0, 387.0, 704.0, 1297.0, 2394.0, 4760.0, 9761.0, 21682.0, 51265.0, 164261.0, 477837.0, 206312.0, 59715.0, 24690.0, 11321.0, 5307.0, 2678.0, 1419.0, 810.0, 480.0, 227.0, 158.0, 123.0, 70.0, 51.0, 30.0, 31.0, 15.0, 14.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.766632080078125, -0.73980712890625, -0.712982177734375, -0.6861572265625, -0.659332275390625, -0.63250732421875, -0.605682373046875, -0.578857421875, -0.552032470703125, -0.52520751953125, -0.498382568359375, -0.4715576171875, -0.444732666015625, -0.41790771484375, -0.391082763671875, -0.3642578125, -0.337432861328125, -0.31060791015625, -0.283782958984375, -0.2569580078125, -0.230133056640625, -0.20330810546875, -0.176483154296875, -0.149658203125, -0.122833251953125, -0.09600830078125, -0.069183349609375, -0.0423583984375, -0.015533447265625, 0.01129150390625, 0.038116455078125, 0.06494140625, 0.091766357421875, 0.11859130859375, 0.145416259765625, 0.1722412109375, 0.199066162109375, 0.22589111328125, 0.252716064453125, 0.279541015625, 0.306365966796875, 0.33319091796875, 0.360015869140625, 0.3868408203125, 0.413665771484375, 0.44049072265625, 0.467315673828125, 0.494140625, 0.520965576171875, 0.54779052734375, 0.574615478515625, 0.6014404296875, 0.628265380859375, 0.65509033203125, 0.681915283203125, 0.708740234375, 0.735565185546875, 0.76239013671875, 0.789215087890625, 0.8160400390625, 0.842864990234375, 0.86968994140625, 0.896514892578125, 0.92333984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 2.0, 9.0, 10.0, 11.0, 14.0, 9.0, 16.0, 24.0, 39.0, 43.0, 96.0, 122.0, 128.0, 144.0, 92.0, 49.0, 42.0, 29.0, 25.0, 23.0, 18.0, 10.0, 10.0, 8.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007677078247070312, -0.000744938850402832, -0.0007221698760986328, -0.0006994009017944336, -0.0006766319274902344, -0.0006538629531860352, -0.0006310939788818359, -0.0006083250045776367, -0.0005855560302734375, -0.0005627870559692383, -0.0005400180816650391, -0.0005172491073608398, -0.0004944801330566406, -0.0004717111587524414, -0.0004489421844482422, -0.00042617321014404297, -0.00040340423583984375, -0.00038063526153564453, -0.0003578662872314453, -0.0003350973129272461, -0.0003123283386230469, -0.00028955936431884766, -0.00026679039001464844, -0.00024402141571044922, -0.00022125244140625, -0.00019848346710205078, -0.00017571449279785156, -0.00015294551849365234, -0.00013017654418945312, -0.0001074075698852539, -8.463859558105469e-05, -6.186962127685547e-05, -3.910064697265625e-05, -1.633167266845703e-05, 6.4373016357421875e-06, 2.9206275939941406e-05, 5.1975250244140625e-05, 7.474422454833984e-05, 9.751319885253906e-05, 0.00012028217315673828, 0.0001430511474609375, 0.00016582012176513672, 0.00018858909606933594, 0.00021135807037353516, 0.00023412704467773438, 0.0002568960189819336, 0.0002796649932861328, 0.00030243396759033203, 0.00032520294189453125, 0.00034797191619873047, 0.0003707408905029297, 0.0003935098648071289, 0.0004162788391113281, 0.00043904781341552734, 0.00046181678771972656, 0.0004845857620239258, 0.000507354736328125, 0.0005301237106323242, 0.0005528926849365234, 0.0005756616592407227, 0.0005984306335449219, 0.0006211996078491211, 0.0006439685821533203, 0.0006667375564575195, 0.0006895065307617188]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 7.0, 8.0, 10.0, 9.0, 19.0, 34.0, 65.0, 128.0, 272.0, 575.0, 1580.0, 5040.0, 19252.0, 105969.0, 714421.0, 164592.0, 26764.0, 6646.0, 1873.0, 727.0, 278.0, 123.0, 58.0, 37.0, 24.0, 12.0, 4.0, 10.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.80517578125, -1.748046875, -1.69091796875, -1.6337890625, -1.57666015625, -1.51953125, -1.46240234375, -1.4052734375, -1.34814453125, -1.291015625, -1.23388671875, -1.1767578125, -1.11962890625, -1.0625, -1.00537109375, -0.9482421875, -0.89111328125, -0.833984375, -0.77685546875, -0.7197265625, -0.66259765625, -0.60546875, -0.54833984375, -0.4912109375, -0.43408203125, -0.376953125, -0.31982421875, -0.2626953125, -0.20556640625, -0.1484375, -0.09130859375, -0.0341796875, 0.02294921875, 0.080078125, 0.13720703125, 0.1943359375, 0.25146484375, 0.30859375, 0.36572265625, 0.4228515625, 0.47998046875, 0.537109375, 0.59423828125, 0.6513671875, 0.70849609375, 0.765625, 0.82275390625, 0.8798828125, 0.93701171875, 0.994140625, 1.05126953125, 1.1083984375, 1.16552734375, 1.22265625, 1.27978515625, 1.3369140625, 1.39404296875, 1.451171875, 1.50830078125, 1.5654296875, 1.62255859375, 1.6796875, 1.73681640625, 1.7939453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 5.0, 18.0, 12.0, 23.0, 28.0, 34.0, 53.0, 78.0, 124.0, 139.0, 147.0, 111.0, 61.0, 39.0, 32.0, 19.0, 17.0, 8.0, 7.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40478515625, -0.38962554931640625, -0.3744659423828125, -0.35930633544921875, -0.344146728515625, -0.32898712158203125, -0.3138275146484375, -0.29866790771484375, -0.28350830078125, -0.26834869384765625, -0.2531890869140625, -0.23802947998046875, -0.222869873046875, -0.20771026611328125, -0.1925506591796875, -0.17739105224609375, -0.1622314453125, -0.14707183837890625, -0.1319122314453125, -0.11675262451171875, -0.101593017578125, -0.08643341064453125, -0.0712738037109375, -0.05611419677734375, -0.04095458984375, -0.02579498291015625, -0.0106353759765625, 0.00452423095703125, 0.019683837890625, 0.03484344482421875, 0.0500030517578125, 0.06516265869140625, 0.080322265625, 0.09548187255859375, 0.1106414794921875, 0.12580108642578125, 0.140960693359375, 0.15612030029296875, 0.1712799072265625, 0.18643951416015625, 0.20159912109375, 0.21675872802734375, 0.2319183349609375, 0.24707794189453125, 0.262237548828125, 0.27739715576171875, 0.2925567626953125, 0.30771636962890625, 0.3228759765625, 0.33803558349609375, 0.3531951904296875, 0.36835479736328125, 0.383514404296875, 0.39867401123046875, 0.4138336181640625, 0.42899322509765625, 0.44415283203125, 0.45931243896484375, 0.4744720458984375, 0.48963165283203125, 0.504791259765625, 0.5199508666992188, 0.5351104736328125, 0.5502700805664062, 0.5654296875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 12.0, 33.0, 73.0, 148.0, 208.0, 204.0, 155.0, 91.0, 42.0, 15.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71110153198242, -38.94668960571289, -38.18227767944336, -37.41786575317383, -36.6534538269043, -35.889041900634766, -35.124629974365234, -34.3602180480957, -33.59580612182617, -32.83139419555664, -32.06698226928711, -31.302570343017578, -30.538158416748047, -29.773746490478516, -29.009334564208984, -28.24492073059082, -27.480506896972656, -26.716094970703125, -25.951683044433594, -25.187271118164062, -24.42285919189453, -23.658447265625, -22.89403533935547, -22.129621505737305, -21.365211486816406, -20.600799560546875, -19.836387634277344, -19.071975708007812, -18.30756378173828, -17.54315185546875, -16.77873992919922, -16.014326095581055, -15.249914169311523, -14.485502243041992, -13.721090316772461, -12.95667839050293, -12.192265510559082, -11.42785358428955, -10.66344165802002, -9.899028778076172, -9.13461685180664, -8.37020492553711, -7.60579252243042, -6.841380596160889, -6.076968193054199, -5.312556266784668, -4.548144340515137, -3.7837319374084473, -3.019320487976074, -2.254908323287964, -1.490496277809143, -0.7260842323303223, 0.038327932357788086, 0.8027400970458984, 1.5671520233154297, 2.331564426422119, 3.0959763526916504, 3.8603885173797607, 4.624800682067871, 5.389212608337402, 6.153624534606934, 6.918036937713623, 7.682448863983154, 8.446861267089844, 9.211273193359375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 18.0, 17.0, 13.0, 26.0, 50.0, 50.0, 66.0, 65.0, 88.0, 89.0, 68.0, 77.0, 84.0, 57.0, 62.0, 56.0, 34.0, 23.0, 14.0, 19.0, 16.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-20.904251098632812, -20.454286575317383, -20.00432014465332, -19.55435562133789, -19.10439109802246, -18.6544246673584, -18.20446014404297, -17.75449562072754, -17.304529190063477, -16.854564666748047, -16.404598236083984, -15.954633712768555, -15.504668235778809, -15.054703712463379, -14.604738235473633, -14.154773712158203, -13.704809188842773, -13.254843711853027, -12.804879188537598, -12.354913711547852, -11.904948234558105, -11.454983711242676, -11.00501823425293, -10.5550537109375, -10.105087280273438, -9.655121803283691, -9.205157279968262, -8.755191802978516, -8.30522632598877, -7.85526180267334, -7.405296325683594, -6.955331325531006, -6.505366802215576, -6.055401802062988, -5.605436325073242, -5.155471324920654, -4.705506324768066, -4.25554084777832, -3.8055758476257324, -3.3556108474731445, -2.9056456089019775, -2.4556803703308105, -2.0057153701782227, -1.5557501316070557, -1.1057850122451782, -0.6558198928833008, -0.2058546543121338, 0.2441103458404541, 0.6940755844116211, 1.1440407037734985, 1.594005823135376, 2.043971061706543, 2.493936061859131, 2.943901300430298, 3.393866539001465, 3.8438315391540527, 4.293796539306641, 4.7437615394592285, 5.193727016448975, 5.6436920166015625, 6.09365701675415, 6.543622016906738, 6.993587493896484, 7.443552494049072, 7.893517971038818]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 10.0, 8.0, 22.0, 30.0, 42.0, 72.0, 124.0, 235.0, 468.0, 859.0, 2007.0, 4263.0, 9610.0, 23188.0, 61913.0, 168606.0, 366062.0, 254236.0, 96018.0, 35441.0, 14093.0, 5920.0, 2691.0, 1306.0, 632.0, 297.0, 164.0, 97.0, 46.0, 34.0, 15.0, 10.0, 10.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.33380126953125, -5.1480712890625, -4.96234130859375, -4.776611328125, -4.59088134765625, -4.4051513671875, -4.21942138671875, -4.03369140625, -3.84796142578125, -3.6622314453125, -3.47650146484375, -3.290771484375, -3.10504150390625, -2.9193115234375, -2.73358154296875, -2.5478515625, -2.36212158203125, -2.1763916015625, -1.99066162109375, -1.804931640625, -1.61920166015625, -1.4334716796875, -1.24774169921875, -1.06201171875, -0.87628173828125, -0.6905517578125, -0.50482177734375, -0.319091796875, -0.13336181640625, 0.0523681640625, 0.23809814453125, 0.423828125, 0.60955810546875, 0.7952880859375, 0.98101806640625, 1.166748046875, 1.35247802734375, 1.5382080078125, 1.72393798828125, 1.90966796875, 2.09539794921875, 2.2811279296875, 2.46685791015625, 2.652587890625, 2.83831787109375, 3.0240478515625, 3.20977783203125, 3.3955078125, 3.58123779296875, 3.7669677734375, 3.95269775390625, 4.138427734375, 4.32415771484375, 4.5098876953125, 4.69561767578125, 4.88134765625, 5.06707763671875, 5.2528076171875, 5.43853759765625, 5.624267578125, 5.80999755859375, 5.9957275390625, 6.18145751953125, 6.3671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 7.0, 13.0, 22.0, 19.0, 29.0, 47.0, 51.0, 63.0, 49.0, 57.0, 63.0, 67.0, 77.0, 69.0, 60.0, 57.0, 62.0, 48.0, 28.0, 33.0, 19.0, 16.0, 16.0, 11.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-30.609375, -29.9107666015625, -29.212158203125, -28.5135498046875, -27.81494140625, -27.1163330078125, -26.417724609375, -25.7191162109375, -25.0205078125, -24.3218994140625, -23.623291015625, -22.9246826171875, -22.22607421875, -21.5274658203125, -20.828857421875, -20.1302490234375, -19.431640625, -18.7330322265625, -18.034423828125, -17.3358154296875, -16.63720703125, -15.9385986328125, -15.239990234375, -14.5413818359375, -13.8427734375, -13.1441650390625, -12.445556640625, -11.7469482421875, -11.04833984375, -10.3497314453125, -9.651123046875, -8.9525146484375, -8.25390625, -7.5552978515625, -6.856689453125, -6.1580810546875, -5.45947265625, -4.7608642578125, -4.062255859375, -3.3636474609375, -2.6650390625, -1.9664306640625, -1.267822265625, -0.5692138671875, 0.12939453125, 0.8280029296875, 1.526611328125, 2.2252197265625, 2.923828125, 3.6224365234375, 4.321044921875, 5.0196533203125, 5.71826171875, 6.4168701171875, 7.115478515625, 7.8140869140625, 8.5126953125, 9.2113037109375, 9.909912109375, 10.6085205078125, 11.30712890625, 12.0057373046875, 12.704345703125, 13.4029541015625, 14.1015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 10.0, 9.0, 9.0, 16.0, 14.0, 32.0, 32.0, 51.0, 79.0, 114.0, 147.0, 435.0, 29263.0, 1015896.0, 1794.0, 224.0, 114.0, 91.0, 48.0, 36.0, 42.0, 15.0, 16.0, 20.0, 12.0, 8.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-67.0, -64.923828125, -62.84765625, -60.771484375, -58.6953125, -56.619140625, -54.54296875, -52.466796875, -50.390625, -48.314453125, -46.23828125, -44.162109375, -42.0859375, -40.009765625, -37.93359375, -35.857421875, -33.78125, -31.705078125, -29.62890625, -27.552734375, -25.4765625, -23.400390625, -21.32421875, -19.248046875, -17.171875, -15.095703125, -13.01953125, -10.943359375, -8.8671875, -6.791015625, -4.71484375, -2.638671875, -0.5625, 1.513671875, 3.58984375, 5.666015625, 7.7421875, 9.818359375, 11.89453125, 13.970703125, 16.046875, 18.123046875, 20.19921875, 22.275390625, 24.3515625, 26.427734375, 28.50390625, 30.580078125, 32.65625, 34.732421875, 36.80859375, 38.884765625, 40.9609375, 43.037109375, 45.11328125, 47.189453125, 49.265625, 51.341796875, 53.41796875, 55.494140625, 57.5703125, 59.646484375, 61.72265625, 63.798828125, 65.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 14.0, 8.0, 19.0, 21.0, 25.0, 27.0, 51.0, 58.0, 66.0, 69.0, 74.0, 65.0, 87.0, 66.0, 61.0, 51.0, 52.0, 37.0, 34.0, 22.0, 18.0, 14.0, 11.0, 8.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.5625, -27.640380859375, -26.71826171875, -25.796142578125, -24.8740234375, -23.951904296875, -23.02978515625, -22.107666015625, -21.185546875, -20.263427734375, -19.34130859375, -18.419189453125, -17.4970703125, -16.574951171875, -15.65283203125, -14.730712890625, -13.80859375, -12.886474609375, -11.96435546875, -11.042236328125, -10.1201171875, -9.197998046875, -8.27587890625, -7.353759765625, -6.431640625, -5.509521484375, -4.58740234375, -3.665283203125, -2.7431640625, -1.821044921875, -0.89892578125, 0.023193359375, 0.9453125, 1.867431640625, 2.78955078125, 3.711669921875, 4.6337890625, 5.555908203125, 6.47802734375, 7.400146484375, 8.322265625, 9.244384765625, 10.16650390625, 11.088623046875, 12.0107421875, 12.932861328125, 13.85498046875, 14.777099609375, 15.69921875, 16.621337890625, 17.54345703125, 18.465576171875, 19.3876953125, 20.309814453125, 21.23193359375, 22.154052734375, 23.076171875, 23.998291015625, 24.92041015625, 25.842529296875, 26.7646484375, 27.686767578125, 28.60888671875, 29.531005859375, 30.453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 12.0, 9.0, 22.0, 24.0, 42.0, 94.0, 257.0, 788.0, 4179.0, 525674.0, 511888.0, 4146.0, 864.0, 260.0, 113.0, 65.0, 31.0, 23.0, 15.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-23.296875, -22.7286376953125, -22.160400390625, -21.5921630859375, -21.02392578125, -20.4556884765625, -19.887451171875, -19.3192138671875, -18.7509765625, -18.1827392578125, -17.614501953125, -17.0462646484375, -16.47802734375, -15.9097900390625, -15.341552734375, -14.7733154296875, -14.205078125, -13.6368408203125, -13.068603515625, -12.5003662109375, -11.93212890625, -11.3638916015625, -10.795654296875, -10.2274169921875, -9.6591796875, -9.0909423828125, -8.522705078125, -7.9544677734375, -7.38623046875, -6.8179931640625, -6.249755859375, -5.6815185546875, -5.11328125, -4.5450439453125, -3.976806640625, -3.4085693359375, -2.84033203125, -2.2720947265625, -1.703857421875, -1.1356201171875, -0.5673828125, 0.0008544921875, 0.569091796875, 1.1373291015625, 1.70556640625, 2.2738037109375, 2.842041015625, 3.4102783203125, 3.978515625, 4.5467529296875, 5.114990234375, 5.6832275390625, 6.25146484375, 6.8197021484375, 7.387939453125, 7.9561767578125, 8.5244140625, 9.0926513671875, 9.660888671875, 10.2291259765625, 10.79736328125, 11.3656005859375, 11.933837890625, 12.5020751953125, 13.0703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 9.0, 19.0, 34.0, 70.0, 143.0, 237.0, 196.0, 133.0, 60.0, 40.0, 15.0, 15.0, 10.0, 4.0, 4.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013570785522460938, -0.0013222098350524902, -0.0012873411178588867, -0.0012524724006652832, -0.0012176036834716797, -0.0011827349662780762, -0.0011478662490844727, -0.0011129975318908691, -0.0010781288146972656, -0.0010432600975036621, -0.0010083913803100586, -0.0009735226631164551, -0.0009386539459228516, -0.000903785228729248, -0.0008689165115356445, -0.000834047794342041, -0.0007991790771484375, -0.000764310359954834, -0.0007294416427612305, -0.000694572925567627, -0.0006597042083740234, -0.0006248354911804199, -0.0005899667739868164, -0.0005550980567932129, -0.0005202293395996094, -0.00048536062240600586, -0.00045049190521240234, -0.00041562318801879883, -0.0003807544708251953, -0.0003458857536315918, -0.0003110170364379883, -0.00027614831924438477, -0.00024127960205078125, -0.00020641088485717773, -0.00017154216766357422, -0.0001366734504699707, -0.00010180473327636719, -6.693601608276367e-05, -3.2067298889160156e-05, 2.8014183044433594e-06, 3.7670135498046875e-05, 7.253885269165039e-05, 0.0001074075698852539, 0.00014227628707885742, 0.00017714500427246094, 0.00021201372146606445, 0.00024688243865966797, 0.0002817511558532715, 0.000316619873046875, 0.0003514885902404785, 0.00038635730743408203, 0.00042122602462768555, 0.00045609474182128906, 0.0004909634590148926, 0.0005258321762084961, 0.0005607008934020996, 0.0005955696105957031, 0.0006304383277893066, 0.0006653070449829102, 0.0007001757621765137, 0.0007350444793701172, 0.0007699131965637207, 0.0008047819137573242, 0.0008396506309509277, 0.0008745193481445312]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 7.0, 7.0, 12.0, 22.0, 32.0, 44.0, 73.0, 151.0, 304.0, 686.0, 2432.0, 14658.0, 786152.0, 233606.0, 7813.0, 1576.0, 505.0, 203.0, 102.0, 50.0, 30.0, 20.0, 7.0, 12.0, 9.0, 3.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.953125, -7.619873046875, -7.28662109375, -6.953369140625, -6.6201171875, -6.286865234375, -5.95361328125, -5.620361328125, -5.287109375, -4.953857421875, -4.62060546875, -4.287353515625, -3.9541015625, -3.620849609375, -3.28759765625, -2.954345703125, -2.62109375, -2.287841796875, -1.95458984375, -1.621337890625, -1.2880859375, -0.954833984375, -0.62158203125, -0.288330078125, 0.044921875, 0.378173828125, 0.71142578125, 1.044677734375, 1.3779296875, 1.711181640625, 2.04443359375, 2.377685546875, 2.7109375, 3.044189453125, 3.37744140625, 3.710693359375, 4.0439453125, 4.377197265625, 4.71044921875, 5.043701171875, 5.376953125, 5.710205078125, 6.04345703125, 6.376708984375, 6.7099609375, 7.043212890625, 7.37646484375, 7.709716796875, 8.04296875, 8.376220703125, 8.70947265625, 9.042724609375, 9.3759765625, 9.709228515625, 10.04248046875, 10.375732421875, 10.708984375, 11.042236328125, 11.37548828125, 11.708740234375, 12.0419921875, 12.375244140625, 12.70849609375, 13.041748046875, 13.375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 7.0, 6.0, 12.0, 27.0, 55.0, 108.0, 236.0, 269.0, 136.0, 45.0, 34.0, 14.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.125, -5.003265380859375, -4.88153076171875, -4.759796142578125, -4.6380615234375, -4.516326904296875, -4.39459228515625, -4.272857666015625, -4.151123046875, -4.029388427734375, -3.90765380859375, -3.785919189453125, -3.6641845703125, -3.542449951171875, -3.42071533203125, -3.298980712890625, -3.17724609375, -3.055511474609375, -2.93377685546875, -2.812042236328125, -2.6903076171875, -2.568572998046875, -2.44683837890625, -2.325103759765625, -2.203369140625, -2.081634521484375, -1.95989990234375, -1.838165283203125, -1.7164306640625, -1.594696044921875, -1.47296142578125, -1.351226806640625, -1.2294921875, -1.107757568359375, -0.98602294921875, -0.864288330078125, -0.7425537109375, -0.620819091796875, -0.49908447265625, -0.377349853515625, -0.255615234375, -0.133880615234375, -0.01214599609375, 0.109588623046875, 0.2313232421875, 0.353057861328125, 0.47479248046875, 0.596527099609375, 0.71826171875, 0.839996337890625, 0.96173095703125, 1.083465576171875, 1.2052001953125, 1.326934814453125, 1.44866943359375, 1.570404052734375, 1.692138671875, 1.813873291015625, 1.93560791015625, 2.057342529296875, 2.1790771484375, 2.300811767578125, 2.42254638671875, 2.544281005859375, 2.666015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 62.0, 859.0, 94.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.55731773376465, -14.806574821472168, -5.0558319091796875, 4.694910049438477, 14.445653915405273, 24.19639778137207, 33.94713592529297, 43.69788360595703, 53.44862365722656, 63.19936752319336, 72.95011138916016, 82.70085144042969, 92.45159912109375, 102.20233917236328, 111.95307922363281, 121.70382690429688, 131.45457458496094, 141.205322265625, 150.9560546875, 160.70680236816406, 170.45755004882812, 180.20828247070312, 189.9590301513672, 199.70977783203125, 209.46051025390625, 219.2112579345703, 228.9619903564453, 238.71273803710938, 248.46348571777344, 258.2142333984375, 267.9649658203125, 277.7156982421875, 287.4664611816406, 297.2171936035156, 306.96795654296875, 316.71868896484375, 326.46942138671875, 336.2201843261719, 345.9709167480469, 355.7216796875, 365.472412109375, 375.22314453125, 384.9739074707031, 394.7246398925781, 404.4753723144531, 414.22613525390625, 423.97686767578125, 433.72760009765625, 443.47833251953125, 453.22906494140625, 462.9798278808594, 472.7305603027344, 482.4812927246094, 492.2320556640625, 501.9827880859375, 511.7335205078125, 521.4843139648438, 531.2350463867188, 540.9857788085938, 550.736572265625, 560.4873046875, 570.238037109375, 579.98876953125, 589.739501953125, 599.490234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 6.0, 5.0, 7.0, 10.0, 10.0, 19.0, 24.0, 23.0, 27.0, 25.0, 26.0, 43.0, 31.0, 31.0, 43.0, 46.0, 42.0, 40.0, 46.0, 42.0, 43.0, 41.0, 30.0, 34.0, 37.0, 48.0, 23.0, 33.0, 22.0, 17.0, 28.0, 15.0, 12.0, 7.0, 16.0, 6.0, 9.0, 8.0, 4.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.720640182495117, -23.956268310546875, -23.191896438598633, -22.427526473999023, -21.66315460205078, -20.89878273010254, -20.134410858154297, -19.370040893554688, -18.605669021606445, -17.841297149658203, -17.07692527770996, -16.31255531311035, -15.54818344116211, -14.783811569213867, -14.019439697265625, -13.2550687789917, -12.490696907043457, -11.726325035095215, -10.961954116821289, -10.197582244873047, -9.433211326599121, -8.668839454650879, -7.904468059539795, -7.140096664428711, -6.375725269317627, -5.611353874206543, -4.846982479095459, -4.082611083984375, -3.318239450454712, -2.553868055343628, -1.7894964218139648, -1.0251250267028809, -0.2607536315917969, 0.5036178231239319, 1.2679892778396606, 2.032360792160034, 2.796732187271118, 3.561103582382202, 4.325475215911865, 5.089846611022949, 5.854218006134033, 6.618589401245117, 7.382960796356201, 8.147332191467285, 8.911704063415527, 9.676074981689453, 10.440446853637695, 11.204818725585938, 11.969189643859863, 12.733561515808105, 13.497932434082031, 14.262304306030273, 15.0266752243042, 15.791047096252441, 16.555418014526367, 17.31978988647461, 18.08416175842285, 18.848533630371094, 19.612905502319336, 20.377275466918945, 21.141647338867188, 21.90601921081543, 22.670391082763672, 23.43476104736328, 24.199132919311523]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 14.0, 32.0, 22.0, 31.0, 58.0, 67.0, 141.0, 209.0, 650.0, 2983.0, 28799.0, 512050.0, 2978019.0, 630390.0, 33117.0, 4359.0, 1798.0, 912.0, 286.0, 97.0, 67.0, 54.0, 31.0, 22.0, 11.0, 10.0, 15.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.822021484375, -18.11279296875, -17.403564453125, -16.6943359375, -15.985107421875, -15.27587890625, -14.566650390625, -13.857421875, -13.148193359375, -12.43896484375, -11.729736328125, -11.0205078125, -10.311279296875, -9.60205078125, -8.892822265625, -8.18359375, -7.474365234375, -6.76513671875, -6.055908203125, -5.3466796875, -4.637451171875, -3.92822265625, -3.218994140625, -2.509765625, -1.800537109375, -1.09130859375, -0.382080078125, 0.3271484375, 1.036376953125, 1.74560546875, 2.454833984375, 3.1640625, 3.873291015625, 4.58251953125, 5.291748046875, 6.0009765625, 6.710205078125, 7.41943359375, 8.128662109375, 8.837890625, 9.547119140625, 10.25634765625, 10.965576171875, 11.6748046875, 12.384033203125, 13.09326171875, 13.802490234375, 14.51171875, 15.220947265625, 15.93017578125, 16.639404296875, 17.3486328125, 18.057861328125, 18.76708984375, 19.476318359375, 20.185546875, 20.894775390625, 21.60400390625, 22.313232421875, 23.0224609375, 23.731689453125, 24.44091796875, 25.150146484375, 25.859375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 9.0, 30.0, 29.0, 56.0, 72.0, 82.0, 100.0, 99.0, 108.0, 90.0, 73.0, 83.0, 53.0, 37.0, 30.0, 13.0, 11.0, 8.0, 4.0, 9.0, 1.0, 2.0, 0.0, 2.0], "bins": [-32.84375, -32.1622314453125, -31.480712890625, -30.7991943359375, -30.11767578125, -29.4361572265625, -28.754638671875, -28.0731201171875, -27.3916015625, -26.7100830078125, -26.028564453125, -25.3470458984375, -24.66552734375, -23.9840087890625, -23.302490234375, -22.6209716796875, -21.939453125, -21.2579345703125, -20.576416015625, -19.8948974609375, -19.21337890625, -18.5318603515625, -17.850341796875, -17.1688232421875, -16.4873046875, -15.8057861328125, -15.124267578125, -14.4427490234375, -13.76123046875, -13.0797119140625, -12.398193359375, -11.7166748046875, -11.03515625, -10.3536376953125, -9.672119140625, -8.9906005859375, -8.30908203125, -7.6275634765625, -6.946044921875, -6.2645263671875, -5.5830078125, -4.9014892578125, -4.219970703125, -3.5384521484375, -2.85693359375, -2.1754150390625, -1.493896484375, -0.8123779296875, -0.130859375, 0.5506591796875, 1.232177734375, 1.9136962890625, 2.59521484375, 3.2767333984375, 3.958251953125, 4.6397705078125, 5.3212890625, 6.0028076171875, 6.684326171875, 7.3658447265625, 8.04736328125, 8.7288818359375, 9.410400390625, 10.0919189453125, 10.7734375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 6.0, 21.0, 44.0, 130.0, 284.0, 998.0, 31140.0, 4150958.0, 9556.0, 725.0, 232.0, 73.0, 34.0, 13.0, 19.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.875, -75.611328125, -73.34765625, -71.083984375, -68.8203125, -66.556640625, -64.29296875, -62.029296875, -59.765625, -57.501953125, -55.23828125, -52.974609375, -50.7109375, -48.447265625, -46.18359375, -43.919921875, -41.65625, -39.392578125, -37.12890625, -34.865234375, -32.6015625, -30.337890625, -28.07421875, -25.810546875, -23.546875, -21.283203125, -19.01953125, -16.755859375, -14.4921875, -12.228515625, -9.96484375, -7.701171875, -5.4375, -3.173828125, -0.91015625, 1.353515625, 3.6171875, 5.880859375, 8.14453125, 10.408203125, 12.671875, 14.935546875, 17.19921875, 19.462890625, 21.7265625, 23.990234375, 26.25390625, 28.517578125, 30.78125, 33.044921875, 35.30859375, 37.572265625, 39.8359375, 42.099609375, 44.36328125, 46.626953125, 48.890625, 51.154296875, 53.41796875, 55.681640625, 57.9453125, 60.208984375, 62.47265625, 64.736328125, 67.0]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 9.0, 12.0, 26.0, 38.0, 50.0, 111.0, 191.0, 383.0, 604.0, 879.0, 760.0, 466.0, 235.0, 131.0, 84.0, 38.0, 18.0, 21.0, 13.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9609375, -8.70269775390625, -8.4444580078125, -8.18621826171875, -7.927978515625, -7.66973876953125, -7.4114990234375, -7.15325927734375, -6.89501953125, -6.63677978515625, -6.3785400390625, -6.12030029296875, -5.862060546875, -5.60382080078125, -5.3455810546875, -5.08734130859375, -4.8291015625, -4.57086181640625, -4.3126220703125, -4.05438232421875, -3.796142578125, -3.53790283203125, -3.2796630859375, -3.02142333984375, -2.76318359375, -2.50494384765625, -2.2467041015625, -1.98846435546875, -1.730224609375, -1.47198486328125, -1.2137451171875, -0.95550537109375, -0.697265625, -0.43902587890625, -0.1807861328125, 0.07745361328125, 0.335693359375, 0.59393310546875, 0.8521728515625, 1.11041259765625, 1.36865234375, 1.62689208984375, 1.8851318359375, 2.14337158203125, 2.401611328125, 2.65985107421875, 2.9180908203125, 3.17633056640625, 3.4345703125, 3.69281005859375, 3.9510498046875, 4.20928955078125, 4.467529296875, 4.72576904296875, 4.9840087890625, 5.24224853515625, 5.50048828125, 5.75872802734375, 6.0169677734375, 6.27520751953125, 6.533447265625, 6.79168701171875, 7.0499267578125, 7.30816650390625, 7.56640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 2.0, 9.0, 12.0, 10.0, 20.0, 32.0, 50.0, 46.0, 65.0, 77.0, 95.0, 107.0, 82.0, 81.0, 58.0, 66.0, 58.0, 48.0, 19.0, 21.0, 7.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203615188598633, -18.679447174072266, -18.15528106689453, -17.631113052368164, -17.10694694519043, -16.582778930664062, -16.058612823486328, -15.534444808959961, -15.01027774810791, -14.48611068725586, -13.961943626403809, -13.437776565551758, -12.91360855102539, -12.389442443847656, -11.865274429321289, -11.341107368469238, -10.816940307617188, -10.292773246765137, -9.768606185913086, -9.244439125061035, -8.720272064208984, -8.196104049682617, -7.671936988830566, -7.147769927978516, -6.623602867126465, -6.099435806274414, -5.575268745422363, -5.051101207733154, -4.5269341468811035, -4.002767086029053, -3.478599786758423, -2.954432487487793, -2.430265426635742, -1.9060982465744019, -1.3819310665130615, -0.8577638864517212, -0.33359670639038086, 0.19057035446166992, 0.7147376537322998, 1.2389049530029297, 1.7630720138549805, 2.2872390747070312, 2.811406373977661, 3.335573673248291, 3.859740734100342, 4.383907794952393, 4.908075332641602, 5.432242393493652, 5.956409454345703, 6.480576515197754, 7.004743576049805, 7.528911113739014, 8.053077697753906, 8.577245712280273, 9.101412773132324, 9.625579833984375, 10.149746894836426, 10.673913955688477, 11.198081016540527, 11.722248077392578, 12.246416091918945, 12.77058219909668, 13.294750213623047, 13.818917274475098, 14.343084335327148]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 14.0, 22.0, 14.0, 16.0, 21.0, 26.0, 49.0, 46.0, 48.0, 59.0, 49.0, 77.0, 46.0, 55.0, 66.0, 52.0, 47.0, 54.0, 48.0, 37.0, 33.0, 27.0, 23.0, 18.0, 22.0, 8.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-19.606321334838867, -19.1185302734375, -18.6307373046875, -18.142946243286133, -17.655155181884766, -17.167362213134766, -16.6795711517334, -16.19178009033203, -15.703987121582031, -15.216195106506348, -14.72840404510498, -14.240612030029297, -13.752820014953613, -13.26502799987793, -12.777236938476562, -12.289444923400879, -11.801653861999512, -11.313861846923828, -10.826070785522461, -10.338278770446777, -9.850486755371094, -9.362695693969727, -8.874903678894043, -8.38711166381836, -7.899320125579834, -7.411528587341309, -6.923736572265625, -6.4359450340271, -5.948153495788574, -5.460361480712891, -4.972569942474365, -4.48477840423584, -3.99698543548584, -3.5091936588287354, -3.021401882171631, -2.5336103439331055, -2.045818567276001, -1.5580267906188965, -1.070235252380371, -0.5824434757232666, -0.09465169906616211, 0.3931400179862976, 0.8809317350387573, 1.3687233924865723, 1.8565151691436768, 2.3443069458007812, 2.8320984840393066, 3.319890260696411, 3.8076820373535156, 4.295473575592041, 4.783265590667725, 5.27105712890625, 5.758849143981934, 6.246640682220459, 6.734432220458984, 7.222224235534668, 7.710015773773193, 8.197807312011719, 8.685599327087402, 9.173391342163086, 9.661182403564453, 10.148974418640137, 10.63676643371582, 11.124557495117188, 11.612349510192871]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 7.0, 7.0, 11.0, 15.0, 30.0, 38.0, 58.0, 113.0, 170.0, 413.0, 880.0, 2857.0, 12621.0, 88899.0, 651721.0, 255127.0, 27848.0, 5173.0, 1472.0, 508.0, 221.0, 127.0, 67.0, 58.0, 30.0, 18.0, 20.0, 10.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.07135009765625, -4.8575439453125, -4.64373779296875, -4.429931640625, -4.21612548828125, -4.0023193359375, -3.78851318359375, -3.57470703125, -3.36090087890625, -3.1470947265625, -2.93328857421875, -2.719482421875, -2.50567626953125, -2.2918701171875, -2.07806396484375, -1.8642578125, -1.65045166015625, -1.4366455078125, -1.22283935546875, -1.009033203125, -0.79522705078125, -0.5814208984375, -0.36761474609375, -0.15380859375, 0.05999755859375, 0.2738037109375, 0.48760986328125, 0.701416015625, 0.91522216796875, 1.1290283203125, 1.34283447265625, 1.556640625, 1.77044677734375, 1.9842529296875, 2.19805908203125, 2.411865234375, 2.62567138671875, 2.8394775390625, 3.05328369140625, 3.26708984375, 3.48089599609375, 3.6947021484375, 3.90850830078125, 4.122314453125, 4.33612060546875, 4.5499267578125, 4.76373291015625, 4.9775390625, 5.19134521484375, 5.4051513671875, 5.61895751953125, 5.832763671875, 6.04656982421875, 6.2603759765625, 6.47418212890625, 6.68798828125, 6.90179443359375, 7.1156005859375, 7.32940673828125, 7.543212890625, 7.75701904296875, 7.9708251953125, 8.18463134765625, 8.3984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 18.0, 24.0, 27.0, 45.0, 64.0, 76.0, 78.0, 65.0, 81.0, 88.0, 90.0, 82.0, 52.0, 61.0, 44.0, 30.0, 34.0, 17.0, 6.0, 6.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.6875, -18.2628173828125, -17.838134765625, -17.4134521484375, -16.98876953125, -16.5640869140625, -16.139404296875, -15.7147216796875, -15.2900390625, -14.8653564453125, -14.440673828125, -14.0159912109375, -13.59130859375, -13.1666259765625, -12.741943359375, -12.3172607421875, -11.892578125, -11.4678955078125, -11.043212890625, -10.6185302734375, -10.19384765625, -9.7691650390625, -9.344482421875, -8.9197998046875, -8.4951171875, -8.0704345703125, -7.645751953125, -7.2210693359375, -6.79638671875, -6.3717041015625, -5.947021484375, -5.5223388671875, -5.09765625, -4.6729736328125, -4.248291015625, -3.8236083984375, -3.39892578125, -2.9742431640625, -2.549560546875, -2.1248779296875, -1.7001953125, -1.2755126953125, -0.850830078125, -0.4261474609375, -0.00146484375, 0.4232177734375, 0.847900390625, 1.2725830078125, 1.697265625, 2.1219482421875, 2.546630859375, 2.9713134765625, 3.39599609375, 3.8206787109375, 4.245361328125, 4.6700439453125, 5.0947265625, 5.5194091796875, 5.944091796875, 6.3687744140625, 6.79345703125, 7.2181396484375, 7.642822265625, 8.0675048828125, 8.4921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 13.0, 11.0, 18.0, 18.0, 32.0, 51.0, 80.0, 99.0, 184.0, 281.0, 439.0, 715.0, 1215.0, 2051.0, 3743.0, 6494.0, 11979.0, 22419.0, 44648.0, 90650.0, 173323.0, 247738.0, 207010.0, 115727.0, 57096.0, 28476.0, 14915.0, 8198.0, 4486.0, 2545.0, 1478.0, 904.0, 550.0, 326.0, 198.0, 140.0, 89.0, 70.0, 46.0, 19.0, 23.0, 11.0, 14.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.357421875, -1.3083648681640625, -1.259307861328125, -1.2102508544921875, -1.16119384765625, -1.1121368408203125, -1.063079833984375, -1.0140228271484375, -0.9649658203125, -0.9159088134765625, -0.866851806640625, -0.8177947998046875, -0.76873779296875, -0.7196807861328125, -0.670623779296875, -0.6215667724609375, -0.572509765625, -0.5234527587890625, -0.474395751953125, -0.4253387451171875, -0.37628173828125, -0.3272247314453125, -0.278167724609375, -0.2291107177734375, -0.1800537109375, -0.1309967041015625, -0.081939697265625, -0.0328826904296875, 0.01617431640625, 0.0652313232421875, 0.114288330078125, 0.1633453369140625, 0.21240234375, 0.2614593505859375, 0.310516357421875, 0.3595733642578125, 0.40863037109375, 0.4576873779296875, 0.506744384765625, 0.5558013916015625, 0.6048583984375, 0.6539154052734375, 0.702972412109375, 0.7520294189453125, 0.80108642578125, 0.8501434326171875, 0.899200439453125, 0.9482574462890625, 0.997314453125, 1.0463714599609375, 1.095428466796875, 1.1444854736328125, 1.19354248046875, 1.2425994873046875, 1.291656494140625, 1.3407135009765625, 1.3897705078125, 1.4388275146484375, 1.487884521484375, 1.5369415283203125, 1.58599853515625, 1.6350555419921875, 1.684112548828125, 1.7331695556640625, 1.7822265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 8.0, 9.0, 14.0, 23.0, 25.0, 16.0, 33.0, 27.0, 36.0, 34.0, 30.0, 52.0, 40.0, 56.0, 54.0, 46.0, 45.0, 50.0, 49.0, 47.0, 40.0, 37.0, 37.0, 26.0, 18.0, 28.0, 26.0, 14.0, 16.0, 11.0, 8.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.5859375, -13.143798828125, -12.70166015625, -12.259521484375, -11.8173828125, -11.375244140625, -10.93310546875, -10.490966796875, -10.048828125, -9.606689453125, -9.16455078125, -8.722412109375, -8.2802734375, -7.838134765625, -7.39599609375, -6.953857421875, -6.51171875, -6.069580078125, -5.62744140625, -5.185302734375, -4.7431640625, -4.301025390625, -3.85888671875, -3.416748046875, -2.974609375, -2.532470703125, -2.09033203125, -1.648193359375, -1.2060546875, -0.763916015625, -0.32177734375, 0.120361328125, 0.5625, 1.004638671875, 1.44677734375, 1.888916015625, 2.3310546875, 2.773193359375, 3.21533203125, 3.657470703125, 4.099609375, 4.541748046875, 4.98388671875, 5.426025390625, 5.8681640625, 6.310302734375, 6.75244140625, 7.194580078125, 7.63671875, 8.078857421875, 8.52099609375, 8.963134765625, 9.4052734375, 9.847412109375, 10.28955078125, 10.731689453125, 11.173828125, 11.615966796875, 12.05810546875, 12.500244140625, 12.9423828125, 13.384521484375, 13.82666015625, 14.268798828125, 14.7109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 8.0, 14.0, 16.0, 27.0, 32.0, 63.0, 72.0, 143.0, 208.0, 365.0, 812.0, 1850.0, 4932.0, 14480.0, 64000.0, 584534.0, 323411.0, 37018.0, 10194.0, 3472.0, 1401.0, 666.0, 304.0, 197.0, 112.0, 63.0, 42.0, 23.0, 24.0, 17.0, 17.0, 11.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.388671875, -1.3463897705078125, -1.304107666015625, -1.2618255615234375, -1.21954345703125, -1.1772613525390625, -1.134979248046875, -1.0926971435546875, -1.0504150390625, -1.0081329345703125, -0.965850830078125, -0.9235687255859375, -0.88128662109375, -0.8390045166015625, -0.796722412109375, -0.7544403076171875, -0.712158203125, -0.6698760986328125, -0.627593994140625, -0.5853118896484375, -0.54302978515625, -0.5007476806640625, -0.458465576171875, -0.4161834716796875, -0.3739013671875, -0.3316192626953125, -0.289337158203125, -0.2470550537109375, -0.20477294921875, -0.1624908447265625, -0.120208740234375, -0.0779266357421875, -0.03564453125, 0.0066375732421875, 0.048919677734375, 0.0912017822265625, 0.13348388671875, 0.1757659912109375, 0.218048095703125, 0.2603302001953125, 0.3026123046875, 0.3448944091796875, 0.387176513671875, 0.4294586181640625, 0.47174072265625, 0.5140228271484375, 0.556304931640625, 0.5985870361328125, 0.640869140625, 0.6831512451171875, 0.725433349609375, 0.7677154541015625, 0.80999755859375, 0.8522796630859375, 0.894561767578125, 0.9368438720703125, 0.9791259765625, 1.0214080810546875, 1.063690185546875, 1.1059722900390625, 1.14825439453125, 1.1905364990234375, 1.232818603515625, 1.2751007080078125, 1.3173828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 11.0, 14.0, 22.0, 29.0, 60.0, 100.0, 171.0, 201.0, 152.0, 100.0, 42.0, 28.0, 15.0, 11.0, 4.0, 11.0, 3.0, 1.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0009145736694335938, -0.0008912906050682068, -0.0008680075407028198, -0.0008447244763374329, -0.0008214414119720459, -0.0007981583476066589, -0.000774875283241272, -0.000751592218875885, -0.000728309154510498, -0.0007050260901451111, -0.0006817430257797241, -0.0006584599614143372, -0.0006351768970489502, -0.0006118938326835632, -0.0005886107683181763, -0.0005653277039527893, -0.0005420446395874023, -0.0005187615752220154, -0.0004954785108566284, -0.00047219544649124146, -0.0004489123821258545, -0.00042562931776046753, -0.00040234625339508057, -0.0003790631890296936, -0.00035578012466430664, -0.0003324970602989197, -0.0003092139959335327, -0.00028593093156814575, -0.0002626478672027588, -0.00023936480283737183, -0.00021608173847198486, -0.0001927986741065979, -0.00016951560974121094, -0.00014623254537582397, -0.000122949481010437, -9.966641664505005e-05, -7.638335227966309e-05, -5.310028791427612e-05, -2.981722354888916e-05, -6.534159183502197e-06, 1.6748905181884766e-05, 4.003196954727173e-05, 6.331503391265869e-05, 8.659809827804565e-05, 0.00010988116264343262, 0.00013316422700881958, 0.00015644729137420654, 0.0001797303557395935, 0.00020301342010498047, 0.00022629648447036743, 0.0002495795488357544, 0.00027286261320114136, 0.0002961456775665283, 0.0003194287419319153, 0.00034271180629730225, 0.0003659948706626892, 0.00038927793502807617, 0.00041256099939346313, 0.0004358440637588501, 0.00045912712812423706, 0.000482410192489624, 0.000505693256855011, 0.000528976321220398, 0.0005522593855857849, 0.0005755424499511719]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 5.0, 13.0, 9.0, 18.0, 29.0, 47.0, 80.0, 130.0, 239.0, 591.0, 1632.0, 4903.0, 17442.0, 123945.0, 776516.0, 100038.0, 15800.0, 4555.0, 1444.0, 573.0, 244.0, 103.0, 62.0, 48.0, 21.0, 19.0, 8.0, 8.0, 10.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-1.943359375, -1.8900604248046875, -1.836761474609375, -1.7834625244140625, -1.73016357421875, -1.6768646240234375, -1.623565673828125, -1.5702667236328125, -1.5169677734375, -1.4636688232421875, -1.410369873046875, -1.3570709228515625, -1.30377197265625, -1.2504730224609375, -1.197174072265625, -1.1438751220703125, -1.090576171875, -1.0372772216796875, -0.983978271484375, -0.9306793212890625, -0.87738037109375, -0.8240814208984375, -0.770782470703125, -0.7174835205078125, -0.6641845703125, -0.6108856201171875, -0.557586669921875, -0.5042877197265625, -0.45098876953125, -0.3976898193359375, -0.344390869140625, -0.2910919189453125, -0.23779296875, -0.1844940185546875, -0.131195068359375, -0.0778961181640625, -0.02459716796875, 0.0287017822265625, 0.082000732421875, 0.1352996826171875, 0.1885986328125, 0.2418975830078125, 0.295196533203125, 0.3484954833984375, 0.40179443359375, 0.4550933837890625, 0.508392333984375, 0.5616912841796875, 0.614990234375, 0.6682891845703125, 0.721588134765625, 0.7748870849609375, 0.82818603515625, 0.8814849853515625, 0.934783935546875, 0.9880828857421875, 1.0413818359375, 1.0946807861328125, 1.147979736328125, 1.2012786865234375, 1.25457763671875, 1.3078765869140625, 1.361175537109375, 1.4144744873046875, 1.4677734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 14.0, 8.0, 13.0, 23.0, 28.0, 61.0, 99.0, 138.0, 172.0, 145.0, 104.0, 76.0, 24.0, 23.0, 12.0, 15.0, 4.0, 9.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888671875, -0.57183837890625, -0.5548095703125, -0.53778076171875, -0.520751953125, -0.50372314453125, -0.4866943359375, -0.46966552734375, -0.45263671875, -0.43560791015625, -0.4185791015625, -0.40155029296875, -0.384521484375, -0.36749267578125, -0.3504638671875, -0.33343505859375, -0.31640625, -0.29937744140625, -0.2823486328125, -0.26531982421875, -0.248291015625, -0.23126220703125, -0.2142333984375, -0.19720458984375, -0.18017578125, -0.16314697265625, -0.1461181640625, -0.12908935546875, -0.112060546875, -0.09503173828125, -0.0780029296875, -0.06097412109375, -0.0439453125, -0.02691650390625, -0.0098876953125, 0.00714111328125, 0.024169921875, 0.04119873046875, 0.0582275390625, 0.07525634765625, 0.09228515625, 0.10931396484375, 0.1263427734375, 0.14337158203125, 0.160400390625, 0.17742919921875, 0.1944580078125, 0.21148681640625, 0.228515625, 0.24554443359375, 0.2625732421875, 0.27960205078125, 0.296630859375, 0.31365966796875, 0.3306884765625, 0.34771728515625, 0.36474609375, 0.38177490234375, 0.3988037109375, 0.41583251953125, 0.432861328125, 0.44989013671875, 0.4669189453125, 0.48394775390625, 0.5009765625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 9.0, 19.0, 40.0, 92.0, 119.0, 169.0, 180.0, 142.0, 96.0, 68.0, 31.0, 11.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.498085021972656, -24.91822052001953, -24.33835792541504, -23.758493423461914, -23.17862892150879, -22.598764419555664, -22.018901824951172, -21.439037322998047, -20.859172821044922, -20.279308319091797, -19.699445724487305, -19.11958122253418, -18.539716720581055, -17.95985221862793, -17.379989624023438, -16.800125122070312, -16.220260620117188, -15.640397071838379, -15.060532569885254, -14.480669021606445, -13.90080451965332, -13.320940971374512, -12.741077423095703, -12.161212921142578, -11.581350326538086, -11.001486778259277, -10.421622276306152, -9.841758728027344, -9.261894226074219, -8.68203067779541, -8.102167129516602, -7.522302627563477, -6.942438125610352, -6.362574100494385, -5.782710075378418, -5.202846527099609, -4.622982025146484, -4.043118476867676, -3.463254451751709, -2.883390426635742, -2.3035264015197754, -1.7236623764038086, -1.1437984704971313, -0.5639345645904541, 0.015929460525512695, 0.5957934856414795, 1.1756572723388672, 1.755521297454834, 2.335385322570801, 2.9152493476867676, 3.4951133728027344, 4.074976921081543, 4.654841423034668, 5.234704971313477, 5.814568996429443, 6.39443302154541, 6.974297046661377, 7.554161071777344, 8.134024620056152, 8.713889122009277, 9.293752670288086, 9.873617172241211, 10.45348072052002, 11.033344268798828, 11.613208770751953]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 12.0, 15.0, 23.0, 31.0, 36.0, 44.0, 64.0, 51.0, 64.0, 77.0, 81.0, 56.0, 86.0, 66.0, 53.0, 57.0, 46.0, 36.0, 35.0, 23.0, 14.0, 8.0, 9.0, 8.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.612642288208008, -15.240781784057617, -14.86892032623291, -14.49705982208252, -14.125199317932129, -13.753338813781738, -13.381477355957031, -13.00961685180664, -12.63775634765625, -12.26589584350586, -11.894034385681152, -11.522173881530762, -11.150313377380371, -10.77845287322998, -10.406591415405273, -10.034730911254883, -9.662870407104492, -9.291009902954102, -8.919148445129395, -8.547287940979004, -8.175427436828613, -7.8035664558410645, -7.431705474853516, -7.059844970703125, -6.687983512878418, -6.316122531890869, -5.9442620277404785, -5.57240104675293, -5.200540542602539, -4.82867956161499, -4.456818580627441, -4.084958076477051, -3.71309757232666, -3.3412368297576904, -2.9693760871887207, -2.597515106201172, -2.2256546020507812, -1.853793740272522, -1.4819328784942627, -1.110072135925293, -0.7382113933563232, -0.36635062098503113, 0.005510151386260986, 0.3773709535598755, 0.7492316961288452, 1.121092438697815, 1.4929533004760742, 1.864814043045044, 2.2366747856140137, 2.6085355281829834, 2.980396270751953, 3.352257251739502, 3.7241177558898926, 4.095978736877441, 4.467839241027832, 4.839700222015381, 5.21156120300293, 5.5834221839904785, 5.955282688140869, 6.327143669128418, 6.699004173278809, 7.070865154266357, 7.442726135253906, 7.814586639404297, 8.186447143554688]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 6.0, 4.0, 7.0, 12.0, 12.0, 20.0, 17.0, 38.0, 58.0, 133.0, 280.0, 692.0, 2014.0, 6712.0, 26070.0, 119605.0, 470090.0, 328649.0, 71161.0, 16265.0, 4369.0, 1354.0, 509.0, 218.0, 90.0, 53.0, 35.0, 26.0, 15.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1484375, -7.8841552734375, -7.619873046875, -7.3555908203125, -7.09130859375, -6.8270263671875, -6.562744140625, -6.2984619140625, -6.0341796875, -5.7698974609375, -5.505615234375, -5.2413330078125, -4.97705078125, -4.7127685546875, -4.448486328125, -4.1842041015625, -3.919921875, -3.6556396484375, -3.391357421875, -3.1270751953125, -2.86279296875, -2.5985107421875, -2.334228515625, -2.0699462890625, -1.8056640625, -1.5413818359375, -1.277099609375, -1.0128173828125, -0.74853515625, -0.4842529296875, -0.219970703125, 0.0443115234375, 0.30859375, 0.5728759765625, 0.837158203125, 1.1014404296875, 1.36572265625, 1.6300048828125, 1.894287109375, 2.1585693359375, 2.4228515625, 2.6871337890625, 2.951416015625, 3.2156982421875, 3.47998046875, 3.7442626953125, 4.008544921875, 4.2728271484375, 4.537109375, 4.8013916015625, 5.065673828125, 5.3299560546875, 5.59423828125, 5.8585205078125, 6.122802734375, 6.3870849609375, 6.6513671875, 6.9156494140625, 7.179931640625, 7.4442138671875, 7.70849609375, 7.9727783203125, 8.237060546875, 8.5013427734375, 8.765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 11.0, 19.0, 25.0, 43.0, 58.0, 66.0, 63.0, 83.0, 75.0, 98.0, 90.0, 71.0, 72.0, 64.0, 48.0, 34.0, 24.0, 22.0, 12.0, 7.0, 9.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.95654296875, -34.1318359375, -33.30712890625, -32.482421875, -31.65771484375, -30.8330078125, -30.00830078125, -29.18359375, -28.35888671875, -27.5341796875, -26.70947265625, -25.884765625, -25.06005859375, -24.2353515625, -23.41064453125, -22.5859375, -21.76123046875, -20.9365234375, -20.11181640625, -19.287109375, -18.46240234375, -17.6376953125, -16.81298828125, -15.98828125, -15.16357421875, -14.3388671875, -13.51416015625, -12.689453125, -11.86474609375, -11.0400390625, -10.21533203125, -9.390625, -8.56591796875, -7.7412109375, -6.91650390625, -6.091796875, -5.26708984375, -4.4423828125, -3.61767578125, -2.79296875, -1.96826171875, -1.1435546875, -0.31884765625, 0.505859375, 1.33056640625, 2.1552734375, 2.97998046875, 3.8046875, 4.62939453125, 5.4541015625, 6.27880859375, 7.103515625, 7.92822265625, 8.7529296875, 9.57763671875, 10.40234375, 11.22705078125, 12.0517578125, 12.87646484375, 13.701171875, 14.52587890625, 15.3505859375, 16.17529296875, 17.0]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 6.0, 4.0, 16.0, 12.0, 17.0, 15.0, 20.0, 14.0, 23.0, 18.0, 29.0, 28.0, 34.0, 43.0, 44.0, 58.0, 181.0, 1947.0, 1030757.0, 14563.0, 274.0, 82.0, 56.0, 38.0, 30.0, 32.0, 39.0, 35.0, 18.0, 15.0, 26.0, 24.0, 13.0, 11.0, 11.0, 7.0, 9.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.5625, -46.740234375, -44.91796875, -43.095703125, -41.2734375, -39.451171875, -37.62890625, -35.806640625, -33.984375, -32.162109375, -30.33984375, -28.517578125, -26.6953125, -24.873046875, -23.05078125, -21.228515625, -19.40625, -17.583984375, -15.76171875, -13.939453125, -12.1171875, -10.294921875, -8.47265625, -6.650390625, -4.828125, -3.005859375, -1.18359375, 0.638671875, 2.4609375, 4.283203125, 6.10546875, 7.927734375, 9.75, 11.572265625, 13.39453125, 15.216796875, 17.0390625, 18.861328125, 20.68359375, 22.505859375, 24.328125, 26.150390625, 27.97265625, 29.794921875, 31.6171875, 33.439453125, 35.26171875, 37.083984375, 38.90625, 40.728515625, 42.55078125, 44.373046875, 46.1953125, 48.017578125, 49.83984375, 51.662109375, 53.484375, 55.306640625, 57.12890625, 58.951171875, 60.7734375, 62.595703125, 64.41796875, 66.240234375, 68.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 8.0, 5.0, 6.0, 7.0, 11.0, 14.0, 15.0, 21.0, 20.0, 14.0, 19.0, 22.0, 33.0, 28.0, 33.0, 32.0, 33.0, 34.0, 49.0, 42.0, 50.0, 43.0, 40.0, 37.0, 41.0, 39.0, 37.0, 38.0, 37.0, 29.0, 23.0, 25.0, 25.0, 12.0, 25.0, 13.0, 14.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1796875, -11.740234375, -11.30078125, -10.861328125, -10.421875, -9.982421875, -9.54296875, -9.103515625, -8.6640625, -8.224609375, -7.78515625, -7.345703125, -6.90625, -6.466796875, -6.02734375, -5.587890625, -5.1484375, -4.708984375, -4.26953125, -3.830078125, -3.390625, -2.951171875, -2.51171875, -2.072265625, -1.6328125, -1.193359375, -0.75390625, -0.314453125, 0.125, 0.564453125, 1.00390625, 1.443359375, 1.8828125, 2.322265625, 2.76171875, 3.201171875, 3.640625, 4.080078125, 4.51953125, 4.958984375, 5.3984375, 5.837890625, 6.27734375, 6.716796875, 7.15625, 7.595703125, 8.03515625, 8.474609375, 8.9140625, 9.353515625, 9.79296875, 10.232421875, 10.671875, 11.111328125, 11.55078125, 11.990234375, 12.4296875, 12.869140625, 13.30859375, 13.748046875, 14.1875, 14.626953125, 15.06640625, 15.505859375, 15.9453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 7.0, 11.0, 10.0, 15.0, 35.0, 64.0, 124.0, 253.0, 781.0, 2883.0, 23029.0, 694146.0, 312803.0, 11421.0, 1982.0, 521.0, 214.0, 99.0, 48.0, 33.0, 23.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.8359375, -5.63372802734375, -5.4315185546875, -5.22930908203125, -5.027099609375, -4.82489013671875, -4.6226806640625, -4.42047119140625, -4.21826171875, -4.01605224609375, -3.8138427734375, -3.61163330078125, -3.409423828125, -3.20721435546875, -3.0050048828125, -2.80279541015625, -2.6005859375, -2.39837646484375, -2.1961669921875, -1.99395751953125, -1.791748046875, -1.58953857421875, -1.3873291015625, -1.18511962890625, -0.98291015625, -0.78070068359375, -0.5784912109375, -0.37628173828125, -0.174072265625, 0.02813720703125, 0.2303466796875, 0.43255615234375, 0.634765625, 0.83697509765625, 1.0391845703125, 1.24139404296875, 1.443603515625, 1.64581298828125, 1.8480224609375, 2.05023193359375, 2.25244140625, 2.45465087890625, 2.6568603515625, 2.85906982421875, 3.061279296875, 3.26348876953125, 3.4656982421875, 3.66790771484375, 3.8701171875, 4.07232666015625, 4.2745361328125, 4.47674560546875, 4.678955078125, 4.88116455078125, 5.0833740234375, 5.28558349609375, 5.48779296875, 5.69000244140625, 5.8922119140625, 6.09442138671875, 6.296630859375, 6.49884033203125, 6.7010498046875, 6.90325927734375, 7.10546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 12.0, 6.0, 6.0, 13.0, 14.0, 19.0, 31.0, 41.0, 56.0, 73.0, 94.0, 112.0, 101.0, 93.0, 82.0, 74.0, 58.0, 39.0, 29.0, 19.0, 11.0, 6.0, 2.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0005946159362792969, -0.0005781911313533783, -0.0005617663264274597, -0.0005453415215015411, -0.0005289167165756226, -0.000512491911649704, -0.0004960671067237854, -0.0004796423017978668, -0.00046321749687194824, -0.00044679269194602966, -0.0004303678870201111, -0.0004139430820941925, -0.0003975182771682739, -0.00038109347224235535, -0.00036466866731643677, -0.0003482438623905182, -0.0003318190574645996, -0.00031539425253868103, -0.00029896944761276245, -0.00028254464268684387, -0.0002661198377609253, -0.0002496950328350067, -0.00023327022790908813, -0.00021684542298316956, -0.00020042061805725098, -0.0001839958131313324, -0.00016757100820541382, -0.00015114620327949524, -0.00013472139835357666, -0.00011829659342765808, -0.0001018717885017395, -8.544698357582092e-05, -6.902217864990234e-05, -5.2597373723983765e-05, -3.6172568798065186e-05, -1.9747763872146606e-05, -3.3229589462280273e-06, 1.3101845979690552e-05, 2.952665090560913e-05, 4.595145583152771e-05, 6.237626075744629e-05, 7.880106568336487e-05, 9.522587060928345e-05, 0.00011165067553520203, 0.0001280754804611206, 0.00014450028538703918, 0.00016092509031295776, 0.00017734989523887634, 0.00019377470016479492, 0.0002101995050907135, 0.00022662431001663208, 0.00024304911494255066, 0.00025947391986846924, 0.0002758987247943878, 0.0002923235297203064, 0.000308748334646225, 0.00032517313957214355, 0.00034159794449806213, 0.0003580227494239807, 0.0003744475543498993, 0.00039087235927581787, 0.00040729716420173645, 0.00042372196912765503, 0.0004401467740535736, 0.0004565715789794922]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 8.0, 7.0, 13.0, 12.0, 29.0, 38.0, 96.0, 225.0, 558.0, 1658.0, 6282.0, 44910.0, 584505.0, 376647.0, 26846.0, 4576.0, 1310.0, 460.0, 178.0, 88.0, 41.0, 24.0, 18.0, 10.0, 10.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.2852783203125, -4.136962890625, -3.9886474609375, -3.84033203125, -3.6920166015625, -3.543701171875, -3.3953857421875, -3.2470703125, -3.0987548828125, -2.950439453125, -2.8021240234375, -2.65380859375, -2.5054931640625, -2.357177734375, -2.2088623046875, -2.060546875, -1.9122314453125, -1.763916015625, -1.6156005859375, -1.46728515625, -1.3189697265625, -1.170654296875, -1.0223388671875, -0.8740234375, -0.7257080078125, -0.577392578125, -0.4290771484375, -0.28076171875, -0.1324462890625, 0.015869140625, 0.1641845703125, 0.3125, 0.4608154296875, 0.609130859375, 0.7574462890625, 0.90576171875, 1.0540771484375, 1.202392578125, 1.3507080078125, 1.4990234375, 1.6473388671875, 1.795654296875, 1.9439697265625, 2.09228515625, 2.2406005859375, 2.388916015625, 2.5372314453125, 2.685546875, 2.8338623046875, 2.982177734375, 3.1304931640625, 3.27880859375, 3.4271240234375, 3.575439453125, 3.7237548828125, 3.8720703125, 4.0203857421875, 4.168701171875, 4.3170166015625, 4.46533203125, 4.6136474609375, 4.761962890625, 4.9102783203125, 5.05859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 9.0, 16.0, 18.0, 26.0, 49.0, 63.0, 87.0, 95.0, 123.0, 112.0, 110.0, 98.0, 52.0, 43.0, 36.0, 22.0, 13.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.20703125, -2.1508636474609375, -2.094696044921875, -2.0385284423828125, -1.98236083984375, -1.9261932373046875, -1.870025634765625, -1.8138580322265625, -1.7576904296875, -1.7015228271484375, -1.645355224609375, -1.5891876220703125, -1.53302001953125, -1.4768524169921875, -1.420684814453125, -1.3645172119140625, -1.308349609375, -1.2521820068359375, -1.196014404296875, -1.1398468017578125, -1.08367919921875, -1.0275115966796875, -0.971343994140625, -0.9151763916015625, -0.8590087890625, -0.8028411865234375, -0.746673583984375, -0.6905059814453125, -0.63433837890625, -0.5781707763671875, -0.522003173828125, -0.4658355712890625, -0.40966796875, -0.3535003662109375, -0.297332763671875, -0.2411651611328125, -0.18499755859375, -0.1288299560546875, -0.072662353515625, -0.0164947509765625, 0.0396728515625, 0.0958404541015625, 0.152008056640625, 0.2081756591796875, 0.26434326171875, 0.3205108642578125, 0.376678466796875, 0.4328460693359375, 0.489013671875, 0.5451812744140625, 0.601348876953125, 0.6575164794921875, 0.71368408203125, 0.7698516845703125, 0.826019287109375, 0.8821868896484375, 0.9383544921875, 0.9945220947265625, 1.050689697265625, 1.1068572998046875, 1.16302490234375, 1.2191925048828125, 1.275360107421875, 1.3315277099609375, 1.3876953125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 6.0, 12.0, 25.0, 40.0, 83.0, 111.0, 203.0, 194.0, 132.0, 92.0, 60.0, 32.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.53342819213867, -57.25847244262695, -55.983516693115234, -54.708560943603516, -53.43360900878906, -52.158653259277344, -50.883697509765625, -49.608741760253906, -48.33378601074219, -47.05883026123047, -45.78387451171875, -44.50891876220703, -43.23396301269531, -41.95901107788086, -40.68405532836914, -39.40909957885742, -38.1341438293457, -36.859188079833984, -35.584232330322266, -34.30927658081055, -33.034324645996094, -31.759366989135742, -30.484413146972656, -29.209457397460938, -27.93450164794922, -26.6595458984375, -25.38459014892578, -24.109636306762695, -22.834680557250977, -21.559724807739258, -20.284770965576172, -19.009815216064453, -17.7348575592041, -16.459901809692383, -15.18494701385498, -13.909992218017578, -12.63503646850586, -11.36008071899414, -10.085125923156738, -8.810171127319336, -7.535215377807617, -6.260260105133057, -4.985304832458496, -3.7103495597839355, -2.435394287109375, -1.1604390144348145, 0.1145162582397461, 1.3894710540771484, 2.664426803588867, 3.9393820762634277, 5.214337348937988, 6.489292621612549, 7.764247894287109, 9.039203643798828, 10.31415843963623, 11.589113235473633, 12.864068984985352, 14.13902473449707, 15.413979530334473, 16.688934326171875, 17.963890075683594, 19.238845825195312, 20.51380157470703, 21.788755416870117, 23.063711166381836]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 6.0, 9.0, 16.0, 13.0, 15.0, 27.0, 20.0, 28.0, 31.0, 40.0, 41.0, 40.0, 55.0, 47.0, 53.0, 38.0, 48.0, 51.0, 40.0, 40.0, 38.0, 37.0, 42.0, 37.0, 31.0, 25.0, 21.0, 27.0, 15.0, 14.0, 8.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-26.820026397705078, -26.084226608276367, -25.348426818847656, -24.612628936767578, -23.876829147338867, -23.141029357910156, -22.405229568481445, -21.669429779052734, -20.933631896972656, -20.197832107543945, -19.462032318115234, -18.726234436035156, -17.990434646606445, -17.254634857177734, -16.518835067749023, -15.783035278320312, -15.047235488891602, -14.31143569946289, -13.575636863708496, -12.839837074279785, -12.10403823852539, -11.36823844909668, -10.632438659667969, -9.896638870239258, -9.160840034484863, -8.425040245056152, -7.689241409301758, -6.953441619873047, -6.217642307281494, -5.481842994689941, -4.7460432052612305, -4.010243892669678, -3.274446487426758, -2.538647174835205, -1.8028476238250732, -1.0670480728149414, -0.33124876022338867, 0.40455055236816406, 1.140350341796875, 1.8761496543884277, 2.6119489669799805, 3.347748279571533, 4.083547592163086, 4.819347381591797, 5.55514669418335, 6.290946006774902, 7.026745796203613, 7.762545108795166, 8.498344421386719, 9.23414421081543, 9.969943046569824, 10.705742835998535, 11.44154167175293, 12.17734146118164, 12.913141250610352, 13.648941040039062, 14.384739875793457, 15.120539665222168, 15.856338500976562, 16.592138290405273, 17.327938079833984, 18.063735961914062, 18.799537658691406, 19.535335540771484, 20.271135330200195]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 2.0, 4.0, 9.0, 8.0, 5.0, 9.0, 8.0, 11.0, 17.0, 14.0, 20.0, 31.0, 46.0, 45.0, 78.0, 114.0, 227.0, 541.0, 2048.0, 13292.0, 181562.0, 2169991.0, 1696286.0, 116327.0, 10312.0, 2119.0, 496.0, 196.0, 107.0, 78.0, 60.0, 39.0, 41.0, 31.0, 16.0, 21.0, 16.0, 8.0, 12.0, 10.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-22.484375, -21.801513671875, -21.11865234375, -20.435791015625, -19.7529296875, -19.070068359375, -18.38720703125, -17.704345703125, -17.021484375, -16.338623046875, -15.65576171875, -14.972900390625, -14.2900390625, -13.607177734375, -12.92431640625, -12.241455078125, -11.55859375, -10.875732421875, -10.19287109375, -9.510009765625, -8.8271484375, -8.144287109375, -7.46142578125, -6.778564453125, -6.095703125, -5.412841796875, -4.72998046875, -4.047119140625, -3.3642578125, -2.681396484375, -1.99853515625, -1.315673828125, -0.6328125, 0.050048828125, 0.73291015625, 1.415771484375, 2.0986328125, 2.781494140625, 3.46435546875, 4.147216796875, 4.830078125, 5.512939453125, 6.19580078125, 6.878662109375, 7.5615234375, 8.244384765625, 8.92724609375, 9.610107421875, 10.29296875, 10.975830078125, 11.65869140625, 12.341552734375, 13.0244140625, 13.707275390625, 14.39013671875, 15.072998046875, 15.755859375, 16.438720703125, 17.12158203125, 17.804443359375, 18.4873046875, 19.170166015625, 19.85302734375, 20.535888671875, 21.21875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 15.0, 9.0, 11.0, 27.0, 38.0, 49.0, 48.0, 63.0, 70.0, 82.0, 69.0, 72.0, 87.0, 64.0, 66.0, 40.0, 42.0, 47.0, 37.0, 22.0, 9.0, 8.0, 8.0, 10.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.515625, -20.9932861328125, -20.470947265625, -19.9486083984375, -19.42626953125, -18.9039306640625, -18.381591796875, -17.8592529296875, -17.3369140625, -16.8145751953125, -16.292236328125, -15.7698974609375, -15.24755859375, -14.7252197265625, -14.202880859375, -13.6805419921875, -13.158203125, -12.6358642578125, -12.113525390625, -11.5911865234375, -11.06884765625, -10.5465087890625, -10.024169921875, -9.5018310546875, -8.9794921875, -8.4571533203125, -7.934814453125, -7.4124755859375, -6.89013671875, -6.3677978515625, -5.845458984375, -5.3231201171875, -4.80078125, -4.2784423828125, -3.756103515625, -3.2337646484375, -2.71142578125, -2.1890869140625, -1.666748046875, -1.1444091796875, -0.6220703125, -0.0997314453125, 0.422607421875, 0.9449462890625, 1.46728515625, 1.9896240234375, 2.511962890625, 3.0343017578125, 3.556640625, 4.0789794921875, 4.601318359375, 5.1236572265625, 5.64599609375, 6.1683349609375, 6.690673828125, 7.2130126953125, 7.7353515625, 8.2576904296875, 8.780029296875, 9.3023681640625, 9.82470703125, 10.3470458984375, 10.869384765625, 11.3917236328125, 11.9140625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 3.0, 5.0, 3.0, 12.0, 11.0, 24.0, 33.0, 50.0, 106.0, 285.0, 1252.0, 24214.0, 3990790.0, 174330.0, 2488.0, 399.0, 149.0, 51.0, 36.0, 9.0, 6.0, 5.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.25, -39.85986328125, -38.4697265625, -37.07958984375, -35.689453125, -34.29931640625, -32.9091796875, -31.51904296875, -30.12890625, -28.73876953125, -27.3486328125, -25.95849609375, -24.568359375, -23.17822265625, -21.7880859375, -20.39794921875, -19.0078125, -17.61767578125, -16.2275390625, -14.83740234375, -13.447265625, -12.05712890625, -10.6669921875, -9.27685546875, -7.88671875, -6.49658203125, -5.1064453125, -3.71630859375, -2.326171875, -0.93603515625, 0.4541015625, 1.84423828125, 3.234375, 4.62451171875, 6.0146484375, 7.40478515625, 8.794921875, 10.18505859375, 11.5751953125, 12.96533203125, 14.35546875, 15.74560546875, 17.1357421875, 18.52587890625, 19.916015625, 21.30615234375, 22.6962890625, 24.08642578125, 25.4765625, 26.86669921875, 28.2568359375, 29.64697265625, 31.037109375, 32.42724609375, 33.8173828125, 35.20751953125, 36.59765625, 37.98779296875, 39.3779296875, 40.76806640625, 42.158203125, 43.54833984375, 44.9384765625, 46.32861328125, 47.71875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 11.0, 27.0, 33.0, 41.0, 61.0, 90.0, 140.0, 199.0, 264.0, 418.0, 560.0, 527.0, 441.0, 380.0, 262.0, 187.0, 112.0, 99.0, 54.0, 31.0, 28.0, 33.0, 14.0, 9.0, 12.0, 6.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.74609375, -4.58978271484375, -4.4334716796875, -4.27716064453125, -4.120849609375, -3.96453857421875, -3.8082275390625, -3.65191650390625, -3.49560546875, -3.33929443359375, -3.1829833984375, -3.02667236328125, -2.870361328125, -2.71405029296875, -2.5577392578125, -2.40142822265625, -2.2451171875, -2.08880615234375, -1.9324951171875, -1.77618408203125, -1.619873046875, -1.46356201171875, -1.3072509765625, -1.15093994140625, -0.99462890625, -0.83831787109375, -0.6820068359375, -0.52569580078125, -0.369384765625, -0.21307373046875, -0.0567626953125, 0.09954833984375, 0.255859375, 0.41217041015625, 0.5684814453125, 0.72479248046875, 0.881103515625, 1.03741455078125, 1.1937255859375, 1.35003662109375, 1.50634765625, 1.66265869140625, 1.8189697265625, 1.97528076171875, 2.131591796875, 2.28790283203125, 2.4442138671875, 2.60052490234375, 2.7568359375, 2.91314697265625, 3.0694580078125, 3.22576904296875, 3.382080078125, 3.53839111328125, 3.6947021484375, 3.85101318359375, 4.00732421875, 4.16363525390625, 4.3199462890625, 4.47625732421875, 4.632568359375, 4.78887939453125, 4.9451904296875, 5.10150146484375, 5.2578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 10.0, 22.0, 39.0, 52.0, 75.0, 101.0, 144.0, 140.0, 123.0, 109.0, 66.0, 53.0, 28.0, 19.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.99203872680664, -35.20993423461914, -34.427833557128906, -33.645729064941406, -32.863624572753906, -32.081520080566406, -31.29941749572754, -30.517314910888672, -29.735210418701172, -28.953107833862305, -28.171003341674805, -27.388900756835938, -26.606796264648438, -25.82469367980957, -25.04258918762207, -24.260486602783203, -23.478382110595703, -22.696279525756836, -21.914175033569336, -21.13207244873047, -20.34996795654297, -19.5678653717041, -18.7857608795166, -18.003658294677734, -17.221555709838867, -16.439453125, -15.6573486328125, -14.875245094299316, -14.093141555786133, -13.31103801727295, -12.528934478759766, -11.746831893920898, -10.964727401733398, -10.182623863220215, -9.400520324707031, -8.618416786193848, -7.836313247680664, -7.0542097091674805, -6.272106647491455, -5.4900031089782715, -4.707899570465088, -3.9257960319519043, -3.1436924934387207, -2.361589193344116, -1.5794856548309326, -0.797382116317749, -0.015278816223144531, 0.7668247222900391, 1.5489282608032227, 2.3310317993164062, 3.11313533782959, 3.8952386379241943, 4.677342414855957, 5.459445953369141, 6.241549015045166, 7.02365255355835, 7.805756092071533, 8.587859153747559, 9.369962692260742, 10.152066230773926, 10.93416976928711, 11.716273307800293, 12.498376846313477, 13.28048038482666, 14.062583923339844]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 11.0, 19.0, 26.0, 35.0, 32.0, 30.0, 35.0, 55.0, 62.0, 54.0, 55.0, 65.0, 51.0, 61.0, 69.0, 51.0, 46.0, 42.0, 39.0, 38.0, 22.0, 21.0, 20.0, 18.0, 9.0, 4.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.018476486206055, -18.53684425354004, -18.055212020874023, -17.573579788208008, -17.091947555541992, -16.61031723022461, -16.128684997558594, -15.647052764892578, -15.165420532226562, -14.683788299560547, -14.202156066894531, -13.720524787902832, -13.238892555236816, -12.7572603225708, -12.275628089904785, -11.793996810913086, -11.31236457824707, -10.830732345581055, -10.349100112915039, -9.86746883392334, -9.385836601257324, -8.904204368591309, -8.422572135925293, -7.9409403800964355, -7.459307670593262, -6.977675437927246, -6.496043682098389, -6.014411449432373, -5.532779693603516, -5.0511474609375, -4.569515228271484, -4.087883472442627, -3.6062517166137695, -3.124619722366333, -2.6429877281188965, -2.161355495452881, -1.6797236204147339, -1.1980915069580078, -0.7164595127105713, -0.23482751846313477, 0.24680447578430176, 0.7284364700317383, 1.2100684642791748, 1.6917005777359009, 2.173332691192627, 2.6549646854400635, 3.1365966796875, 3.6182286739349365, 4.099860668182373, 4.581492900848389, 5.063124656677246, 5.544756889343262, 6.026388645172119, 6.508020877838135, 6.989652633666992, 7.471284866333008, 7.952917098999023, 8.434549331665039, 8.916181564331055, 9.397812843322754, 9.87944507598877, 10.361077308654785, 10.8427095413208, 11.3243408203125, 11.805973052978516]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 9.0, 5.0, 14.0, 16.0, 16.0, 39.0, 44.0, 89.0, 129.0, 223.0, 399.0, 889.0, 2758.0, 12524.0, 82638.0, 535628.0, 355896.0, 45840.0, 7847.0, 1950.0, 733.0, 341.0, 219.0, 110.0, 70.0, 37.0, 28.0, 25.0, 10.0, 10.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.50390625, -6.352142333984375, -6.20037841796875, -6.048614501953125, -5.8968505859375, -5.745086669921875, -5.59332275390625, -5.441558837890625, -5.289794921875, -5.138031005859375, -4.98626708984375, -4.834503173828125, -4.6827392578125, -4.530975341796875, -4.37921142578125, -4.227447509765625, -4.07568359375, -3.923919677734375, -3.77215576171875, -3.620391845703125, -3.4686279296875, -3.316864013671875, -3.16510009765625, -3.013336181640625, -2.861572265625, -2.709808349609375, -2.55804443359375, -2.406280517578125, -2.2545166015625, -2.102752685546875, -1.95098876953125, -1.799224853515625, -1.6474609375, -1.495697021484375, -1.34393310546875, -1.192169189453125, -1.0404052734375, -0.888641357421875, -0.73687744140625, -0.585113525390625, -0.433349609375, -0.281585693359375, -0.12982177734375, 0.021942138671875, 0.1737060546875, 0.325469970703125, 0.47723388671875, 0.628997802734375, 0.78076171875, 0.932525634765625, 1.08428955078125, 1.236053466796875, 1.3878173828125, 1.539581298828125, 1.69134521484375, 1.843109130859375, 1.994873046875, 2.146636962890625, 2.29840087890625, 2.450164794921875, 2.6019287109375, 2.753692626953125, 2.90545654296875, 3.057220458984375, 3.208984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 16.0, 19.0, 50.0, 31.0, 39.0, 56.0, 63.0, 64.0, 76.0, 74.0, 81.0, 73.0, 53.0, 70.0, 54.0, 41.0, 33.0, 30.0, 16.0, 15.0, 9.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.3359375, -13.984130859375, -13.63232421875, -13.280517578125, -12.9287109375, -12.576904296875, -12.22509765625, -11.873291015625, -11.521484375, -11.169677734375, -10.81787109375, -10.466064453125, -10.1142578125, -9.762451171875, -9.41064453125, -9.058837890625, -8.70703125, -8.355224609375, -8.00341796875, -7.651611328125, -7.2998046875, -6.947998046875, -6.59619140625, -6.244384765625, -5.892578125, -5.540771484375, -5.18896484375, -4.837158203125, -4.4853515625, -4.133544921875, -3.78173828125, -3.429931640625, -3.078125, -2.726318359375, -2.37451171875, -2.022705078125, -1.6708984375, -1.319091796875, -0.96728515625, -0.615478515625, -0.263671875, 0.088134765625, 0.43994140625, 0.791748046875, 1.1435546875, 1.495361328125, 1.84716796875, 2.198974609375, 2.55078125, 2.902587890625, 3.25439453125, 3.606201171875, 3.9580078125, 4.309814453125, 4.66162109375, 5.013427734375, 5.365234375, 5.717041015625, 6.06884765625, 6.420654296875, 6.7724609375, 7.124267578125, 7.47607421875, 7.827880859375, 8.1796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 16.0, 10.0, 5.0, 14.0, 27.0, 31.0, 33.0, 71.0, 114.0, 165.0, 247.0, 422.0, 626.0, 1054.0, 1784.0, 3265.0, 5703.0, 10669.0, 20275.0, 38659.0, 74011.0, 135272.0, 205117.0, 215372.0, 152951.0, 86383.0, 44851.0, 23200.0, 12451.0, 6741.0, 3686.0, 2092.0, 1176.0, 783.0, 426.0, 292.0, 184.0, 106.0, 81.0, 57.0, 30.0, 30.0, 22.0, 12.0, 15.0, 9.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.134765625, -1.0970916748046875, -1.059417724609375, -1.0217437744140625, -0.98406982421875, -0.9463958740234375, -0.908721923828125, -0.8710479736328125, -0.8333740234375, -0.7957000732421875, -0.758026123046875, -0.7203521728515625, -0.68267822265625, -0.6450042724609375, -0.607330322265625, -0.5696563720703125, -0.531982421875, -0.4943084716796875, -0.456634521484375, -0.4189605712890625, -0.38128662109375, -0.3436126708984375, -0.305938720703125, -0.2682647705078125, -0.2305908203125, -0.1929168701171875, -0.155242919921875, -0.1175689697265625, -0.07989501953125, -0.0422210693359375, -0.004547119140625, 0.0331268310546875, 0.07080078125, 0.1084747314453125, 0.146148681640625, 0.1838226318359375, 0.22149658203125, 0.2591705322265625, 0.296844482421875, 0.3345184326171875, 0.3721923828125, 0.4098663330078125, 0.447540283203125, 0.4852142333984375, 0.52288818359375, 0.5605621337890625, 0.598236083984375, 0.6359100341796875, 0.673583984375, 0.7112579345703125, 0.748931884765625, 0.7866058349609375, 0.82427978515625, 0.8619537353515625, 0.899627685546875, 0.9373016357421875, 0.9749755859375, 1.0126495361328125, 1.050323486328125, 1.0879974365234375, 1.12567138671875, 1.1633453369140625, 1.201019287109375, 1.2386932373046875, 1.2763671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 6.0, 11.0, 9.0, 14.0, 13.0, 13.0, 27.0, 32.0, 27.0, 32.0, 34.0, 39.0, 43.0, 52.0, 48.0, 49.0, 37.0, 31.0, 43.0, 37.0, 50.0, 34.0, 46.0, 41.0, 31.0, 29.0, 31.0, 19.0, 27.0, 14.0, 8.0, 10.0, 14.0, 4.0, 14.0, 4.0, 6.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.4453125, -14.024169921875, -13.60302734375, -13.181884765625, -12.7607421875, -12.339599609375, -11.91845703125, -11.497314453125, -11.076171875, -10.655029296875, -10.23388671875, -9.812744140625, -9.3916015625, -8.970458984375, -8.54931640625, -8.128173828125, -7.70703125, -7.285888671875, -6.86474609375, -6.443603515625, -6.0224609375, -5.601318359375, -5.18017578125, -4.759033203125, -4.337890625, -3.916748046875, -3.49560546875, -3.074462890625, -2.6533203125, -2.232177734375, -1.81103515625, -1.389892578125, -0.96875, -0.547607421875, -0.12646484375, 0.294677734375, 0.7158203125, 1.136962890625, 1.55810546875, 1.979248046875, 2.400390625, 2.821533203125, 3.24267578125, 3.663818359375, 4.0849609375, 4.506103515625, 4.92724609375, 5.348388671875, 5.76953125, 6.190673828125, 6.61181640625, 7.032958984375, 7.4541015625, 7.875244140625, 8.29638671875, 8.717529296875, 9.138671875, 9.559814453125, 9.98095703125, 10.402099609375, 10.8232421875, 11.244384765625, 11.66552734375, 12.086669921875, 12.5078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 6.0, 11.0, 7.0, 15.0, 22.0, 43.0, 54.0, 106.0, 151.0, 265.0, 442.0, 829.0, 1729.0, 3529.0, 8022.0, 20821.0, 62422.0, 209236.0, 406136.0, 227620.0, 68311.0, 22331.0, 8755.0, 3735.0, 1798.0, 907.0, 511.0, 278.0, 142.0, 111.0, 76.0, 47.0, 21.0, 20.0, 6.0, 13.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.533203125, -0.5181999206542969, -0.5031967163085938, -0.4881935119628906, -0.4731903076171875, -0.4581871032714844, -0.44318389892578125, -0.4281806945800781, -0.413177490234375, -0.3981742858886719, -0.38317108154296875, -0.3681678771972656, -0.3531646728515625, -0.3381614685058594, -0.32315826416015625, -0.3081550598144531, -0.29315185546875, -0.2781486511230469, -0.26314544677734375, -0.24814224243164062, -0.2331390380859375, -0.21813583374023438, -0.20313262939453125, -0.18812942504882812, -0.173126220703125, -0.15812301635742188, -0.14311981201171875, -0.12811660766601562, -0.1131134033203125, -0.09811019897460938, -0.08310699462890625, -0.06810379028320312, -0.0531005859375, -0.038097381591796875, -0.02309417724609375, -0.008090972900390625, 0.0069122314453125, 0.021915435791015625, 0.03691864013671875, 0.051921844482421875, 0.066925048828125, 0.08192825317382812, 0.09693145751953125, 0.11193466186523438, 0.1269378662109375, 0.14194107055664062, 0.15694427490234375, 0.17194747924804688, 0.18695068359375, 0.20195388793945312, 0.21695709228515625, 0.23196029663085938, 0.2469635009765625, 0.2619667053222656, 0.27696990966796875, 0.2919731140136719, 0.306976318359375, 0.3219795227050781, 0.33698272705078125, 0.3519859313964844, 0.3669891357421875, 0.3819923400878906, 0.39699554443359375, 0.4119987487792969, 0.427001953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 9.0, 13.0, 20.0, 30.0, 30.0, 43.0, 43.0, 71.0, 100.0, 96.0, 96.0, 76.0, 78.0, 84.0, 52.0, 34.0, 18.0, 18.0, 20.0, 11.0, 10.0, 2.0, 7.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000293731689453125, -0.000285126268863678, -0.00027652084827423096, -0.00026791542768478394, -0.0002593100070953369, -0.0002507045865058899, -0.00024209916591644287, -0.00023349374532699585, -0.00022488832473754883, -0.0002162829041481018, -0.00020767748355865479, -0.00019907206296920776, -0.00019046664237976074, -0.00018186122179031372, -0.0001732558012008667, -0.00016465038061141968, -0.00015604496002197266, -0.00014743953943252563, -0.0001388341188430786, -0.0001302286982536316, -0.00012162327766418457, -0.00011301785707473755, -0.00010441243648529053, -9.58070158958435e-05, -8.720159530639648e-05, -7.859617471694946e-05, -6.999075412750244e-05, -6.138533353805542e-05, -5.27799129486084e-05, -4.417449235916138e-05, -3.5569071769714355e-05, -2.6963651180267334e-05, -1.8358230590820312e-05, -9.752810001373291e-06, -1.1473894119262695e-06, 7.458031177520752e-06, 1.6063451766967773e-05, 2.4668872356414795e-05, 3.3274292945861816e-05, 4.187971353530884e-05, 5.048513412475586e-05, 5.909055471420288e-05, 6.76959753036499e-05, 7.630139589309692e-05, 8.490681648254395e-05, 9.351223707199097e-05, 0.00010211765766143799, 0.00011072307825088501, 0.00011932849884033203, 0.00012793391942977905, 0.00013653934001922607, 0.0001451447606086731, 0.00015375018119812012, 0.00016235560178756714, 0.00017096102237701416, 0.00017956644296646118, 0.0001881718635559082, 0.00019677728414535522, 0.00020538270473480225, 0.00021398812532424927, 0.0002225935459136963, 0.0002311989665031433, 0.00023980438709259033, 0.00024840980768203735, 0.0002570152282714844]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 13.0, 15.0, 29.0, 46.0, 99.0, 168.0, 426.0, 1306.0, 5428.0, 27996.0, 216195.0, 648682.0, 124382.0, 18264.0, 3775.0, 976.0, 369.0, 161.0, 85.0, 45.0, 32.0, 21.0, 14.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01171875, -0.9814071655273438, -0.9510955810546875, -0.9207839965820312, -0.890472412109375, -0.8601608276367188, -0.8298492431640625, -0.7995376586914062, -0.76922607421875, -0.7389144897460938, -0.7086029052734375, -0.6782913208007812, -0.647979736328125, -0.6176681518554688, -0.5873565673828125, -0.5570449829101562, -0.5267333984375, -0.49642181396484375, -0.4661102294921875, -0.43579864501953125, -0.405487060546875, -0.37517547607421875, -0.3448638916015625, -0.31455230712890625, -0.28424072265625, -0.25392913818359375, -0.2236175537109375, -0.19330596923828125, -0.162994384765625, -0.13268280029296875, -0.1023712158203125, -0.07205963134765625, -0.041748046875, -0.01143646240234375, 0.0188751220703125, 0.04918670654296875, 0.079498291015625, 0.10980987548828125, 0.1401214599609375, 0.17043304443359375, 0.20074462890625, 0.23105621337890625, 0.2613677978515625, 0.29167938232421875, 0.321990966796875, 0.35230255126953125, 0.3826141357421875, 0.41292572021484375, 0.4432373046875, 0.47354888916015625, 0.5038604736328125, 0.5341720581054688, 0.564483642578125, 0.5947952270507812, 0.6251068115234375, 0.6554183959960938, 0.68572998046875, 0.7160415649414062, 0.7463531494140625, 0.7766647338867188, 0.806976318359375, 0.8372879028320312, 0.8675994873046875, 0.8979110717773438, 0.92822265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 5.0, 16.0, 19.0, 30.0, 22.0, 51.0, 56.0, 105.0, 85.0, 123.0, 96.0, 87.0, 75.0, 67.0, 37.0, 25.0, 27.0, 14.0, 13.0, 13.0, 8.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1890869140625, -0.18049049377441406, -0.17189407348632812, -0.1632976531982422, -0.15470123291015625, -0.1461048126220703, -0.13750839233398438, -0.12891197204589844, -0.1203155517578125, -0.11171913146972656, -0.10312271118164062, -0.09452629089355469, -0.08592987060546875, -0.07733345031738281, -0.06873703002929688, -0.06014060974121094, -0.051544189453125, -0.04294776916503906, -0.034351348876953125, -0.025754928588867188, -0.01715850830078125, -0.008562088012695312, 3.4332275390625e-05, 0.008630752563476562, 0.0172271728515625, 0.025823593139648438, 0.034420013427734375, 0.04301643371582031, 0.05161285400390625, 0.06020927429199219, 0.06880569458007812, 0.07740211486816406, 0.08599853515625, 0.09459495544433594, 0.10319137573242188, 0.11178779602050781, 0.12038421630859375, 0.1289806365966797, 0.13757705688476562, 0.14617347717285156, 0.1547698974609375, 0.16336631774902344, 0.17196273803710938, 0.1805591583251953, 0.18915557861328125, 0.1977519989013672, 0.20634841918945312, 0.21494483947753906, 0.223541259765625, 0.23213768005371094, 0.24073410034179688, 0.2493305206298828, 0.25792694091796875, 0.2665233612060547, 0.2751197814941406, 0.28371620178222656, 0.2923126220703125, 0.30090904235839844, 0.3095054626464844, 0.3181018829345703, 0.32669830322265625, 0.3352947235107422, 0.3438911437988281, 0.35248756408691406, 0.361083984375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 12.0, 30.0, 107.0, 249.0, 326.0, 203.0, 59.0, 17.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.834693908691406, -57.7685661315918, -56.70244216918945, -55.636314392089844, -54.5701904296875, -53.50406265258789, -52.43793487548828, -51.37181091308594, -50.30568313598633, -49.23955535888672, -48.173431396484375, -47.107303619384766, -46.04117965698242, -44.97505187988281, -43.90892791748047, -42.84280014038086, -41.77667236328125, -40.71054458618164, -39.6444206237793, -38.57829284667969, -37.512168884277344, -36.446041107177734, -35.379913330078125, -34.31378936767578, -33.24766540527344, -32.18153762817383, -31.115413665771484, -30.049285888671875, -28.9831600189209, -27.917034149169922, -26.850908279418945, -25.78478240966797, -24.71865463256836, -23.652528762817383, -22.586402893066406, -21.520275115966797, -20.45414924621582, -19.388023376464844, -18.321897506713867, -17.25577163696289, -16.18964385986328, -15.123517990112305, -14.057391166687012, -12.991265296936035, -11.925138473510742, -10.859012603759766, -9.792886734008789, -8.726760864257812, -7.660634994506836, -6.594508647918701, -5.528382301330566, -4.46225643157959, -3.396130084991455, -2.3300037384033203, -1.2638778686523438, -0.19775152206420898, 0.8683748245239258, 1.934501051902771, 3.000627279281616, 4.066753387451172, 5.132879734039307, 6.199006080627441, 7.265131950378418, 8.331258773803711, 9.397384643554688]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 28.0, 34.0, 45.0, 40.0, 66.0, 73.0, 64.0, 86.0, 72.0, 79.0, 74.0, 69.0, 53.0, 44.0, 41.0, 28.0, 22.0, 14.0, 17.0, 9.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.099833488464355, -14.734400749206543, -14.36896800994873, -14.003535270690918, -13.638102531433105, -13.272669792175293, -12.907236099243164, -12.541803359985352, -12.176370620727539, -11.810937881469727, -11.445505142211914, -11.080072402954102, -10.714639663696289, -10.349206924438477, -9.983774185180664, -9.618341445922852, -9.252908706665039, -8.887475967407227, -8.522043228149414, -8.156610488891602, -7.791177749633789, -7.425745010375977, -7.060311794281006, -6.694879055023193, -6.329446315765381, -5.964013576507568, -5.598580837249756, -5.233147621154785, -4.867714881896973, -4.50228214263916, -4.136849403381348, -3.771416664123535, -3.405984878540039, -3.0405521392822266, -2.675119400024414, -2.3096864223480225, -1.94425368309021, -1.5788209438323975, -1.2133879661560059, -0.8479552268981934, -0.48252248764038086, -0.11708968877792358, 0.2483431100845337, 0.6137759685516357, 0.9792087078094482, 1.3446414470672607, 1.7100744247436523, 2.075507164001465, 2.4409399032592773, 2.80637264251709, 3.1718053817749023, 3.537238359451294, 3.9026710987091064, 4.26810359954834, 4.6335368156433105, 4.998969554901123, 5.3644022941589355, 5.729835033416748, 6.0952677726745605, 6.460700988769531, 6.826133728027344, 7.191566467285156, 7.556999206542969, 7.922431945800781, 8.287864685058594]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 5.0, 16.0, 25.0, 21.0, 40.0, 72.0, 121.0, 184.0, 417.0, 971.0, 2347.0, 5912.0, 16519.0, 49180.0, 146565.0, 343905.0, 304931.0, 116704.0, 38869.0, 13442.0, 4825.0, 1846.0, 791.0, 362.0, 172.0, 104.0, 61.0, 46.0, 24.0, 20.0, 18.0, 10.0, 9.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046875, -6.8111572265625, -6.575439453125, -6.3397216796875, -6.10400390625, -5.8682861328125, -5.632568359375, -5.3968505859375, -5.1611328125, -4.9254150390625, -4.689697265625, -4.4539794921875, -4.21826171875, -3.9825439453125, -3.746826171875, -3.5111083984375, -3.275390625, -3.0396728515625, -2.803955078125, -2.5682373046875, -2.33251953125, -2.0968017578125, -1.861083984375, -1.6253662109375, -1.3896484375, -1.1539306640625, -0.918212890625, -0.6824951171875, -0.44677734375, -0.2110595703125, 0.024658203125, 0.2603759765625, 0.49609375, 0.7318115234375, 0.967529296875, 1.2032470703125, 1.43896484375, 1.6746826171875, 1.910400390625, 2.1461181640625, 2.3818359375, 2.6175537109375, 2.853271484375, 3.0889892578125, 3.32470703125, 3.5604248046875, 3.796142578125, 4.0318603515625, 4.267578125, 4.5032958984375, 4.739013671875, 4.9747314453125, 5.21044921875, 5.4461669921875, 5.681884765625, 5.9176025390625, 6.1533203125, 6.3890380859375, 6.624755859375, 6.8604736328125, 7.09619140625, 7.3319091796875, 7.567626953125, 7.8033447265625, 8.0390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 2.0, 3.0, 12.0, 15.0, 26.0, 31.0, 45.0, 44.0, 44.0, 52.0, 54.0, 67.0, 69.0, 72.0, 68.0, 64.0, 66.0, 43.0, 40.0, 49.0, 31.0, 29.0, 17.0, 11.0, 14.0, 10.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.828125, -23.2215576171875, -22.614990234375, -22.0084228515625, -21.40185546875, -20.7952880859375, -20.188720703125, -19.5821533203125, -18.9755859375, -18.3690185546875, -17.762451171875, -17.1558837890625, -16.54931640625, -15.9427490234375, -15.336181640625, -14.7296142578125, -14.123046875, -13.5164794921875, -12.909912109375, -12.3033447265625, -11.69677734375, -11.0902099609375, -10.483642578125, -9.8770751953125, -9.2705078125, -8.6639404296875, -8.057373046875, -7.4508056640625, -6.84423828125, -6.2376708984375, -5.631103515625, -5.0245361328125, -4.41796875, -3.8114013671875, -3.204833984375, -2.5982666015625, -1.99169921875, -1.3851318359375, -0.778564453125, -0.1719970703125, 0.4345703125, 1.0411376953125, 1.647705078125, 2.2542724609375, 2.86083984375, 3.4674072265625, 4.073974609375, 4.6805419921875, 5.287109375, 5.8936767578125, 6.500244140625, 7.1068115234375, 7.71337890625, 8.3199462890625, 8.926513671875, 9.5330810546875, 10.1396484375, 10.7462158203125, 11.352783203125, 11.9593505859375, 12.56591796875, 13.1724853515625, 13.779052734375, 14.3856201171875, 14.9921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 7.0, 6.0, 11.0, 12.0, 16.0, 19.0, 25.0, 34.0, 38.0, 47.0, 45.0, 102.0, 177.0, 419.0, 5695.0, 1005393.0, 35270.0, 652.0, 198.0, 101.0, 47.0, 49.0, 42.0, 23.0, 21.0, 27.0, 18.0, 11.0, 14.0, 11.0, 3.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.03125, -50.529296875, -49.02734375, -47.525390625, -46.0234375, -44.521484375, -43.01953125, -41.517578125, -40.015625, -38.513671875, -37.01171875, -35.509765625, -34.0078125, -32.505859375, -31.00390625, -29.501953125, -28.0, -26.498046875, -24.99609375, -23.494140625, -21.9921875, -20.490234375, -18.98828125, -17.486328125, -15.984375, -14.482421875, -12.98046875, -11.478515625, -9.9765625, -8.474609375, -6.97265625, -5.470703125, -3.96875, -2.466796875, -0.96484375, 0.537109375, 2.0390625, 3.541015625, 5.04296875, 6.544921875, 8.046875, 9.548828125, 11.05078125, 12.552734375, 14.0546875, 15.556640625, 17.05859375, 18.560546875, 20.0625, 21.564453125, 23.06640625, 24.568359375, 26.0703125, 27.572265625, 29.07421875, 30.576171875, 32.078125, 33.580078125, 35.08203125, 36.583984375, 38.0859375, 39.587890625, 41.08984375, 42.591796875, 44.09375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 13.0, 9.0, 11.0, 17.0, 23.0, 27.0, 27.0, 36.0, 21.0, 38.0, 43.0, 48.0, 35.0, 51.0, 51.0, 45.0, 44.0, 46.0, 51.0, 46.0, 40.0, 37.0, 32.0, 26.0, 30.0, 19.0, 23.0, 16.0, 19.0, 9.0, 13.0, 12.0, 5.0, 5.0, 3.0, 2.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.3515625, -14.9102783203125, -14.468994140625, -14.0277099609375, -13.58642578125, -13.1451416015625, -12.703857421875, -12.2625732421875, -11.8212890625, -11.3800048828125, -10.938720703125, -10.4974365234375, -10.05615234375, -9.6148681640625, -9.173583984375, -8.7322998046875, -8.291015625, -7.8497314453125, -7.408447265625, -6.9671630859375, -6.52587890625, -6.0845947265625, -5.643310546875, -5.2020263671875, -4.7607421875, -4.3194580078125, -3.878173828125, -3.4368896484375, -2.99560546875, -2.5543212890625, -2.113037109375, -1.6717529296875, -1.23046875, -0.7891845703125, -0.347900390625, 0.0933837890625, 0.53466796875, 0.9759521484375, 1.417236328125, 1.8585205078125, 2.2998046875, 2.7410888671875, 3.182373046875, 3.6236572265625, 4.06494140625, 4.5062255859375, 4.947509765625, 5.3887939453125, 5.830078125, 6.2713623046875, 6.712646484375, 7.1539306640625, 7.59521484375, 8.0364990234375, 8.477783203125, 8.9190673828125, 9.3603515625, 9.8016357421875, 10.242919921875, 10.6842041015625, 11.12548828125, 11.5667724609375, 12.008056640625, 12.4493408203125, 12.890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 7.0, 15.0, 21.0, 36.0, 72.0, 105.0, 204.0, 376.0, 870.0, 2384.0, 9517.0, 89020.0, 676208.0, 244246.0, 19374.0, 3722.0, 1193.0, 507.0, 280.0, 144.0, 84.0, 40.0, 24.0, 25.0, 15.0, 9.0, 7.0, 3.0, 6.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.68359375, -5.5286865234375, -5.373779296875, -5.2188720703125, -5.06396484375, -4.9090576171875, -4.754150390625, -4.5992431640625, -4.4443359375, -4.2894287109375, -4.134521484375, -3.9796142578125, -3.82470703125, -3.6697998046875, -3.514892578125, -3.3599853515625, -3.205078125, -3.0501708984375, -2.895263671875, -2.7403564453125, -2.58544921875, -2.4305419921875, -2.275634765625, -2.1207275390625, -1.9658203125, -1.8109130859375, -1.656005859375, -1.5010986328125, -1.34619140625, -1.1912841796875, -1.036376953125, -0.8814697265625, -0.7265625, -0.5716552734375, -0.416748046875, -0.2618408203125, -0.10693359375, 0.0479736328125, 0.202880859375, 0.3577880859375, 0.5126953125, 0.6676025390625, 0.822509765625, 0.9774169921875, 1.13232421875, 1.2872314453125, 1.442138671875, 1.5970458984375, 1.751953125, 1.9068603515625, 2.061767578125, 2.2166748046875, 2.37158203125, 2.5264892578125, 2.681396484375, 2.8363037109375, 2.9912109375, 3.1461181640625, 3.301025390625, 3.4559326171875, 3.61083984375, 3.7657470703125, 3.920654296875, 4.0755615234375, 4.23046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 17.0, 36.0, 47.0, 49.0, 72.0, 101.0, 122.0, 107.0, 111.0, 86.0, 69.0, 53.0, 35.0, 27.0, 12.0, 13.0, 9.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008263587951660156, -0.000804804265499115, -0.0007832497358322144, -0.0007616952061653137, -0.0007401406764984131, -0.0007185861468315125, -0.0006970316171646118, -0.0006754770874977112, -0.0006539225578308105, -0.0006323680281639099, -0.0006108134984970093, -0.0005892589688301086, -0.000567704439163208, -0.0005461499094963074, -0.0005245953798294067, -0.0005030408501625061, -0.00048148632049560547, -0.00045993179082870483, -0.0004383772611618042, -0.00041682273149490356, -0.00039526820182800293, -0.0003737136721611023, -0.00035215914249420166, -0.000330604612827301, -0.0003090500831604004, -0.00028749555349349976, -0.0002659410238265991, -0.0002443864941596985, -0.00022283196449279785, -0.00020127743482589722, -0.00017972290515899658, -0.00015816837549209595, -0.0001366138458251953, -0.00011505931615829468, -9.350478649139404e-05, -7.195025682449341e-05, -5.0395727157592773e-05, -2.884119749069214e-05, -7.286667823791504e-06, 1.4267861843109131e-05, 3.5822391510009766e-05, 5.73769211769104e-05, 7.893145084381104e-05, 0.00010048598051071167, 0.0001220405101776123, 0.00014359503984451294, 0.00016514956951141357, 0.0001867040991783142, 0.00020825862884521484, 0.00022981315851211548, 0.0002513676881790161, 0.00027292221784591675, 0.0002944767475128174, 0.000316031277179718, 0.00033758580684661865, 0.0003591403365135193, 0.0003806948661804199, 0.00040224939584732056, 0.0004238039255142212, 0.0004453584551811218, 0.00046691298484802246, 0.0004884675145149231, 0.0005100220441818237, 0.0005315765738487244, 0.000553131103515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 14.0, 14.0, 20.0, 38.0, 50.0, 97.0, 218.0, 556.0, 1572.0, 7227.0, 63422.0, 615890.0, 328772.0, 24968.0, 3930.0, 1020.0, 363.0, 137.0, 82.0, 51.0, 38.0, 22.0, 7.0, 7.0, 9.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.27557373046875, -5.1097412109375, -4.94390869140625, -4.778076171875, -4.61224365234375, -4.4464111328125, -4.28057861328125, -4.11474609375, -3.94891357421875, -3.7830810546875, -3.61724853515625, -3.451416015625, -3.28558349609375, -3.1197509765625, -2.95391845703125, -2.7880859375, -2.62225341796875, -2.4564208984375, -2.29058837890625, -2.124755859375, -1.95892333984375, -1.7930908203125, -1.62725830078125, -1.46142578125, -1.29559326171875, -1.1297607421875, -0.96392822265625, -0.798095703125, -0.63226318359375, -0.4664306640625, -0.30059814453125, -0.134765625, 0.03106689453125, 0.1968994140625, 0.36273193359375, 0.528564453125, 0.69439697265625, 0.8602294921875, 1.02606201171875, 1.19189453125, 1.35772705078125, 1.5235595703125, 1.68939208984375, 1.855224609375, 2.02105712890625, 2.1868896484375, 2.35272216796875, 2.5185546875, 2.68438720703125, 2.8502197265625, 3.01605224609375, 3.181884765625, 3.34771728515625, 3.5135498046875, 3.67938232421875, 3.84521484375, 4.01104736328125, 4.1768798828125, 4.34271240234375, 4.508544921875, 4.67437744140625, 4.8402099609375, 5.00604248046875, 5.171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 1.0, 4.0, 6.0, 11.0, 9.0, 18.0, 17.0, 17.0, 33.0, 47.0, 58.0, 63.0, 51.0, 74.0, 69.0, 61.0, 74.0, 67.0, 62.0, 44.0, 36.0, 34.0, 36.0, 24.0, 18.0, 17.0, 9.0, 7.0, 11.0, 2.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5478515625, -1.5027923583984375, -1.457733154296875, -1.4126739501953125, -1.36761474609375, -1.3225555419921875, -1.277496337890625, -1.2324371337890625, -1.1873779296875, -1.1423187255859375, -1.097259521484375, -1.0522003173828125, -1.00714111328125, -0.9620819091796875, -0.917022705078125, -0.8719635009765625, -0.826904296875, -0.7818450927734375, -0.736785888671875, -0.6917266845703125, -0.64666748046875, -0.6016082763671875, -0.556549072265625, -0.5114898681640625, -0.4664306640625, -0.4213714599609375, -0.376312255859375, -0.3312530517578125, -0.28619384765625, -0.2411346435546875, -0.196075439453125, -0.1510162353515625, -0.10595703125, -0.0608978271484375, -0.015838623046875, 0.0292205810546875, 0.07427978515625, 0.1193389892578125, 0.164398193359375, 0.2094573974609375, 0.2545166015625, 0.2995758056640625, 0.344635009765625, 0.3896942138671875, 0.43475341796875, 0.4798126220703125, 0.524871826171875, 0.5699310302734375, 0.614990234375, 0.6600494384765625, 0.705108642578125, 0.7501678466796875, 0.79522705078125, 0.8402862548828125, 0.885345458984375, 0.9304046630859375, 0.9754638671875, 1.0205230712890625, 1.065582275390625, 1.1106414794921875, 1.15570068359375, 1.2007598876953125, 1.245819091796875, 1.2908782958984375, 1.3359375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 28.0, 149.0, 450.0, 322.0, 54.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.27066040039062, -68.93173217773438, -65.59280395507812, -62.253875732421875, -58.914947509765625, -55.576019287109375, -52.237091064453125, -48.898162841796875, -45.559234619140625, -42.220306396484375, -38.881378173828125, -35.542449951171875, -32.203521728515625, -28.864591598510742, -25.525663375854492, -22.186735153198242, -18.84780502319336, -15.50887680053711, -12.16994857788086, -8.831019401550293, -5.492091178894043, -2.1531620025634766, 1.1857662200927734, 4.524694442749023, 7.863622665405273, 11.202550888061523, 14.541479110717773, 17.880409240722656, 21.219337463378906, 24.558265686035156, 27.897193908691406, 31.236122131347656, 34.575050354003906, 37.913978576660156, 41.252906799316406, 44.591835021972656, 47.930763244628906, 51.269691467285156, 54.608619689941406, 57.947547912597656, 61.286476135253906, 64.62540435791016, 67.9643325805664, 71.30326080322266, 74.6421890258789, 77.98111724853516, 81.3200454711914, 84.65897369384766, 87.99790954589844, 91.33683776855469, 94.67576599121094, 98.01469421386719, 101.35362243652344, 104.69255065917969, 108.03147888183594, 111.37040710449219, 114.70933532714844, 118.04826354980469, 121.38719177246094, 124.72611999511719, 128.06504821777344, 131.4039764404297, 134.74290466308594, 138.0818328857422, 141.42076110839844]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 10.0, 7.0, 8.0, 18.0, 10.0, 14.0, 32.0, 29.0, 30.0, 46.0, 34.0, 42.0, 48.0, 48.0, 42.0, 52.0, 53.0, 55.0, 45.0, 45.0, 35.0, 43.0, 33.0, 44.0, 20.0, 31.0, 26.0, 20.0, 20.0, 10.0, 7.0, 6.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.464340209960938, -28.640134811401367, -27.815929412841797, -26.991722106933594, -26.167516708374023, -25.343311309814453, -24.519105911254883, -23.694900512695312, -22.870695114135742, -22.046489715576172, -21.2222843170166, -20.39807891845703, -19.573871612548828, -18.749666213989258, -17.925460815429688, -17.101255416870117, -16.277050018310547, -15.452844619750977, -14.62863826751709, -13.80443286895752, -12.98022747039795, -12.156021118164062, -11.331815719604492, -10.507610321044922, -9.683403015136719, -8.859197616577148, -8.034991264343262, -7.210785865783691, -6.386580467224121, -5.562374591827393, -4.738168716430664, -3.9139633178710938, -3.0897579193115234, -2.265552282333374, -1.441346526145935, -0.6171407699584961, 0.20706486701965332, 1.0312705039978027, 1.8554763793945312, 2.6796817779541016, 3.50388765335083, 4.328093528747559, 5.152298927307129, 5.976504802703857, 6.800710678100586, 7.624916076660156, 8.449121475219727, 9.273326873779297, 10.097533226013184, 10.921738624572754, 11.74594497680664, 12.570150375366211, 13.394355773925781, 14.218561172485352, 15.042767524719238, 15.866972923278809, 16.691179275512695, 17.515384674072266, 18.339590072631836, 19.163795471191406, 19.98800277709961, 20.81220817565918, 21.63641357421875, 22.46061897277832, 23.28482437133789]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 12.0, 11.0, 19.0, 30.0, 50.0, 88.0, 124.0, 243.0, 518.0, 1752.0, 18098.0, 971629.0, 3078071.0, 117667.0, 4309.0, 766.0, 319.0, 194.0, 126.0, 81.0, 53.0, 39.0, 26.0, 16.0, 13.0, 9.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.375, -34.449951171875, -33.52490234375, -32.599853515625, -31.6748046875, -30.749755859375, -29.82470703125, -28.899658203125, -27.974609375, -27.049560546875, -26.12451171875, -25.199462890625, -24.2744140625, -23.349365234375, -22.42431640625, -21.499267578125, -20.57421875, -19.649169921875, -18.72412109375, -17.799072265625, -16.8740234375, -15.948974609375, -15.02392578125, -14.098876953125, -13.173828125, -12.248779296875, -11.32373046875, -10.398681640625, -9.4736328125, -8.548583984375, -7.62353515625, -6.698486328125, -5.7734375, -4.848388671875, -3.92333984375, -2.998291015625, -2.0732421875, -1.148193359375, -0.22314453125, 0.701904296875, 1.626953125, 2.552001953125, 3.47705078125, 4.402099609375, 5.3271484375, 6.252197265625, 7.17724609375, 8.102294921875, 9.02734375, 9.952392578125, 10.87744140625, 11.802490234375, 12.7275390625, 13.652587890625, 14.57763671875, 15.502685546875, 16.427734375, 17.352783203125, 18.27783203125, 19.202880859375, 20.1279296875, 21.052978515625, 21.97802734375, 22.903076171875, 23.828125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 5.0, 8.0, 17.0, 25.0, 23.0, 28.0, 34.0, 49.0, 48.0, 55.0, 65.0, 60.0, 63.0, 50.0, 71.0, 47.0, 52.0, 54.0, 45.0, 44.0, 30.0, 22.0, 27.0, 23.0, 18.0, 9.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0, -13.5902099609375, -13.180419921875, -12.7706298828125, -12.36083984375, -11.9510498046875, -11.541259765625, -11.1314697265625, -10.7216796875, -10.3118896484375, -9.902099609375, -9.4923095703125, -9.08251953125, -8.6727294921875, -8.262939453125, -7.8531494140625, -7.443359375, -7.0335693359375, -6.623779296875, -6.2139892578125, -5.80419921875, -5.3944091796875, -4.984619140625, -4.5748291015625, -4.1650390625, -3.7552490234375, -3.345458984375, -2.9356689453125, -2.52587890625, -2.1160888671875, -1.706298828125, -1.2965087890625, -0.88671875, -0.4769287109375, -0.067138671875, 0.3426513671875, 0.75244140625, 1.1622314453125, 1.572021484375, 1.9818115234375, 2.3916015625, 2.8013916015625, 3.211181640625, 3.6209716796875, 4.03076171875, 4.4405517578125, 4.850341796875, 5.2601318359375, 5.669921875, 6.0797119140625, 6.489501953125, 6.8992919921875, 7.30908203125, 7.7188720703125, 8.128662109375, 8.5384521484375, 8.9482421875, 9.3580322265625, 9.767822265625, 10.1776123046875, 10.58740234375, 10.9971923828125, 11.406982421875, 11.8167724609375, 12.2265625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 11.0, 3.0, 6.0, 6.0, 9.0, 15.0, 15.0, 14.0, 17.0, 19.0, 23.0, 46.0, 40.0, 84.0, 194.0, 674.0, 11607.0, 4087494.0, 92024.0, 1299.0, 299.0, 108.0, 70.0, 50.0, 28.0, 21.0, 21.0, 9.0, 11.0, 17.0, 8.0, 7.0, 11.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.90625, -54.33837890625, -52.7705078125, -51.20263671875, -49.634765625, -48.06689453125, -46.4990234375, -44.93115234375, -43.36328125, -41.79541015625, -40.2275390625, -38.65966796875, -37.091796875, -35.52392578125, -33.9560546875, -32.38818359375, -30.8203125, -29.25244140625, -27.6845703125, -26.11669921875, -24.548828125, -22.98095703125, -21.4130859375, -19.84521484375, -18.27734375, -16.70947265625, -15.1416015625, -13.57373046875, -12.005859375, -10.43798828125, -8.8701171875, -7.30224609375, -5.734375, -4.16650390625, -2.5986328125, -1.03076171875, 0.537109375, 2.10498046875, 3.6728515625, 5.24072265625, 6.80859375, 8.37646484375, 9.9443359375, 11.51220703125, 13.080078125, 14.64794921875, 16.2158203125, 17.78369140625, 19.3515625, 20.91943359375, 22.4873046875, 24.05517578125, 25.623046875, 27.19091796875, 28.7587890625, 30.32666015625, 31.89453125, 33.46240234375, 35.0302734375, 36.59814453125, 38.166015625, 39.73388671875, 41.3017578125, 42.86962890625, 44.4375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 13.0, 5.0, 13.0, 18.0, 20.0, 46.0, 65.0, 88.0, 134.0, 220.0, 287.0, 434.0, 546.0, 530.0, 519.0, 402.0, 243.0, 170.0, 114.0, 85.0, 40.0, 22.0, 20.0, 8.0, 8.0, 8.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.656585693359375, -5.50457763671875, -5.352569580078125, -5.2005615234375, -5.048553466796875, -4.89654541015625, -4.744537353515625, -4.592529296875, -4.440521240234375, -4.28851318359375, -4.136505126953125, -3.9844970703125, -3.832489013671875, -3.68048095703125, -3.528472900390625, -3.37646484375, -3.224456787109375, -3.07244873046875, -2.920440673828125, -2.7684326171875, -2.616424560546875, -2.46441650390625, -2.312408447265625, -2.160400390625, -2.008392333984375, -1.85638427734375, -1.704376220703125, -1.5523681640625, -1.400360107421875, -1.24835205078125, -1.096343994140625, -0.9443359375, -0.792327880859375, -0.64031982421875, -0.488311767578125, -0.3363037109375, -0.184295654296875, -0.03228759765625, 0.119720458984375, 0.271728515625, 0.423736572265625, 0.57574462890625, 0.727752685546875, 0.8797607421875, 1.031768798828125, 1.18377685546875, 1.335784912109375, 1.48779296875, 1.639801025390625, 1.79180908203125, 1.943817138671875, 2.0958251953125, 2.247833251953125, 2.39984130859375, 2.551849365234375, 2.703857421875, 2.855865478515625, 3.00787353515625, 3.159881591796875, 3.3118896484375, 3.463897705078125, 3.61590576171875, 3.767913818359375, 3.919921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 6.0, 14.0, 35.0, 50.0, 87.0, 128.0, 145.0, 118.0, 123.0, 121.0, 70.0, 43.0, 26.0, 16.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0], "bins": [-38.06821823120117, -37.32301712036133, -36.57781982421875, -35.832618713378906, -35.08741760253906, -34.342220306396484, -33.59701919555664, -32.85182189941406, -32.10662078857422, -31.361421585083008, -30.616222381591797, -29.871021270751953, -29.125822067260742, -28.38062286376953, -27.635421752929688, -26.890222549438477, -26.145023345947266, -25.399824142456055, -24.654624938964844, -23.909423828125, -23.16422462463379, -22.419025421142578, -21.673824310302734, -20.928625106811523, -20.183425903320312, -19.4382266998291, -18.69302749633789, -17.947826385498047, -17.202627182006836, -16.457427978515625, -15.712227821350098, -14.96702766418457, -14.22182846069336, -13.476629257202148, -12.731429100036621, -11.986228942871094, -11.241029739379883, -10.495830535888672, -9.750630378723145, -9.005430221557617, -8.260231018066406, -7.515031337738037, -6.769831657409668, -6.024631977081299, -5.27943229675293, -4.5342326164245605, -3.7890329360961914, -3.0438332557678223, -2.298633575439453, -1.553433895111084, -0.8082342147827148, -0.0630345344543457, 0.6821651458740234, 1.4273648262023926, 2.1725645065307617, 2.917764186859131, 3.6629638671875, 4.408163547515869, 5.153363227844238, 5.898562908172607, 6.643762588500977, 7.388962268829346, 8.134161949157715, 8.879362106323242, 9.624561309814453]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 15.0, 14.0, 21.0, 22.0, 30.0, 38.0, 37.0, 50.0, 42.0, 55.0, 55.0, 50.0, 59.0, 63.0, 55.0, 56.0, 53.0, 48.0, 40.0, 34.0, 22.0, 24.0, 25.0, 20.0, 20.0, 6.0, 4.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.89266586303711, -15.46429443359375, -15.03592300415039, -14.607552528381348, -14.179181098937988, -13.750809669494629, -13.32243824005127, -12.894067764282227, -12.465696334838867, -12.037324905395508, -11.608953475952148, -11.180583000183105, -10.752211570739746, -10.323840141296387, -9.895468711853027, -9.467098236083984, -9.038726806640625, -8.610355377197266, -8.181983947753906, -7.753612995147705, -7.325242042541504, -6.8968706130981445, -6.468499183654785, -6.040128231048584, -5.611756324768066, -5.183384895324707, -4.755013942718506, -4.3266425132751465, -3.8982715606689453, -3.469900131225586, -3.0415289402008057, -2.6131577491760254, -2.184786796569824, -1.756415605545044, -1.3280444145202637, -0.8996731042861938, -0.4713019132614136, -0.04293060302734375, 0.3854405879974365, 0.8138117790222168, 1.242182970046997, 1.6705541610717773, 2.0989253520965576, 2.527296543121338, 2.9556679725646973, 3.3840391635894775, 3.812410354614258, 4.240781784057617, 4.669152736663818, 5.097524166107178, 5.525895118713379, 5.954266548156738, 6.3826375007629395, 6.811008930206299, 7.2393798828125, 7.667751312255859, 8.096122741699219, 8.524494171142578, 8.952865600585938, 9.38123607635498, 9.80960750579834, 10.2379789352417, 10.666350364685059, 11.094720840454102, 11.523092269897461]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 11.0, 10.0, 13.0, 20.0, 37.0, 44.0, 48.0, 85.0, 135.0, 231.0, 333.0, 553.0, 982.0, 1958.0, 4081.0, 10447.0, 31607.0, 108979.0, 333377.0, 366013.0, 130549.0, 37302.0, 12121.0, 4659.0, 2147.0, 1137.0, 598.0, 357.0, 224.0, 183.0, 95.0, 63.0, 35.0, 30.0, 25.0, 21.0, 10.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.35546875, -2.28424072265625, -2.2130126953125, -2.14178466796875, -2.070556640625, -1.99932861328125, -1.9281005859375, -1.85687255859375, -1.78564453125, -1.71441650390625, -1.6431884765625, -1.57196044921875, -1.500732421875, -1.42950439453125, -1.3582763671875, -1.28704833984375, -1.2158203125, -1.14459228515625, -1.0733642578125, -1.00213623046875, -0.930908203125, -0.85968017578125, -0.7884521484375, -0.71722412109375, -0.64599609375, -0.57476806640625, -0.5035400390625, -0.43231201171875, -0.361083984375, -0.28985595703125, -0.2186279296875, -0.14739990234375, -0.076171875, -0.00494384765625, 0.0662841796875, 0.13751220703125, 0.208740234375, 0.27996826171875, 0.3511962890625, 0.42242431640625, 0.49365234375, 0.56488037109375, 0.6361083984375, 0.70733642578125, 0.778564453125, 0.84979248046875, 0.9210205078125, 0.99224853515625, 1.0634765625, 1.13470458984375, 1.2059326171875, 1.27716064453125, 1.348388671875, 1.41961669921875, 1.4908447265625, 1.56207275390625, 1.63330078125, 1.70452880859375, 1.7757568359375, 1.84698486328125, 1.918212890625, 1.98944091796875, 2.0606689453125, 2.13189697265625, 2.203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 11.0, 12.0, 16.0, 21.0, 28.0, 45.0, 36.0, 52.0, 68.0, 64.0, 71.0, 68.0, 84.0, 73.0, 62.0, 65.0, 46.0, 30.0, 32.0, 23.0, 27.0, 11.0, 11.0, 9.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9921875, -12.656005859375, -12.31982421875, -11.983642578125, -11.6474609375, -11.311279296875, -10.97509765625, -10.638916015625, -10.302734375, -9.966552734375, -9.63037109375, -9.294189453125, -8.9580078125, -8.621826171875, -8.28564453125, -7.949462890625, -7.61328125, -7.277099609375, -6.94091796875, -6.604736328125, -6.2685546875, -5.932373046875, -5.59619140625, -5.260009765625, -4.923828125, -4.587646484375, -4.25146484375, -3.915283203125, -3.5791015625, -3.242919921875, -2.90673828125, -2.570556640625, -2.234375, -1.898193359375, -1.56201171875, -1.225830078125, -0.8896484375, -0.553466796875, -0.21728515625, 0.118896484375, 0.455078125, 0.791259765625, 1.12744140625, 1.463623046875, 1.7998046875, 2.135986328125, 2.47216796875, 2.808349609375, 3.14453125, 3.480712890625, 3.81689453125, 4.153076171875, 4.4892578125, 4.825439453125, 5.16162109375, 5.497802734375, 5.833984375, 6.170166015625, 6.50634765625, 6.842529296875, 7.1787109375, 7.514892578125, 7.85107421875, 8.187255859375, 8.5234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 6.0, 1.0, 10.0, 19.0, 13.0, 26.0, 54.0, 77.0, 103.0, 189.0, 306.0, 482.0, 832.0, 1506.0, 2727.0, 5166.0, 10122.0, 20415.0, 41548.0, 82230.0, 151263.0, 217721.0, 214024.0, 143822.0, 77440.0, 38813.0, 18944.0, 9677.0, 4973.0, 2697.0, 1367.0, 802.0, 459.0, 248.0, 156.0, 95.0, 65.0, 49.0, 29.0, 21.0, 14.0, 7.0, 11.0, 11.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.1787109375, -1.1439971923828125, -1.109283447265625, -1.0745697021484375, -1.03985595703125, -1.0051422119140625, -0.970428466796875, -0.9357147216796875, -0.9010009765625, -0.8662872314453125, -0.831573486328125, -0.7968597412109375, -0.76214599609375, -0.7274322509765625, -0.692718505859375, -0.6580047607421875, -0.623291015625, -0.5885772705078125, -0.553863525390625, -0.5191497802734375, -0.48443603515625, -0.4497222900390625, -0.415008544921875, -0.3802947998046875, -0.3455810546875, -0.3108673095703125, -0.276153564453125, -0.2414398193359375, -0.20672607421875, -0.1720123291015625, -0.137298583984375, -0.1025848388671875, -0.06787109375, -0.0331573486328125, 0.001556396484375, 0.0362701416015625, 0.07098388671875, 0.1056976318359375, 0.140411376953125, 0.1751251220703125, 0.2098388671875, 0.2445526123046875, 0.279266357421875, 0.3139801025390625, 0.34869384765625, 0.3834075927734375, 0.418121337890625, 0.4528350830078125, 0.487548828125, 0.5222625732421875, 0.556976318359375, 0.5916900634765625, 0.62640380859375, 0.6611175537109375, 0.695831298828125, 0.7305450439453125, 0.7652587890625, 0.7999725341796875, 0.834686279296875, 0.8694000244140625, 0.90411376953125, 0.9388275146484375, 0.973541259765625, 1.0082550048828125, 1.04296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 9.0, 5.0, 8.0, 5.0, 8.0, 19.0, 12.0, 15.0, 24.0, 31.0, 26.0, 26.0, 20.0, 28.0, 44.0, 46.0, 41.0, 49.0, 55.0, 51.0, 42.0, 43.0, 39.0, 42.0, 57.0, 43.0, 30.0, 19.0, 30.0, 28.0, 19.0, 15.0, 13.0, 8.0, 10.0, 8.0, 9.0, 8.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3203125, -11.9046630859375, -11.489013671875, -11.0733642578125, -10.65771484375, -10.2420654296875, -9.826416015625, -9.4107666015625, -8.9951171875, -8.5794677734375, -8.163818359375, -7.7481689453125, -7.33251953125, -6.9168701171875, -6.501220703125, -6.0855712890625, -5.669921875, -5.2542724609375, -4.838623046875, -4.4229736328125, -4.00732421875, -3.5916748046875, -3.176025390625, -2.7603759765625, -2.3447265625, -1.9290771484375, -1.513427734375, -1.0977783203125, -0.68212890625, -0.2664794921875, 0.149169921875, 0.5648193359375, 0.98046875, 1.3961181640625, 1.811767578125, 2.2274169921875, 2.64306640625, 3.0587158203125, 3.474365234375, 3.8900146484375, 4.3056640625, 4.7213134765625, 5.136962890625, 5.5526123046875, 5.96826171875, 6.3839111328125, 6.799560546875, 7.2152099609375, 7.630859375, 8.0465087890625, 8.462158203125, 8.8778076171875, 9.29345703125, 9.7091064453125, 10.124755859375, 10.5404052734375, 10.9560546875, 11.3717041015625, 11.787353515625, 12.2030029296875, 12.61865234375, 13.0343017578125, 13.449951171875, 13.8656005859375, 14.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 5.0, 12.0, 13.0, 41.0, 57.0, 59.0, 97.0, 140.0, 236.0, 411.0, 710.0, 1229.0, 2389.0, 4849.0, 11269.0, 28226.0, 76123.0, 188674.0, 313232.0, 244207.0, 108043.0, 40031.0, 15293.0, 6424.0, 3058.0, 1567.0, 854.0, 455.0, 305.0, 176.0, 135.0, 67.0, 49.0, 29.0, 28.0, 17.0, 16.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.338134765625, -0.3283843994140625, -0.318634033203125, -0.3088836669921875, -0.29913330078125, -0.2893829345703125, -0.279632568359375, -0.2698822021484375, -0.2601318359375, -0.2503814697265625, -0.240631103515625, -0.2308807373046875, -0.22113037109375, -0.2113800048828125, -0.201629638671875, -0.1918792724609375, -0.18212890625, -0.1723785400390625, -0.162628173828125, -0.1528778076171875, -0.14312744140625, -0.1333770751953125, -0.123626708984375, -0.1138763427734375, -0.1041259765625, -0.0943756103515625, -0.084625244140625, -0.0748748779296875, -0.06512451171875, -0.0553741455078125, -0.045623779296875, -0.0358734130859375, -0.026123046875, -0.0163726806640625, -0.006622314453125, 0.0031280517578125, 0.01287841796875, 0.0226287841796875, 0.032379150390625, 0.0421295166015625, 0.0518798828125, 0.0616302490234375, 0.071380615234375, 0.0811309814453125, 0.09088134765625, 0.1006317138671875, 0.110382080078125, 0.1201324462890625, 0.1298828125, 0.1396331787109375, 0.149383544921875, 0.1591339111328125, 0.16888427734375, 0.1786346435546875, 0.188385009765625, 0.1981353759765625, 0.2078857421875, 0.2176361083984375, 0.227386474609375, 0.2371368408203125, 0.24688720703125, 0.2566375732421875, 0.266387939453125, 0.2761383056640625, 0.285888671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 14.0, 14.0, 24.0, 34.0, 61.0, 83.0, 101.0, 117.0, 107.0, 104.0, 109.0, 67.0, 59.0, 40.0, 26.0, 13.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00041937828063964844, -0.00040952861309051514, -0.00039967894554138184, -0.00038982927799224854, -0.00037997961044311523, -0.00037012994289398193, -0.00036028027534484863, -0.00035043060779571533, -0.00034058094024658203, -0.00033073127269744873, -0.00032088160514831543, -0.00031103193759918213, -0.00030118227005004883, -0.00029133260250091553, -0.0002814829349517822, -0.0002716332674026489, -0.0002617835998535156, -0.0002519339323043823, -0.00024208426475524902, -0.00023223459720611572, -0.00022238492965698242, -0.00021253526210784912, -0.00020268559455871582, -0.00019283592700958252, -0.00018298625946044922, -0.00017313659191131592, -0.00016328692436218262, -0.00015343725681304932, -0.00014358758926391602, -0.00013373792171478271, -0.00012388825416564941, -0.00011403858661651611, -0.00010418891906738281, -9.433925151824951e-05, -8.448958396911621e-05, -7.463991641998291e-05, -6.479024887084961e-05, -5.494058132171631e-05, -4.509091377258301e-05, -3.524124622344971e-05, -2.5391578674316406e-05, -1.5541911125183105e-05, -5.692243576049805e-06, 4.157423973083496e-06, 1.4007091522216797e-05, 2.3856759071350098e-05, 3.37064266204834e-05, 4.35560941696167e-05, 5.340576171875e-05, 6.32554292678833e-05, 7.31050968170166e-05, 8.29547643661499e-05, 9.28044319152832e-05, 0.0001026540994644165, 0.0001125037670135498, 0.0001223534345626831, 0.0001322031021118164, 0.0001420527696609497, 0.000151902437210083, 0.0001617521047592163, 0.0001716017723083496, 0.0001814514398574829, 0.0001913011074066162, 0.0002011507749557495, 0.0002110004425048828]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 5.0, 5.0, 12.0, 13.0, 20.0, 23.0, 25.0, 40.0, 70.0, 102.0, 126.0, 221.0, 449.0, 788.0, 2070.0, 5213.0, 14472.0, 40920.0, 109081.0, 232511.0, 300290.0, 202541.0, 88099.0, 32154.0, 11607.0, 4282.0, 1732.0, 680.0, 359.0, 201.0, 120.0, 83.0, 41.0, 52.0, 30.0, 30.0, 15.0, 14.0, 12.0, 15.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26220703125, -0.2532844543457031, -0.24436187744140625, -0.23543930053710938, -0.2265167236328125, -0.21759414672851562, -0.20867156982421875, -0.19974899291992188, -0.190826416015625, -0.18190383911132812, -0.17298126220703125, -0.16405868530273438, -0.1551361083984375, -0.14621353149414062, -0.13729095458984375, -0.12836837768554688, -0.11944580078125, -0.11052322387695312, -0.10160064697265625, -0.09267807006835938, -0.0837554931640625, -0.07483291625976562, -0.06591033935546875, -0.056987762451171875, -0.048065185546875, -0.039142608642578125, -0.03022003173828125, -0.021297454833984375, -0.0123748779296875, -0.003452301025390625, 0.00547027587890625, 0.014392852783203125, 0.0233154296875, 0.032238006591796875, 0.04116058349609375, 0.050083160400390625, 0.0590057373046875, 0.06792831420898438, 0.07685089111328125, 0.08577346801757812, 0.094696044921875, 0.10361862182617188, 0.11254119873046875, 0.12146377563476562, 0.1303863525390625, 0.13930892944335938, 0.14823150634765625, 0.15715408325195312, 0.16607666015625, 0.17499923706054688, 0.18392181396484375, 0.19284439086914062, 0.2017669677734375, 0.21068954467773438, 0.21961212158203125, 0.22853469848632812, 0.237457275390625, 0.24637985229492188, 0.25530242919921875, 0.2642250061035156, 0.2731475830078125, 0.2820701599121094, 0.29099273681640625, 0.2999153137207031, 0.308837890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 6.0, 12.0, 13.0, 5.0, 13.0, 25.0, 15.0, 21.0, 27.0, 37.0, 30.0, 43.0, 37.0, 44.0, 44.0, 54.0, 71.0, 56.0, 56.0, 43.0, 47.0, 50.0, 35.0, 25.0, 43.0, 28.0, 14.0, 20.0, 16.0, 11.0, 9.0, 13.0, 5.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.101806640625, -0.09880733489990234, -0.09580802917480469, -0.09280872344970703, -0.08980941772460938, -0.08681011199951172, -0.08381080627441406, -0.0808115005493164, -0.07781219482421875, -0.0748128890991211, -0.07181358337402344, -0.06881427764892578, -0.06581497192382812, -0.06281566619873047, -0.05981636047363281, -0.056817054748535156, -0.0538177490234375, -0.050818443298339844, -0.04781913757324219, -0.04481983184814453, -0.041820526123046875, -0.03882122039794922, -0.03582191467285156, -0.032822608947753906, -0.02982330322265625, -0.026823997497558594, -0.023824691772460938, -0.02082538604736328, -0.017826080322265625, -0.014826774597167969, -0.011827468872070312, -0.008828163146972656, -0.005828857421875, -0.0028295516967773438, 0.0001697540283203125, 0.0031690597534179688, 0.006168365478515625, 0.009167671203613281, 0.012166976928710938, 0.015166282653808594, 0.01816558837890625, 0.021164894104003906, 0.024164199829101562, 0.02716350555419922, 0.030162811279296875, 0.03316211700439453, 0.03616142272949219, 0.039160728454589844, 0.0421600341796875, 0.045159339904785156, 0.04815864562988281, 0.05115795135498047, 0.054157257080078125, 0.05715656280517578, 0.06015586853027344, 0.0631551742553711, 0.06615447998046875, 0.0691537857055664, 0.07215309143066406, 0.07515239715576172, 0.07815170288085938, 0.08115100860595703, 0.08415031433105469, 0.08714962005615234, 0.09014892578125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 15.0, 40.0, 233.0, 402.0, 256.0, 49.0, 12.0, 3.0, 1.0], "bins": [-76.35668182373047, -75.05049133300781, -73.74429321289062, -72.43810272216797, -71.13191223144531, -69.82572174072266, -68.51952362060547, -67.21333312988281, -65.90714263916016, -64.6009521484375, -63.29475784301758, -61.988563537597656, -60.682373046875, -59.37617874145508, -58.06998825073242, -56.7637939453125, -55.45759963989258, -54.151405334472656, -52.84521484375, -51.53902053833008, -50.23283004760742, -48.9266357421875, -47.620445251464844, -46.31425094604492, -45.008056640625, -43.70186233520508, -42.39567184448242, -41.0894775390625, -39.783287048339844, -38.47709274291992, -37.170902252197266, -35.864707946777344, -34.55852127075195, -33.25232696533203, -31.946136474609375, -30.639944076538086, -29.333751678466797, -28.027557373046875, -26.721364974975586, -25.415172576904297, -24.108978271484375, -22.802785873413086, -21.496593475341797, -20.190401077270508, -18.88420867919922, -17.578014373779297, -16.271821975708008, -14.965629577636719, -13.659438133239746, -12.353245735168457, -11.047052383422852, -9.740859985351562, -8.434667587280273, -7.128475189208984, -5.822282314300537, -4.51608943939209, -3.209897041320801, -1.9037044048309326, -0.5975117683410645, 0.7086808681488037, 2.014873504638672, 3.321065902709961, 4.627258777618408, 5.9334516525268555, 7.2396440505981445]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 5.0, 8.0, 17.0, 13.0, 27.0, 28.0, 42.0, 56.0, 64.0, 63.0, 69.0, 74.0, 92.0, 66.0, 90.0, 58.0, 58.0, 31.0, 31.0, 36.0, 18.0, 18.0, 8.0, 14.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.512425422668457, -12.156085014343262, -11.79974365234375, -11.443403244018555, -11.08706283569336, -10.730722427368164, -10.374382019042969, -10.018040657043457, -9.661700248718262, -9.305359840393066, -8.949018478393555, -8.59267807006836, -8.236337661743164, -7.879997253417969, -7.523656368255615, -7.167315483093262, -6.810975074768066, -6.454634666442871, -6.098293781280518, -5.741952896118164, -5.385612487792969, -5.029272079467773, -4.67293119430542, -4.316590309143066, -3.960249900817871, -3.6039092540740967, -3.2475686073303223, -2.891227960586548, -2.5348873138427734, -2.178546667098999, -1.8222060203552246, -1.4658653736114502, -1.1095237731933594, -0.753183126449585, -0.39684247970581055, -0.04050183296203613, 0.3158388137817383, 0.6721794605255127, 1.028520107269287, 1.3848607540130615, 1.741201400756836, 2.0975420475006104, 2.4538826942443848, 2.810223340988159, 3.1665639877319336, 3.522904634475708, 3.8792452812194824, 4.235586166381836, 4.591926574707031, 4.948266983032227, 5.30460786819458, 5.660948753356934, 6.017289161682129, 6.373629570007324, 6.729970455169678, 7.086311340332031, 7.442651748657227, 7.798992156982422, 8.155332565307617, 8.511673927307129, 8.868014335632324, 9.22435474395752, 9.580696105957031, 9.937036514282227, 10.293376922607422]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 7.0, 9.0, 15.0, 17.0, 13.0, 19.0, 21.0, 24.0, 34.0, 60.0, 113.0, 239.0, 1096.0, 7811.0, 78731.0, 556906.0, 358923.0, 39161.0, 4216.0, 655.0, 179.0, 91.0, 51.0, 33.0, 27.0, 21.0, 14.0, 12.0, 6.0, 4.0, 14.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.109375, -13.63671875, -13.1640625, -12.69140625, -12.21875, -11.74609375, -11.2734375, -10.80078125, -10.328125, -9.85546875, -9.3828125, -8.91015625, -8.4375, -7.96484375, -7.4921875, -7.01953125, -6.546875, -6.07421875, -5.6015625, -5.12890625, -4.65625, -4.18359375, -3.7109375, -3.23828125, -2.765625, -2.29296875, -1.8203125, -1.34765625, -0.875, -0.40234375, 0.0703125, 0.54296875, 1.015625, 1.48828125, 1.9609375, 2.43359375, 2.90625, 3.37890625, 3.8515625, 4.32421875, 4.796875, 5.26953125, 5.7421875, 6.21484375, 6.6875, 7.16015625, 7.6328125, 8.10546875, 8.578125, 9.05078125, 9.5234375, 9.99609375, 10.46875, 10.94140625, 11.4140625, 11.88671875, 12.359375, 12.83203125, 13.3046875, 13.77734375, 14.25, 14.72265625, 15.1953125, 15.66796875, 16.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 6.0, 17.0, 25.0, 35.0, 56.0, 78.0, 80.0, 76.0, 108.0, 108.0, 103.0, 78.0, 64.0, 47.0, 31.0, 31.0, 26.0, 8.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-40.875, -40.0213623046875, -39.167724609375, -38.3140869140625, -37.46044921875, -36.6068115234375, -35.753173828125, -34.8995361328125, -34.0458984375, -33.1922607421875, -32.338623046875, -31.4849853515625, -30.63134765625, -29.7777099609375, -28.924072265625, -28.0704345703125, -27.216796875, -26.3631591796875, -25.509521484375, -24.6558837890625, -23.80224609375, -22.9486083984375, -22.094970703125, -21.2413330078125, -20.3876953125, -19.5340576171875, -18.680419921875, -17.8267822265625, -16.97314453125, -16.1195068359375, -15.265869140625, -14.4122314453125, -13.55859375, -12.7049560546875, -11.851318359375, -10.9976806640625, -10.14404296875, -9.2904052734375, -8.436767578125, -7.5831298828125, -6.7294921875, -5.8758544921875, -5.022216796875, -4.1685791015625, -3.31494140625, -2.4613037109375, -1.607666015625, -0.7540283203125, 0.099609375, 0.9532470703125, 1.806884765625, 2.6605224609375, 3.51416015625, 4.3677978515625, 5.221435546875, 6.0750732421875, 6.9287109375, 7.7823486328125, 8.635986328125, 9.4896240234375, 10.34326171875, 11.1968994140625, 12.050537109375, 12.9041748046875, 13.7578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 6.0, 8.0, 23.0, 25.0, 27.0, 49.0, 46.0, 65.0, 85.0, 88.0, 141.0, 150.0, 194.0, 220.0, 477.0, 1979.0, 30092.0, 615391.0, 381482.0, 15189.0, 1276.0, 455.0, 256.0, 170.0, 144.0, 102.0, 96.0, 67.0, 55.0, 34.0, 36.0, 34.0, 18.0, 15.0, 14.0, 12.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.625, -18.041015625, -17.45703125, -16.873046875, -16.2890625, -15.705078125, -15.12109375, -14.537109375, -13.953125, -13.369140625, -12.78515625, -12.201171875, -11.6171875, -11.033203125, -10.44921875, -9.865234375, -9.28125, -8.697265625, -8.11328125, -7.529296875, -6.9453125, -6.361328125, -5.77734375, -5.193359375, -4.609375, -4.025390625, -3.44140625, -2.857421875, -2.2734375, -1.689453125, -1.10546875, -0.521484375, 0.0625, 0.646484375, 1.23046875, 1.814453125, 2.3984375, 2.982421875, 3.56640625, 4.150390625, 4.734375, 5.318359375, 5.90234375, 6.486328125, 7.0703125, 7.654296875, 8.23828125, 8.822265625, 9.40625, 9.990234375, 10.57421875, 11.158203125, 11.7421875, 12.326171875, 12.91015625, 13.494140625, 14.078125, 14.662109375, 15.24609375, 15.830078125, 16.4140625, 16.998046875, 17.58203125, 18.166015625, 18.75]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 11.0, 24.0, 12.0, 17.0, 23.0, 25.0, 20.0, 35.0, 40.0, 39.0, 37.0, 45.0, 51.0, 55.0, 40.0, 49.0, 58.0, 48.0, 64.0, 36.0, 34.0, 46.0, 38.0, 23.0, 18.0, 20.0, 18.0, 14.0, 17.0, 12.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.9193115234375, -16.447998046875, -15.9766845703125, -15.50537109375, -15.0340576171875, -14.562744140625, -14.0914306640625, -13.6201171875, -13.1488037109375, -12.677490234375, -12.2061767578125, -11.73486328125, -11.2635498046875, -10.792236328125, -10.3209228515625, -9.849609375, -9.3782958984375, -8.906982421875, -8.4356689453125, -7.96435546875, -7.4930419921875, -7.021728515625, -6.5504150390625, -6.0791015625, -5.6077880859375, -5.136474609375, -4.6651611328125, -4.19384765625, -3.7225341796875, -3.251220703125, -2.7799072265625, -2.30859375, -1.8372802734375, -1.365966796875, -0.8946533203125, -0.42333984375, 0.0479736328125, 0.519287109375, 0.9906005859375, 1.4619140625, 1.9332275390625, 2.404541015625, 2.8758544921875, 3.34716796875, 3.8184814453125, 4.289794921875, 4.7611083984375, 5.232421875, 5.7037353515625, 6.175048828125, 6.6463623046875, 7.11767578125, 7.5889892578125, 8.060302734375, 8.5316162109375, 9.0029296875, 9.4742431640625, 9.945556640625, 10.4168701171875, 10.88818359375, 11.3594970703125, 11.830810546875, 12.3021240234375, 12.7734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 11.0, 18.0, 40.0, 104.0, 319.0, 1958.0, 66116.0, 964689.0, 13823.0, 1069.0, 243.0, 85.0, 43.0, 13.0, 9.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4844970703125, -12.086181640625, -11.6878662109375, -11.28955078125, -10.8912353515625, -10.492919921875, -10.0946044921875, -9.6962890625, -9.2979736328125, -8.899658203125, -8.5013427734375, -8.10302734375, -7.7047119140625, -7.306396484375, -6.9080810546875, -6.509765625, -6.1114501953125, -5.713134765625, -5.3148193359375, -4.91650390625, -4.5181884765625, -4.119873046875, -3.7215576171875, -3.3232421875, -2.9249267578125, -2.526611328125, -2.1282958984375, -1.72998046875, -1.3316650390625, -0.933349609375, -0.5350341796875, -0.13671875, 0.2615966796875, 0.659912109375, 1.0582275390625, 1.45654296875, 1.8548583984375, 2.253173828125, 2.6514892578125, 3.0498046875, 3.4481201171875, 3.846435546875, 4.2447509765625, 4.64306640625, 5.0413818359375, 5.439697265625, 5.8380126953125, 6.236328125, 6.6346435546875, 7.032958984375, 7.4312744140625, 7.82958984375, 8.2279052734375, 8.626220703125, 9.0245361328125, 9.4228515625, 9.8211669921875, 10.219482421875, 10.6177978515625, 11.01611328125, 11.4144287109375, 11.812744140625, 12.2110595703125, 12.609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 4.0, 9.0, 11.0, 28.0, 34.0, 39.0, 67.0, 80.0, 109.0, 117.0, 98.0, 99.0, 81.0, 78.0, 44.0, 32.0, 17.0, 13.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00057220458984375, -0.0005515366792678833, -0.0005308687686920166, -0.0005102008581161499, -0.0004895329475402832, -0.0004688650369644165, -0.0004481971263885498, -0.0004275292158126831, -0.0004068613052368164, -0.0003861933946609497, -0.000365525484085083, -0.0003448575735092163, -0.0003241896629333496, -0.0003035217523574829, -0.0002828538417816162, -0.0002621859312057495, -0.0002415180206298828, -0.0002208501100540161, -0.00020018219947814941, -0.00017951428890228271, -0.00015884637832641602, -0.00013817846775054932, -0.00011751055717468262, -9.684264659881592e-05, -7.617473602294922e-05, -5.550682544708252e-05, -3.483891487121582e-05, -1.4171004295349121e-05, 6.496906280517578e-06, 2.7164816856384277e-05, 4.7832727432250977e-05, 6.850063800811768e-05, 8.916854858398438e-05, 0.00010983645915985107, 0.00013050436973571777, 0.00015117228031158447, 0.00017184019088745117, 0.00019250810146331787, 0.00021317601203918457, 0.00023384392261505127, 0.00025451183319091797, 0.00027517974376678467, 0.00029584765434265137, 0.00031651556491851807, 0.00033718347549438477, 0.00035785138607025146, 0.00037851929664611816, 0.00039918720722198486, 0.00041985511779785156, 0.00044052302837371826, 0.00046119093894958496, 0.00048185884952545166, 0.0005025267601013184, 0.0005231946706771851, 0.0005438625812530518, 0.0005645304918289185, 0.0005851984024047852, 0.0006058663129806519, 0.0006265342235565186, 0.0006472021341323853, 0.000667870044708252, 0.0006885379552841187, 0.0007092058658599854, 0.000729873776435852, 0.0007505416870117188]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 19.0, 30.0, 33.0, 82.0, 203.0, 796.0, 7064.0, 569680.0, 463358.0, 6169.0, 717.0, 188.0, 91.0, 41.0, 21.0, 12.0, 6.0, 7.0, 4.0, 9.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.4453125, -12.0894775390625, -11.733642578125, -11.3778076171875, -11.02197265625, -10.6661376953125, -10.310302734375, -9.9544677734375, -9.5986328125, -9.2427978515625, -8.886962890625, -8.5311279296875, -8.17529296875, -7.8194580078125, -7.463623046875, -7.1077880859375, -6.751953125, -6.3961181640625, -6.040283203125, -5.6844482421875, -5.32861328125, -4.9727783203125, -4.616943359375, -4.2611083984375, -3.9052734375, -3.5494384765625, -3.193603515625, -2.8377685546875, -2.48193359375, -2.1260986328125, -1.770263671875, -1.4144287109375, -1.05859375, -0.7027587890625, -0.346923828125, 0.0089111328125, 0.36474609375, 0.7205810546875, 1.076416015625, 1.4322509765625, 1.7880859375, 2.1439208984375, 2.499755859375, 2.8555908203125, 3.21142578125, 3.5672607421875, 3.923095703125, 4.2789306640625, 4.634765625, 4.9906005859375, 5.346435546875, 5.7022705078125, 6.05810546875, 6.4139404296875, 6.769775390625, 7.1256103515625, 7.4814453125, 7.8372802734375, 8.193115234375, 8.5489501953125, 8.90478515625, 9.2606201171875, 9.616455078125, 9.9722900390625, 10.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 10.0, 9.0, 10.0, 15.0, 30.0, 37.0, 58.0, 72.0, 85.0, 134.0, 128.0, 101.0, 89.0, 74.0, 46.0, 36.0, 21.0, 20.0, 7.0, 11.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8115386962890625, -1.745147705078125, -1.6787567138671875, -1.61236572265625, -1.5459747314453125, -1.479583740234375, -1.4131927490234375, -1.3468017578125, -1.2804107666015625, -1.214019775390625, -1.1476287841796875, -1.08123779296875, -1.0148468017578125, -0.948455810546875, -0.8820648193359375, -0.815673828125, -0.7492828369140625, -0.682891845703125, -0.6165008544921875, -0.55010986328125, -0.4837188720703125, -0.417327880859375, -0.3509368896484375, -0.2845458984375, -0.2181549072265625, -0.151763916015625, -0.0853729248046875, -0.01898193359375, 0.0474090576171875, 0.113800048828125, 0.1801910400390625, 0.24658203125, 0.3129730224609375, 0.379364013671875, 0.4457550048828125, 0.51214599609375, 0.5785369873046875, 0.644927978515625, 0.7113189697265625, 0.7777099609375, 0.8441009521484375, 0.910491943359375, 0.9768829345703125, 1.04327392578125, 1.1096649169921875, 1.176055908203125, 1.2424468994140625, 1.308837890625, 1.3752288818359375, 1.441619873046875, 1.5080108642578125, 1.57440185546875, 1.6407928466796875, 1.707183837890625, 1.7735748291015625, 1.8399658203125, 1.9063568115234375, 1.972747802734375, 2.0391387939453125, 2.10552978515625, 2.1719207763671875, 2.238311767578125, 2.3047027587890625, 2.37109375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 10.0, 28.0, 54.0, 127.0, 256.0, 256.0, 160.0, 76.0, 23.0, 13.0, 5.0, 2.0, 1.0, 1.0], "bins": [-88.96086120605469, -87.34244537353516, -85.72402954101562, -84.1056137084961, -82.48719787597656, -80.8687744140625, -79.25035858154297, -77.63194274902344, -76.0135269165039, -74.39511108398438, -72.77669525146484, -71.15827941894531, -69.53985595703125, -67.92144012451172, -66.30302429199219, -64.68460845947266, -63.066192626953125, -61.447776794433594, -59.82936096191406, -58.210941314697266, -56.592525482177734, -54.9741096496582, -53.355690002441406, -51.737274169921875, -50.118858337402344, -48.50044250488281, -46.88202667236328, -45.263607025146484, -43.64519119262695, -42.02677536010742, -40.408355712890625, -38.789939880371094, -37.17152404785156, -35.55310821533203, -33.9346923828125, -32.3162727355957, -30.697856903076172, -29.07944107055664, -27.461023330688477, -25.842605590820312, -24.22418975830078, -22.60577392578125, -20.987356185913086, -19.368938446044922, -17.75052261352539, -16.13210678100586, -14.513689041137695, -12.895272254943848, -11.276856422424316, -9.658439636230469, -8.040022850036621, -6.421606063842773, -4.803189277648926, -3.184772491455078, -1.5663557052612305, 0.05206108093261719, 1.6704778671264648, 3.2888946533203125, 4.90731143951416, 6.525728225708008, 8.144145011901855, 9.762561798095703, 11.38097858428955, 12.999395370483398, 14.617812156677246]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 9.0, 17.0, 12.0, 28.0, 32.0, 30.0, 39.0, 41.0, 45.0, 43.0, 64.0, 66.0, 52.0, 65.0, 55.0, 49.0, 64.0, 64.0, 51.0, 29.0, 28.0, 25.0, 23.0, 12.0, 14.0, 12.0, 7.0, 10.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-43.18204879760742, -42.19626998901367, -41.210487365722656, -40.224708557128906, -39.238929748535156, -38.25314712524414, -37.26736831665039, -36.28158950805664, -35.295806884765625, -34.310028076171875, -33.32424545288086, -32.33846664428711, -31.352685928344727, -30.366905212402344, -29.381126403808594, -28.39534568786621, -27.40956687927246, -26.423786163330078, -25.438007354736328, -24.452226638793945, -23.466445922851562, -22.480667114257812, -21.49488639831543, -20.509105682373047, -19.523326873779297, -18.537546157836914, -17.551767349243164, -16.56598663330078, -15.580205917358398, -14.594426155090332, -13.608646392822266, -12.622865676879883, -11.637086868286133, -10.651307106018066, -9.665526390075684, -8.679746627807617, -7.693966388702393, -6.708186149597168, -5.722406387329102, -4.736626148223877, -3.7508459091186523, -2.7650656700134277, -1.7792856693267822, -0.7935056686401367, 0.1922745704650879, 1.1780548095703125, 2.163834571838379, 3.1496148109436035, 4.135395050048828, 5.121175289154053, 6.106955528259277, 7.092735290527344, 8.078516006469727, 9.064295768737793, 10.05007553100586, 11.035856246948242, 12.021636009216309, 13.007415771484375, 13.993196487426758, 14.978976249694824, 15.96475601196289, 16.950536727905273, 17.936317443847656, 18.922096252441406, 19.90787696838379]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 5.0, 8.0, 12.0, 10.0, 12.0, 25.0, 26.0, 45.0, 63.0, 103.0, 147.0, 225.0, 447.0, 1045.0, 4154.0, 35170.0, 525693.0, 2827970.0, 737654.0, 52661.0, 6147.0, 1315.0, 495.0, 258.0, 150.0, 100.0, 83.0, 60.0, 46.0, 32.0, 30.0, 22.0, 16.0, 9.0, 8.0, 9.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0], "bins": [-18.015625, -17.46240234375, -16.9091796875, -16.35595703125, -15.802734375, -15.24951171875, -14.6962890625, -14.14306640625, -13.58984375, -13.03662109375, -12.4833984375, -11.93017578125, -11.376953125, -10.82373046875, -10.2705078125, -9.71728515625, -9.1640625, -8.61083984375, -8.0576171875, -7.50439453125, -6.951171875, -6.39794921875, -5.8447265625, -5.29150390625, -4.73828125, -4.18505859375, -3.6318359375, -3.07861328125, -2.525390625, -1.97216796875, -1.4189453125, -0.86572265625, -0.3125, 0.24072265625, 0.7939453125, 1.34716796875, 1.900390625, 2.45361328125, 3.0068359375, 3.56005859375, 4.11328125, 4.66650390625, 5.2197265625, 5.77294921875, 6.326171875, 6.87939453125, 7.4326171875, 7.98583984375, 8.5390625, 9.09228515625, 9.6455078125, 10.19873046875, 10.751953125, 11.30517578125, 11.8583984375, 12.41162109375, 12.96484375, 13.51806640625, 14.0712890625, 14.62451171875, 15.177734375, 15.73095703125, 16.2841796875, 16.83740234375, 17.390625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 6.0, 9.0, 10.0, 24.0, 27.0, 27.0, 44.0, 35.0, 34.0, 50.0, 63.0, 53.0, 60.0, 59.0, 64.0, 56.0, 62.0, 51.0, 50.0, 37.0, 37.0, 29.0, 19.0, 21.0, 15.0, 11.0, 7.0, 10.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-14.8671875, -14.4913330078125, -14.115478515625, -13.7396240234375, -13.36376953125, -12.9879150390625, -12.612060546875, -12.2362060546875, -11.8603515625, -11.4844970703125, -11.108642578125, -10.7327880859375, -10.35693359375, -9.9810791015625, -9.605224609375, -9.2293701171875, -8.853515625, -8.4776611328125, -8.101806640625, -7.7259521484375, -7.35009765625, -6.9742431640625, -6.598388671875, -6.2225341796875, -5.8466796875, -5.4708251953125, -5.094970703125, -4.7191162109375, -4.34326171875, -3.9674072265625, -3.591552734375, -3.2156982421875, -2.83984375, -2.4639892578125, -2.088134765625, -1.7122802734375, -1.33642578125, -0.9605712890625, -0.584716796875, -0.2088623046875, 0.1669921875, 0.5428466796875, 0.918701171875, 1.2945556640625, 1.67041015625, 2.0462646484375, 2.422119140625, 2.7979736328125, 3.173828125, 3.5496826171875, 3.925537109375, 4.3013916015625, 4.67724609375, 5.0531005859375, 5.428955078125, 5.8048095703125, 6.1806640625, 6.5565185546875, 6.932373046875, 7.3082275390625, 7.68408203125, 8.0599365234375, 8.435791015625, 8.8116455078125, 9.1875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 9.0, 10.0, 15.0, 35.0, 105.0, 263.0, 826.0, 4922.0, 1493550.0, 2686728.0, 6455.0, 934.0, 267.0, 82.0, 39.0, 30.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -14.961181640625, -13.71923828125, -12.477294921875, -11.2353515625, -9.993408203125, -8.75146484375, -7.509521484375, -6.267578125, -5.025634765625, -3.78369140625, -2.541748046875, -1.2998046875, -0.057861328125, 1.18408203125, 2.426025390625, 3.66796875, 4.909912109375, 6.15185546875, 7.393798828125, 8.6357421875, 9.877685546875, 11.11962890625, 12.361572265625, 13.603515625, 14.845458984375, 16.08740234375, 17.329345703125, 18.5712890625, 19.813232421875, 21.05517578125, 22.297119140625, 23.5390625, 24.781005859375, 26.02294921875, 27.264892578125, 28.5068359375, 29.748779296875, 30.99072265625, 32.232666015625, 33.474609375, 34.716552734375, 35.95849609375, 37.200439453125, 38.4423828125, 39.684326171875, 40.92626953125, 42.168212890625, 43.41015625, 44.652099609375, 45.89404296875, 47.135986328125, 48.3779296875, 49.619873046875, 50.86181640625, 52.103759765625, 53.345703125, 54.587646484375, 55.82958984375, 57.071533203125, 58.3134765625, 59.555419921875, 60.79736328125, 62.039306640625, 63.28125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 10.0, 20.0, 20.0, 32.0, 49.0, 66.0, 111.0, 173.0, 267.0, 394.0, 563.0, 576.0, 530.0, 392.0, 294.0, 212.0, 106.0, 86.0, 56.0, 43.0, 20.0, 13.0, 8.0, 6.0, 2.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.69921875, -5.56182861328125, -5.4244384765625, -5.28704833984375, -5.149658203125, -5.01226806640625, -4.8748779296875, -4.73748779296875, -4.60009765625, -4.46270751953125, -4.3253173828125, -4.18792724609375, -4.050537109375, -3.91314697265625, -3.7757568359375, -3.63836669921875, -3.5009765625, -3.36358642578125, -3.2261962890625, -3.08880615234375, -2.951416015625, -2.81402587890625, -2.6766357421875, -2.53924560546875, -2.40185546875, -2.26446533203125, -2.1270751953125, -1.98968505859375, -1.852294921875, -1.71490478515625, -1.5775146484375, -1.44012451171875, -1.302734375, -1.16534423828125, -1.0279541015625, -0.89056396484375, -0.753173828125, -0.61578369140625, -0.4783935546875, -0.34100341796875, -0.20361328125, -0.06622314453125, 0.0711669921875, 0.20855712890625, 0.345947265625, 0.48333740234375, 0.6207275390625, 0.75811767578125, 0.8955078125, 1.03289794921875, 1.1702880859375, 1.30767822265625, 1.445068359375, 1.58245849609375, 1.7198486328125, 1.85723876953125, 1.99462890625, 2.13201904296875, 2.2694091796875, 2.40679931640625, 2.544189453125, 2.68157958984375, 2.8189697265625, 2.95635986328125, 3.09375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 17.0, 27.0, 30.0, 44.0, 90.0, 118.0, 143.0, 131.0, 119.0, 105.0, 68.0, 43.0, 27.0, 11.0, 12.0, 2.0, 5.0, 3.0, 0.0, 2.0], "bins": [-35.1694450378418, -34.47749328613281, -33.78554153442383, -33.093589782714844, -32.40163803100586, -31.709684371948242, -31.017732620239258, -30.32577896118164, -29.633827209472656, -28.941875457763672, -28.249923706054688, -27.55797004699707, -26.866018295288086, -26.1740665435791, -25.482114791870117, -24.7901611328125, -24.098209381103516, -23.40625762939453, -22.714305877685547, -22.02235221862793, -21.330400466918945, -20.63844871520996, -19.946496963500977, -19.25454330444336, -18.562593460083008, -17.870641708374023, -17.17868995666504, -16.486736297607422, -15.794784545898438, -15.102832794189453, -14.410881042480469, -13.718928337097168, -13.026976585388184, -12.3350248336792, -11.643072128295898, -10.951120376586914, -10.259167671203613, -9.567215919494629, -8.875263214111328, -8.183311462402344, -7.491359233856201, -6.799407005310059, -6.107454776763916, -5.415502548217773, -4.723550796508789, -4.031598091125488, -3.339646339416504, -2.6476941108703613, -1.9557418823242188, -1.2637896537780762, -0.5718375444412231, 0.12011456489562988, 0.8120667934417725, 1.504019021987915, 2.1959710121154785, 2.887923240661621, 3.5798754692077637, 4.271827697753906, 4.963779926300049, 5.655732154846191, 6.347683906555176, 7.039636611938477, 7.731588363647461, 8.423540115356445, 9.115492820739746]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 9.0, 10.0, 16.0, 14.0, 21.0, 33.0, 30.0, 37.0, 55.0, 53.0, 56.0, 56.0, 73.0, 58.0, 72.0, 57.0, 67.0, 52.0, 54.0, 43.0, 29.0, 26.0, 15.0, 17.0, 13.0, 7.0, 10.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.321880340576172, -15.85970687866211, -15.39753246307373, -14.935358047485352, -14.473184585571289, -14.011011123657227, -13.548836708068848, -13.086662292480469, -12.624488830566406, -12.162315368652344, -11.700140953063965, -11.237966537475586, -10.775793075561523, -10.313619613647461, -9.851445198059082, -9.389270782470703, -8.92709732055664, -8.464923858642578, -8.0027494430542, -7.5405755043029785, -7.078401565551758, -6.616227626800537, -6.154053688049316, -5.691879749298096, -5.229705810546875, -4.767531871795654, -4.305357933044434, -3.843183994293213, -3.381010055541992, -2.9188361167907715, -2.456662178039551, -1.99448823928833, -1.5323152542114258, -1.070141315460205, -0.6079673767089844, -0.14579343795776367, 0.31638050079345703, 0.7785544395446777, 1.2407283782958984, 1.7029023170471191, 2.16507625579834, 2.6272501945495605, 3.0894241333007812, 3.551598072052002, 4.013772010803223, 4.475945949554443, 4.938119888305664, 5.400293827056885, 5.8624677658081055, 6.324641704559326, 6.786815643310547, 7.248989582061768, 7.711163520812988, 8.173337936401367, 8.63551139831543, 9.097684860229492, 9.559859275817871, 10.02203369140625, 10.484207153320312, 10.946380615234375, 11.408555030822754, 11.870729446411133, 12.332902908325195, 12.795076370239258, 13.257250785827637]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 8.0, 5.0, 10.0, 15.0, 11.0, 15.0, 35.0, 59.0, 79.0, 126.0, 226.0, 360.0, 765.0, 1854.0, 4660.0, 14597.0, 57353.0, 242781.0, 460652.0, 199783.0, 45822.0, 12264.0, 3955.0, 1543.0, 650.0, 326.0, 208.0, 103.0, 77.0, 50.0, 34.0, 22.0, 27.0, 17.0, 13.0, 8.0, 15.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.88671875, -2.80035400390625, -2.7139892578125, -2.62762451171875, -2.541259765625, -2.45489501953125, -2.3685302734375, -2.28216552734375, -2.19580078125, -2.10943603515625, -2.0230712890625, -1.93670654296875, -1.850341796875, -1.76397705078125, -1.6776123046875, -1.59124755859375, -1.5048828125, -1.41851806640625, -1.3321533203125, -1.24578857421875, -1.159423828125, -1.07305908203125, -0.9866943359375, -0.90032958984375, -0.81396484375, -0.72760009765625, -0.6412353515625, -0.55487060546875, -0.468505859375, -0.38214111328125, -0.2957763671875, -0.20941162109375, -0.123046875, -0.03668212890625, 0.0496826171875, 0.13604736328125, 0.222412109375, 0.30877685546875, 0.3951416015625, 0.48150634765625, 0.56787109375, 0.65423583984375, 0.7406005859375, 0.82696533203125, 0.913330078125, 0.99969482421875, 1.0860595703125, 1.17242431640625, 1.2587890625, 1.34515380859375, 1.4315185546875, 1.51788330078125, 1.604248046875, 1.69061279296875, 1.7769775390625, 1.86334228515625, 1.94970703125, 2.03607177734375, 2.1224365234375, 2.20880126953125, 2.295166015625, 2.38153076171875, 2.4678955078125, 2.55426025390625, 2.640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 6.0, 3.0, 4.0, 18.0, 15.0, 35.0, 46.0, 68.0, 88.0, 96.0, 109.0, 114.0, 101.0, 98.0, 65.0, 51.0, 36.0, 19.0, 14.0, 10.0, 8.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.556884765625, -13.03564453125, -12.514404296875, -11.9931640625, -11.471923828125, -10.95068359375, -10.429443359375, -9.908203125, -9.386962890625, -8.86572265625, -8.344482421875, -7.8232421875, -7.302001953125, -6.78076171875, -6.259521484375, -5.73828125, -5.217041015625, -4.69580078125, -4.174560546875, -3.6533203125, -3.132080078125, -2.61083984375, -2.089599609375, -1.568359375, -1.047119140625, -0.52587890625, -0.004638671875, 0.5166015625, 1.037841796875, 1.55908203125, 2.080322265625, 2.6015625, 3.122802734375, 3.64404296875, 4.165283203125, 4.6865234375, 5.207763671875, 5.72900390625, 6.250244140625, 6.771484375, 7.292724609375, 7.81396484375, 8.335205078125, 8.8564453125, 9.377685546875, 9.89892578125, 10.420166015625, 10.94140625, 11.462646484375, 11.98388671875, 12.505126953125, 13.0263671875, 13.547607421875, 14.06884765625, 14.590087890625, 15.111328125, 15.632568359375, 16.15380859375, 16.675048828125, 17.1962890625, 17.717529296875, 18.23876953125, 18.760009765625, 19.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 4.0, 7.0, 9.0, 9.0, 22.0, 23.0, 54.0, 88.0, 101.0, 164.0, 369.0, 606.0, 1069.0, 2067.0, 3748.0, 7332.0, 14427.0, 29985.0, 62623.0, 127383.0, 216162.0, 243063.0, 167526.0, 87858.0, 42276.0, 20044.0, 10197.0, 5126.0, 2746.0, 1465.0, 817.0, 440.0, 276.0, 153.0, 111.0, 71.0, 38.0, 30.0, 26.0, 8.0, 8.0, 10.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107421875, -0.969024658203125, -0.92730712890625, -0.885589599609375, -0.8438720703125, -0.802154541015625, -0.76043701171875, -0.718719482421875, -0.677001953125, -0.635284423828125, -0.59356689453125, -0.551849365234375, -0.5101318359375, -0.468414306640625, -0.42669677734375, -0.384979248046875, -0.34326171875, -0.301544189453125, -0.25982666015625, -0.218109130859375, -0.1763916015625, -0.134674072265625, -0.09295654296875, -0.051239013671875, -0.009521484375, 0.032196044921875, 0.07391357421875, 0.115631103515625, 0.1573486328125, 0.199066162109375, 0.24078369140625, 0.282501220703125, 0.32421875, 0.365936279296875, 0.40765380859375, 0.449371337890625, 0.4910888671875, 0.532806396484375, 0.57452392578125, 0.616241455078125, 0.657958984375, 0.699676513671875, 0.74139404296875, 0.783111572265625, 0.8248291015625, 0.866546630859375, 0.90826416015625, 0.949981689453125, 0.99169921875, 1.033416748046875, 1.07513427734375, 1.116851806640625, 1.1585693359375, 1.200286865234375, 1.24200439453125, 1.283721923828125, 1.325439453125, 1.367156982421875, 1.40887451171875, 1.450592041015625, 1.4923095703125, 1.534027099609375, 1.57574462890625, 1.617462158203125, 1.6591796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 8.0, 7.0, 15.0, 18.0, 14.0, 22.0, 21.0, 24.0, 27.0, 46.0, 36.0, 50.0, 41.0, 51.0, 41.0, 41.0, 46.0, 48.0, 45.0, 43.0, 41.0, 43.0, 43.0, 25.0, 32.0, 25.0, 19.0, 23.0, 11.0, 15.0, 16.0, 15.0, 5.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.875, -13.368408203125, -12.86181640625, -12.355224609375, -11.8486328125, -11.342041015625, -10.83544921875, -10.328857421875, -9.822265625, -9.315673828125, -8.80908203125, -8.302490234375, -7.7958984375, -7.289306640625, -6.78271484375, -6.276123046875, -5.76953125, -5.262939453125, -4.75634765625, -4.249755859375, -3.7431640625, -3.236572265625, -2.72998046875, -2.223388671875, -1.716796875, -1.210205078125, -0.70361328125, -0.197021484375, 0.3095703125, 0.816162109375, 1.32275390625, 1.829345703125, 2.3359375, 2.842529296875, 3.34912109375, 3.855712890625, 4.3623046875, 4.868896484375, 5.37548828125, 5.882080078125, 6.388671875, 6.895263671875, 7.40185546875, 7.908447265625, 8.4150390625, 8.921630859375, 9.42822265625, 9.934814453125, 10.44140625, 10.947998046875, 11.45458984375, 11.961181640625, 12.4677734375, 12.974365234375, 13.48095703125, 13.987548828125, 14.494140625, 15.000732421875, 15.50732421875, 16.013916015625, 16.5205078125, 17.027099609375, 17.53369140625, 18.040283203125, 18.546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 15.0, 26.0, 20.0, 24.0, 51.0, 83.0, 132.0, 312.0, 565.0, 1198.0, 2701.0, 8310.0, 35876.0, 203568.0, 543389.0, 203125.0, 35683.0, 8340.0, 2742.0, 1156.0, 523.0, 288.0, 144.0, 90.0, 46.0, 40.0, 23.0, 20.0, 10.0, 6.0, 3.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5721588134765625, -0.550567626953125, -0.5289764404296875, -0.50738525390625, -0.4857940673828125, -0.464202880859375, -0.4426116943359375, -0.4210205078125, -0.3994293212890625, -0.377838134765625, -0.3562469482421875, -0.33465576171875, -0.3130645751953125, -0.291473388671875, -0.2698822021484375, -0.248291015625, -0.2266998291015625, -0.205108642578125, -0.1835174560546875, -0.16192626953125, -0.1403350830078125, -0.118743896484375, -0.0971527099609375, -0.0755615234375, -0.0539703369140625, -0.032379150390625, -0.0107879638671875, 0.01080322265625, 0.0323944091796875, 0.053985595703125, 0.0755767822265625, 0.09716796875, 0.1187591552734375, 0.140350341796875, 0.1619415283203125, 0.18353271484375, 0.2051239013671875, 0.226715087890625, 0.2483062744140625, 0.2698974609375, 0.2914886474609375, 0.313079833984375, 0.3346710205078125, 0.35626220703125, 0.3778533935546875, 0.399444580078125, 0.4210357666015625, 0.442626953125, 0.4642181396484375, 0.485809326171875, 0.5074005126953125, 0.52899169921875, 0.5505828857421875, 0.572174072265625, 0.5937652587890625, 0.6153564453125, 0.6369476318359375, 0.658538818359375, 0.6801300048828125, 0.70172119140625, 0.7233123779296875, 0.744903564453125, 0.7664947509765625, 0.7880859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 12.0, 3.0, 4.0, 10.0, 11.0, 28.0, 19.0, 41.0, 51.0, 55.0, 58.0, 71.0, 85.0, 85.0, 78.0, 72.0, 69.0, 64.0, 44.0, 39.0, 32.0, 23.0, 9.0, 7.0, 6.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002168416976928711, -0.0002092067152261734, -0.0002015717327594757, -0.00019393675029277802, -0.00018630176782608032, -0.00017866678535938263, -0.00017103180289268494, -0.00016339682042598724, -0.00015576183795928955, -0.00014812685549259186, -0.00014049187302589417, -0.00013285689055919647, -0.00012522190809249878, -0.00011758692562580109, -0.0001099519431591034, -0.0001023169606924057, -9.468197822570801e-05, -8.704699575901031e-05, -7.941201329231262e-05, -7.177703082561493e-05, -6.414204835891724e-05, -5.6507065892219543e-05, -4.887208342552185e-05, -4.123710095882416e-05, -3.3602118492126465e-05, -2.5967136025428772e-05, -1.833215355873108e-05, -1.0697171092033386e-05, -3.0621886253356934e-06, 4.5727938413619995e-06, 1.2207776308059692e-05, 1.9842758774757385e-05, 2.7477741241455078e-05, 3.511272370815277e-05, 4.2747706174850464e-05, 5.038268864154816e-05, 5.801767110824585e-05, 6.565265357494354e-05, 7.328763604164124e-05, 8.092261850833893e-05, 8.855760097503662e-05, 9.619258344173431e-05, 0.00010382756590843201, 0.0001114625483751297, 0.00011909753084182739, 0.00012673251330852509, 0.00013436749577522278, 0.00014200247824192047, 0.00014963746070861816, 0.00015727244317531586, 0.00016490742564201355, 0.00017254240810871124, 0.00018017739057540894, 0.00018781237304210663, 0.00019544735550880432, 0.00020308233797550201, 0.0002107173204421997, 0.0002183523029088974, 0.0002259872853755951, 0.00023362226784229279, 0.00024125725030899048, 0.00024889223277568817, 0.00025652721524238586, 0.00026416219770908356, 0.00027179718017578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 2.0, 12.0, 15.0, 15.0, 28.0, 36.0, 53.0, 62.0, 116.0, 201.0, 320.0, 719.0, 1767.0, 6073.0, 27395.0, 131511.0, 422850.0, 345043.0, 87429.0, 18066.0, 4282.0, 1264.0, 530.0, 256.0, 157.0, 116.0, 66.0, 42.0, 31.0, 28.0, 22.0, 10.0, 9.0, 5.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3864021301269531, -0.37021636962890625, -0.3540306091308594, -0.3378448486328125, -0.3216590881347656, -0.30547332763671875, -0.2892875671386719, -0.273101806640625, -0.2569160461425781, -0.24073028564453125, -0.22454452514648438, -0.2083587646484375, -0.19217300415039062, -0.17598724365234375, -0.15980148315429688, -0.14361572265625, -0.12742996215820312, -0.11124420166015625, -0.09505844116210938, -0.0788726806640625, -0.06268692016601562, -0.04650115966796875, -0.030315399169921875, -0.014129638671875, 0.002056121826171875, 0.01824188232421875, 0.034427642822265625, 0.0506134033203125, 0.06679916381835938, 0.08298492431640625, 0.09917068481445312, 0.1153564453125, 0.13154220581054688, 0.14772796630859375, 0.16391372680664062, 0.1800994873046875, 0.19628524780273438, 0.21247100830078125, 0.22865676879882812, 0.244842529296875, 0.2610282897949219, 0.27721405029296875, 0.2933998107910156, 0.3095855712890625, 0.3257713317871094, 0.34195709228515625, 0.3581428527832031, 0.37432861328125, 0.3905143737792969, 0.40670013427734375, 0.4228858947753906, 0.4390716552734375, 0.4552574157714844, 0.47144317626953125, 0.4876289367675781, 0.503814697265625, 0.5200004577636719, 0.5361862182617188, 0.5523719787597656, 0.5685577392578125, 0.5847434997558594, 0.6009292602539062, 0.6171150207519531, 0.63330078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 6.0, 5.0, 6.0, 9.0, 9.0, 14.0, 12.0, 21.0, 27.0, 30.0, 34.0, 47.0, 59.0, 70.0, 81.0, 78.0, 84.0, 77.0, 71.0, 64.0, 42.0, 36.0, 28.0, 19.0, 17.0, 13.0, 12.0, 11.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2303466796875, -0.2247447967529297, -0.21914291381835938, -0.21354103088378906, -0.20793914794921875, -0.20233726501464844, -0.19673538208007812, -0.1911334991455078, -0.1855316162109375, -0.1799297332763672, -0.17432785034179688, -0.16872596740722656, -0.16312408447265625, -0.15752220153808594, -0.15192031860351562, -0.1463184356689453, -0.140716552734375, -0.1351146697998047, -0.12951278686523438, -0.12391090393066406, -0.11830902099609375, -0.11270713806152344, -0.10710525512695312, -0.10150337219238281, -0.0959014892578125, -0.09029960632324219, -0.08469772338867188, -0.07909584045410156, -0.07349395751953125, -0.06789207458496094, -0.062290191650390625, -0.05668830871582031, -0.05108642578125, -0.04548454284667969, -0.039882659912109375, -0.03428077697753906, -0.02867889404296875, -0.023077011108398438, -0.017475128173828125, -0.011873245239257812, -0.0062713623046875, -0.0006694793701171875, 0.004932403564453125, 0.010534286499023438, 0.01613616943359375, 0.021738052368164062, 0.027339935302734375, 0.03294181823730469, 0.038543701171875, 0.04414558410644531, 0.049747467041015625, 0.05534934997558594, 0.06095123291015625, 0.06655311584472656, 0.07215499877929688, 0.07775688171386719, 0.0833587646484375, 0.08896064758300781, 0.09456253051757812, 0.10016441345214844, 0.10576629638671875, 0.11136817932128906, 0.11697006225585938, 0.12257194519042969, 0.128173828125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 33.0, 140.0, 402.0, 325.0, 87.0, 13.0, 4.0, 3.0], "bins": [-79.73932647705078, -78.38194274902344, -77.0245590209961, -75.66718292236328, -74.30979919433594, -72.9524154663086, -71.59503173828125, -70.2376480102539, -68.8802719116211, -67.52288818359375, -66.1655044555664, -64.8081283569336, -63.45074462890625, -62.093360900878906, -60.73597717285156, -59.378597259521484, -58.021209716796875, -56.66382598876953, -55.30644607543945, -53.94906234741211, -52.59168243408203, -51.23429870605469, -49.876914978027344, -48.519535064697266, -47.16215515136719, -45.804771423339844, -44.447391510009766, -43.09000778198242, -41.732627868652344, -40.375244140625, -39.017860412597656, -37.66048049926758, -36.303096771240234, -34.94571304321289, -33.58833312988281, -32.23094940185547, -30.873567581176758, -29.516185760498047, -28.158803939819336, -26.801422119140625, -25.44403839111328, -24.08665657043457, -22.72927474975586, -21.371891021728516, -20.014509201049805, -18.657127380371094, -17.299745559692383, -15.942362785339355, -14.584980010986328, -13.227598190307617, -11.87021541595459, -10.512833595275879, -9.155450820922852, -7.798069000244141, -6.44068717956543, -5.083304405212402, -3.7259230613708496, -2.3685407638549805, -1.0111587047576904, 0.3462233543395996, 1.7036056518554688, 3.060987949371338, 4.418369770050049, 5.775752544403076, 7.133134365081787]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 1.0, 5.0, 8.0, 24.0, 16.0, 31.0, 42.0, 45.0, 62.0, 64.0, 88.0, 87.0, 86.0, 79.0, 83.0, 74.0, 63.0, 33.0, 36.0, 19.0, 17.0, 15.0, 6.0, 10.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.27345085144043, -12.872393608093262, -12.471336364746094, -12.070279121398926, -11.669221878051758, -11.26816463470459, -10.867107391357422, -10.466049194335938, -10.064992904663086, -9.663935661315918, -9.26287841796875, -8.861821174621582, -8.460763931274414, -8.059706687927246, -7.65864896774292, -7.257591724395752, -6.856534004211426, -6.455476760864258, -6.05441951751709, -5.653362274169922, -5.252305030822754, -4.851247787475586, -4.45019006729126, -4.049132823944092, -3.648075580596924, -3.247018337249756, -2.845961093902588, -2.444903612136841, -2.043846368789673, -1.6427891254425049, -1.2417316436767578, -0.8406744003295898, -0.4396171569824219, -0.03855985403060913, 0.3624974489212036, 0.7635548114776611, 1.164612054824829, 1.565669298171997, 1.9667267799377441, 2.367784023284912, 2.76884126663208, 3.169898509979248, 3.570955753326416, 3.972013235092163, 4.37307071685791, 4.774127960205078, 5.175185203552246, 5.576242446899414, 5.977299690246582, 6.37835693359375, 6.779414176940918, 7.180471420288086, 7.581528663635254, 7.982585906982422, 8.383644104003906, 8.784700393676758, 9.185758590698242, 9.58681583404541, 9.987873077392578, 10.388930320739746, 10.789987564086914, 11.191044807434082, 11.59210205078125, 11.993160247802734, 12.394216537475586]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 7.0, 9.0, 9.0, 32.0, 48.0, 118.0, 434.0, 2952.0, 44340.0, 719861.0, 267867.0, 11310.0, 1128.0, 255.0, 62.0, 43.0, 15.0, 22.0, 13.0, 7.0, 5.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.146240234375, -12.54248046875, -11.938720703125, -11.3349609375, -10.731201171875, -10.12744140625, -9.523681640625, -8.919921875, -8.316162109375, -7.71240234375, -7.108642578125, -6.5048828125, -5.901123046875, -5.29736328125, -4.693603515625, -4.08984375, -3.486083984375, -2.88232421875, -2.278564453125, -1.6748046875, -1.071044921875, -0.46728515625, 0.136474609375, 0.740234375, 1.343994140625, 1.94775390625, 2.551513671875, 3.1552734375, 3.759033203125, 4.36279296875, 4.966552734375, 5.5703125, 6.174072265625, 6.77783203125, 7.381591796875, 7.9853515625, 8.589111328125, 9.19287109375, 9.796630859375, 10.400390625, 11.004150390625, 11.60791015625, 12.211669921875, 12.8154296875, 13.419189453125, 14.02294921875, 14.626708984375, 15.23046875, 15.834228515625, 16.43798828125, 17.041748046875, 17.6455078125, 18.249267578125, 18.85302734375, 19.456787109375, 20.060546875, 20.664306640625, 21.26806640625, 21.871826171875, 22.4755859375, 23.079345703125, 23.68310546875, 24.286865234375, 24.890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 11.0, 10.0, 12.0, 22.0, 14.0, 24.0, 42.0, 29.0, 35.0, 51.0, 53.0, 56.0, 61.0, 52.0, 69.0, 50.0, 66.0, 70.0, 47.0, 42.0, 39.0, 28.0, 21.0, 23.0, 15.0, 11.0, 10.0, 8.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-21.0625, -20.5457763671875, -20.029052734375, -19.5123291015625, -18.99560546875, -18.4788818359375, -17.962158203125, -17.4454345703125, -16.9287109375, -16.4119873046875, -15.895263671875, -15.3785400390625, -14.86181640625, -14.3450927734375, -13.828369140625, -13.3116455078125, -12.794921875, -12.2781982421875, -11.761474609375, -11.2447509765625, -10.72802734375, -10.2113037109375, -9.694580078125, -9.1778564453125, -8.6611328125, -8.1444091796875, -7.627685546875, -7.1109619140625, -6.59423828125, -6.0775146484375, -5.560791015625, -5.0440673828125, -4.52734375, -4.0106201171875, -3.493896484375, -2.9771728515625, -2.46044921875, -1.9437255859375, -1.427001953125, -0.9102783203125, -0.3935546875, 0.1231689453125, 0.639892578125, 1.1566162109375, 1.67333984375, 2.1900634765625, 2.706787109375, 3.2235107421875, 3.740234375, 4.2569580078125, 4.773681640625, 5.2904052734375, 5.80712890625, 6.3238525390625, 6.840576171875, 7.3572998046875, 7.8740234375, 8.3907470703125, 8.907470703125, 9.4241943359375, 9.94091796875, 10.4576416015625, 10.974365234375, 11.4910888671875, 12.0078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 12.0, 13.0, 24.0, 48.0, 64.0, 99.0, 165.0, 292.0, 659.0, 5222.0, 624911.0, 411825.0, 4007.0, 564.0, 281.0, 138.0, 90.0, 62.0, 27.0, 13.0, 19.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.34375, -24.43701171875, -23.5302734375, -22.62353515625, -21.716796875, -20.81005859375, -19.9033203125, -18.99658203125, -18.08984375, -17.18310546875, -16.2763671875, -15.36962890625, -14.462890625, -13.55615234375, -12.6494140625, -11.74267578125, -10.8359375, -9.92919921875, -9.0224609375, -8.11572265625, -7.208984375, -6.30224609375, -5.3955078125, -4.48876953125, -3.58203125, -2.67529296875, -1.7685546875, -0.86181640625, 0.044921875, 0.95166015625, 1.8583984375, 2.76513671875, 3.671875, 4.57861328125, 5.4853515625, 6.39208984375, 7.298828125, 8.20556640625, 9.1123046875, 10.01904296875, 10.92578125, 11.83251953125, 12.7392578125, 13.64599609375, 14.552734375, 15.45947265625, 16.3662109375, 17.27294921875, 18.1796875, 19.08642578125, 19.9931640625, 20.89990234375, 21.806640625, 22.71337890625, 23.6201171875, 24.52685546875, 25.43359375, 26.34033203125, 27.2470703125, 28.15380859375, 29.060546875, 29.96728515625, 30.8740234375, 31.78076171875, 32.6875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 1.0, 9.0, 8.0, 15.0, 9.0, 7.0, 21.0, 19.0, 29.0, 35.0, 28.0, 32.0, 46.0, 46.0, 45.0, 48.0, 56.0, 43.0, 56.0, 43.0, 52.0, 41.0, 46.0, 47.0, 35.0, 26.0, 26.0, 32.0, 16.0, 17.0, 13.0, 9.0, 9.0, 5.0, 13.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.71875, -17.1796875, -16.640625, -16.1015625, -15.5625, -15.0234375, -14.484375, -13.9453125, -13.40625, -12.8671875, -12.328125, -11.7890625, -11.25, -10.7109375, -10.171875, -9.6328125, -9.09375, -8.5546875, -8.015625, -7.4765625, -6.9375, -6.3984375, -5.859375, -5.3203125, -4.78125, -4.2421875, -3.703125, -3.1640625, -2.625, -2.0859375, -1.546875, -1.0078125, -0.46875, 0.0703125, 0.609375, 1.1484375, 1.6875, 2.2265625, 2.765625, 3.3046875, 3.84375, 4.3828125, 4.921875, 5.4609375, 6.0, 6.5390625, 7.078125, 7.6171875, 8.15625, 8.6953125, 9.234375, 9.7734375, 10.3125, 10.8515625, 11.390625, 11.9296875, 12.46875, 13.0078125, 13.546875, 14.0859375, 14.625, 15.1640625, 15.703125, 16.2421875, 16.78125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 3.0, 8.0, 19.0, 30.0, 48.0, 99.0, 204.0, 459.0, 1823.0, 13079.0, 551655.0, 466809.0, 11617.0, 1797.0, 481.0, 200.0, 91.0, 49.0, 24.0, 16.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8828125, -10.610595703125, -10.33837890625, -10.066162109375, -9.7939453125, -9.521728515625, -9.24951171875, -8.977294921875, -8.705078125, -8.432861328125, -8.16064453125, -7.888427734375, -7.6162109375, -7.343994140625, -7.07177734375, -6.799560546875, -6.52734375, -6.255126953125, -5.98291015625, -5.710693359375, -5.4384765625, -5.166259765625, -4.89404296875, -4.621826171875, -4.349609375, -4.077392578125, -3.80517578125, -3.532958984375, -3.2607421875, -2.988525390625, -2.71630859375, -2.444091796875, -2.171875, -1.899658203125, -1.62744140625, -1.355224609375, -1.0830078125, -0.810791015625, -0.53857421875, -0.266357421875, 0.005859375, 0.278076171875, 0.55029296875, 0.822509765625, 1.0947265625, 1.366943359375, 1.63916015625, 1.911376953125, 2.18359375, 2.455810546875, 2.72802734375, 3.000244140625, 3.2724609375, 3.544677734375, 3.81689453125, 4.089111328125, 4.361328125, 4.633544921875, 4.90576171875, 5.177978515625, 5.4501953125, 5.722412109375, 5.99462890625, 6.266845703125, 6.5390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 8.0, 16.0, 25.0, 23.0, 43.0, 64.0, 103.0, 99.0, 178.0, 140.0, 87.0, 68.0, 47.0, 29.0, 28.0, 17.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006384849548339844, -0.0006116107106208801, -0.0005847364664077759, -0.0005578622221946716, -0.0005309879779815674, -0.0005041137337684631, -0.0004772394895553589, -0.00045036524534225464, -0.0004234910011291504, -0.00039661675691604614, -0.0003697425127029419, -0.00034286826848983765, -0.0003159940242767334, -0.00028911978006362915, -0.0002622455358505249, -0.00023537129163742065, -0.0002084970474243164, -0.00018162280321121216, -0.0001547485589981079, -0.00012787431478500366, -0.00010100007057189941, -7.412582635879517e-05, -4.725158214569092e-05, -2.037733793258667e-05, 6.496906280517578e-06, 3.3371150493621826e-05, 6.0245394706726074e-05, 8.711963891983032e-05, 0.00011399388313293457, 0.00014086812734603882, 0.00016774237155914307, 0.00019461661577224731, 0.00022149085998535156, 0.0002483651041984558, 0.00027523934841156006, 0.0003021135926246643, 0.00032898783683776855, 0.0003558620810508728, 0.00038273632526397705, 0.0004096105694770813, 0.00043648481369018555, 0.0004633590579032898, 0.000490233302116394, 0.0005171075463294983, 0.0005439817905426025, 0.0005708560347557068, 0.000597730278968811, 0.0006246045231819153, 0.0006514787673950195, 0.0006783530116081238, 0.000705227255821228, 0.0007321015000343323, 0.0007589757442474365, 0.0007858499884605408, 0.000812724232673645, 0.0008395984768867493, 0.0008664727210998535, 0.0008933469653129578, 0.000920221209526062, 0.0009470954537391663, 0.0009739696979522705, 0.0010008439421653748, 0.001027718186378479, 0.0010545924305915833, 0.0010814666748046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 13.0, 11.0, 15.0, 27.0, 72.0, 121.0, 322.0, 1158.0, 8205.0, 434151.0, 592261.0, 10211.0, 1284.0, 358.0, 135.0, 84.0, 42.0, 23.0, 16.0, 10.0, 8.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9921875, -9.6802978515625, -9.368408203125, -9.0565185546875, -8.74462890625, -8.4327392578125, -8.120849609375, -7.8089599609375, -7.4970703125, -7.1851806640625, -6.873291015625, -6.5614013671875, -6.24951171875, -5.9376220703125, -5.625732421875, -5.3138427734375, -5.001953125, -4.6900634765625, -4.378173828125, -4.0662841796875, -3.75439453125, -3.4425048828125, -3.130615234375, -2.8187255859375, -2.5068359375, -2.1949462890625, -1.883056640625, -1.5711669921875, -1.25927734375, -0.9473876953125, -0.635498046875, -0.3236083984375, -0.01171875, 0.3001708984375, 0.612060546875, 0.9239501953125, 1.23583984375, 1.5477294921875, 1.859619140625, 2.1715087890625, 2.4833984375, 2.7952880859375, 3.107177734375, 3.4190673828125, 3.73095703125, 4.0428466796875, 4.354736328125, 4.6666259765625, 4.978515625, 5.2904052734375, 5.602294921875, 5.9141845703125, 6.22607421875, 6.5379638671875, 6.849853515625, 7.1617431640625, 7.4736328125, 7.7855224609375, 8.097412109375, 8.4093017578125, 8.72119140625, 9.0330810546875, 9.344970703125, 9.6568603515625, 9.96875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 4.0, 4.0, 4.0, 14.0, 13.0, 14.0, 25.0, 24.0, 39.0, 49.0, 56.0, 57.0, 85.0, 82.0, 100.0, 85.0, 73.0, 60.0, 40.0, 44.0, 24.0, 23.0, 25.0, 18.0, 12.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5107421875, -1.4640655517578125, -1.417388916015625, -1.3707122802734375, -1.32403564453125, -1.2773590087890625, -1.230682373046875, -1.1840057373046875, -1.1373291015625, -1.0906524658203125, -1.043975830078125, -0.9972991943359375, -0.95062255859375, -0.9039459228515625, -0.857269287109375, -0.8105926513671875, -0.763916015625, -0.7172393798828125, -0.670562744140625, -0.6238861083984375, -0.57720947265625, -0.5305328369140625, -0.483856201171875, -0.4371795654296875, -0.3905029296875, -0.3438262939453125, -0.297149658203125, -0.2504730224609375, -0.20379638671875, -0.1571197509765625, -0.110443115234375, -0.0637664794921875, -0.01708984375, 0.0295867919921875, 0.076263427734375, 0.1229400634765625, 0.16961669921875, 0.2162933349609375, 0.262969970703125, 0.3096466064453125, 0.3563232421875, 0.4029998779296875, 0.449676513671875, 0.4963531494140625, 0.54302978515625, 0.5897064208984375, 0.636383056640625, 0.6830596923828125, 0.729736328125, 0.7764129638671875, 0.823089599609375, 0.8697662353515625, 0.91644287109375, 0.9631195068359375, 1.009796142578125, 1.0564727783203125, 1.1031494140625, 1.1498260498046875, 1.196502685546875, 1.2431793212890625, 1.28985595703125, 1.3365325927734375, 1.383209228515625, 1.4298858642578125, 1.4765625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 8.0, 31.0, 38.0, 84.0, 140.0, 160.0, 198.0, 152.0, 90.0, 53.0, 28.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.93447494506836, -51.779808044433594, -50.62514114379883, -49.47047424316406, -48.3158073425293, -47.16114044189453, -46.006473541259766, -44.851806640625, -43.697139739990234, -42.54247283935547, -41.3878059387207, -40.23313903808594, -39.07847213745117, -37.923805236816406, -36.76913833618164, -35.614471435546875, -34.459800720214844, -33.30513381958008, -32.15046691894531, -30.995800018310547, -29.84113311767578, -28.686466217041016, -27.53179931640625, -26.377132415771484, -25.22246551513672, -24.067798614501953, -22.913131713867188, -21.758464813232422, -20.603797912597656, -19.44913101196289, -18.294464111328125, -17.13979721069336, -15.985132217407227, -14.830465316772461, -13.675798416137695, -12.52113151550293, -11.366464614868164, -10.211797714233398, -9.057129859924316, -7.902462959289551, -6.747796058654785, -5.5931291580200195, -4.438462257385254, -3.28379487991333, -2.1291279792785645, -0.9744610786437988, 0.180206298828125, 1.3348731994628906, 2.4895401000976562, 3.644207000732422, 4.7988739013671875, 5.953541278839111, 7.108208179473877, 8.262874603271484, 9.417542457580566, 10.572209358215332, 11.726876258850098, 12.881543159484863, 14.036210060119629, 15.190877914428711, 16.345544815063477, 17.500211715698242, 18.654878616333008, 19.809545516967773, 20.96421241760254]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 5.0, 7.0, 7.0, 7.0, 10.0, 10.0, 11.0, 17.0, 10.0, 19.0, 29.0, 33.0, 27.0, 44.0, 44.0, 38.0, 47.0, 29.0, 59.0, 44.0, 52.0, 44.0, 48.0, 41.0, 47.0, 48.0, 39.0, 36.0, 26.0, 19.0, 21.0, 17.0, 15.0, 10.0, 13.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.81801986694336, -29.952289581298828, -29.086557388305664, -28.220827102661133, -27.3550968170166, -26.489364624023438, -25.623634338378906, -24.757904052734375, -23.89217185974121, -23.02644157409668, -22.160709381103516, -21.294979095458984, -20.429248809814453, -19.56351661682129, -18.697786331176758, -17.832054138183594, -16.966323852539062, -16.10059356689453, -15.234862327575684, -14.369131088256836, -13.503399848937988, -12.63766860961914, -11.77193832397461, -10.906207084655762, -10.040477752685547, -9.1747465133667, -8.309016227722168, -7.44328498840332, -6.577553749084473, -5.711822986602783, -4.846092224121094, -3.980360984802246, -3.1146297454833984, -2.24889874458313, -1.3831678628921509, -0.5174369812011719, 0.3482940196990967, 1.2140250205993652, 2.0797557830810547, 2.9454870223999023, 3.811217784881592, 4.676948547363281, 5.542679786682129, 6.408410549163818, 7.274141311645508, 8.139872550964355, 9.005603790283203, 9.871334075927734, 10.737065315246582, 11.60279655456543, 12.468526840209961, 13.334258079528809, 14.199989318847656, 15.065719604492188, 15.931450843811035, 16.797182083129883, 17.662912368774414, 18.528642654418945, 19.39437484741211, 20.26010513305664, 21.125835418701172, 21.991567611694336, 22.857297897338867, 23.72303009033203, 24.588760375976562]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 7.0, 15.0, 25.0, 18.0, 52.0, 61.0, 118.0, 227.0, 429.0, 1100.0, 5945.0, 201054.0, 3542644.0, 428241.0, 11963.0, 1424.0, 402.0, 190.0, 111.0, 77.0, 48.0, 38.0, 16.0, 14.0, 13.0, 9.0, 11.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-28.109375, -27.319580078125, -26.52978515625, -25.739990234375, -24.9501953125, -24.160400390625, -23.37060546875, -22.580810546875, -21.791015625, -21.001220703125, -20.21142578125, -19.421630859375, -18.6318359375, -17.842041015625, -17.05224609375, -16.262451171875, -15.47265625, -14.682861328125, -13.89306640625, -13.103271484375, -12.3134765625, -11.523681640625, -10.73388671875, -9.944091796875, -9.154296875, -8.364501953125, -7.57470703125, -6.784912109375, -5.9951171875, -5.205322265625, -4.41552734375, -3.625732421875, -2.8359375, -2.046142578125, -1.25634765625, -0.466552734375, 0.3232421875, 1.113037109375, 1.90283203125, 2.692626953125, 3.482421875, 4.272216796875, 5.06201171875, 5.851806640625, 6.6416015625, 7.431396484375, 8.22119140625, 9.010986328125, 9.80078125, 10.590576171875, 11.38037109375, 12.170166015625, 12.9599609375, 13.749755859375, 14.53955078125, 15.329345703125, 16.119140625, 16.908935546875, 17.69873046875, 18.488525390625, 19.2783203125, 20.068115234375, 20.85791015625, 21.647705078125, 22.4375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 0.0, 6.0, 5.0, 13.0, 9.0, 13.0, 17.0, 21.0, 22.0, 26.0, 35.0, 46.0, 58.0, 59.0, 62.0, 77.0, 71.0, 66.0, 69.0, 60.0, 48.0, 42.0, 40.0, 25.0, 21.0, 24.0, 11.0, 19.0, 9.0, 8.0, 7.0, 7.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-16.3125, -15.9259033203125, -15.539306640625, -15.1527099609375, -14.76611328125, -14.3795166015625, -13.992919921875, -13.6063232421875, -13.2197265625, -12.8331298828125, -12.446533203125, -12.0599365234375, -11.67333984375, -11.2867431640625, -10.900146484375, -10.5135498046875, -10.126953125, -9.7403564453125, -9.353759765625, -8.9671630859375, -8.58056640625, -8.1939697265625, -7.807373046875, -7.4207763671875, -7.0341796875, -6.6475830078125, -6.260986328125, -5.8743896484375, -5.48779296875, -5.1011962890625, -4.714599609375, -4.3280029296875, -3.94140625, -3.5548095703125, -3.168212890625, -2.7816162109375, -2.39501953125, -2.0084228515625, -1.621826171875, -1.2352294921875, -0.8486328125, -0.4620361328125, -0.075439453125, 0.3111572265625, 0.69775390625, 1.0843505859375, 1.470947265625, 1.8575439453125, 2.244140625, 2.6307373046875, 3.017333984375, 3.4039306640625, 3.79052734375, 4.1771240234375, 4.563720703125, 4.9503173828125, 5.3369140625, 5.7235107421875, 6.110107421875, 6.4967041015625, 6.88330078125, 7.2698974609375, 7.656494140625, 8.0430908203125, 8.4296875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 1.0, 2.0, 5.0, 17.0, 16.0, 31.0, 40.0, 64.0, 130.0, 228.0, 502.0, 1208.0, 3788.0, 21145.0, 361141.0, 3462727.0, 317748.0, 19589.0, 3631.0, 1186.0, 479.0, 232.0, 127.0, 90.0, 59.0, 28.0, 24.0, 9.0, 5.0, 12.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5703125, -13.0765380859375, -12.582763671875, -12.0889892578125, -11.59521484375, -11.1014404296875, -10.607666015625, -10.1138916015625, -9.6201171875, -9.1263427734375, -8.632568359375, -8.1387939453125, -7.64501953125, -7.1512451171875, -6.657470703125, -6.1636962890625, -5.669921875, -5.1761474609375, -4.682373046875, -4.1885986328125, -3.69482421875, -3.2010498046875, -2.707275390625, -2.2135009765625, -1.7197265625, -1.2259521484375, -0.732177734375, -0.2384033203125, 0.25537109375, 0.7491455078125, 1.242919921875, 1.7366943359375, 2.23046875, 2.7242431640625, 3.218017578125, 3.7117919921875, 4.20556640625, 4.6993408203125, 5.193115234375, 5.6868896484375, 6.1806640625, 6.6744384765625, 7.168212890625, 7.6619873046875, 8.15576171875, 8.6495361328125, 9.143310546875, 9.6370849609375, 10.130859375, 10.6246337890625, 11.118408203125, 11.6121826171875, 12.10595703125, 12.5997314453125, 13.093505859375, 13.5872802734375, 14.0810546875, 14.5748291015625, 15.068603515625, 15.5623779296875, 16.05615234375, 16.5499267578125, 17.043701171875, 17.5374755859375, 18.03125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 11.0, 19.0, 20.0, 27.0, 59.0, 97.0, 148.0, 276.0, 428.0, 587.0, 632.0, 622.0, 433.0, 281.0, 167.0, 104.0, 59.0, 40.0, 18.0, 17.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.55743408203125, -4.4078369140625, -4.25823974609375, -4.108642578125, -3.95904541015625, -3.8094482421875, -3.65985107421875, -3.51025390625, -3.36065673828125, -3.2110595703125, -3.06146240234375, -2.911865234375, -2.76226806640625, -2.6126708984375, -2.46307373046875, -2.3134765625, -2.16387939453125, -2.0142822265625, -1.86468505859375, -1.715087890625, -1.56549072265625, -1.4158935546875, -1.26629638671875, -1.11669921875, -0.96710205078125, -0.8175048828125, -0.66790771484375, -0.518310546875, -0.36871337890625, -0.2191162109375, -0.06951904296875, 0.080078125, 0.22967529296875, 0.3792724609375, 0.52886962890625, 0.678466796875, 0.82806396484375, 0.9776611328125, 1.12725830078125, 1.27685546875, 1.42645263671875, 1.5760498046875, 1.72564697265625, 1.875244140625, 2.02484130859375, 2.1744384765625, 2.32403564453125, 2.4736328125, 2.62322998046875, 2.7728271484375, 2.92242431640625, 3.072021484375, 3.22161865234375, 3.3712158203125, 3.52081298828125, 3.67041015625, 3.82000732421875, 3.9696044921875, 4.11920166015625, 4.268798828125, 4.41839599609375, 4.5679931640625, 4.71759033203125, 4.8671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 9.0, 28.0, 31.0, 60.0, 80.0, 116.0, 125.0, 123.0, 129.0, 100.0, 70.0, 47.0, 26.0, 20.0, 15.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.108928680419922, -29.469072341918945, -28.82921600341797, -28.189359664916992, -27.549503326416016, -26.909645080566406, -26.26978874206543, -25.629932403564453, -24.990076065063477, -24.3502197265625, -23.710363388061523, -23.070507049560547, -22.430648803710938, -21.79079246520996, -21.150936126708984, -20.511079788208008, -19.87122344970703, -19.231367111206055, -18.591510772705078, -17.9516544342041, -17.311798095703125, -16.671939849853516, -16.03208351135254, -15.392227172851562, -14.752370834350586, -14.11251449584961, -13.472658157348633, -12.83280086517334, -12.192944526672363, -11.553088188171387, -10.913230895996094, -10.273374557495117, -9.633520126342773, -8.993663787841797, -8.35380744934082, -7.713950157165527, -7.074093818664551, -6.434237480163574, -5.7943806648254395, -5.154523849487305, -4.514667510986328, -3.8748109340667725, -3.234954357147217, -2.595097780227661, -1.9552412033081055, -1.3153846263885498, -0.6755280494689941, -0.035671234130859375, 0.6041851043701172, 1.2440416812896729, 1.8838982582092285, 2.523754835128784, 3.16361141204834, 3.8034679889678955, 4.443324565887451, 5.083181381225586, 5.7230377197265625, 6.362894058227539, 7.002750873565674, 7.642607688903809, 8.282464027404785, 8.922320365905762, 9.562177658081055, 10.202033996582031, 10.841890335083008]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 14.0, 17.0, 16.0, 13.0, 22.0, 25.0, 21.0, 44.0, 31.0, 44.0, 53.0, 43.0, 53.0, 55.0, 48.0, 67.0, 63.0, 44.0, 49.0, 43.0, 42.0, 29.0, 38.0, 24.0, 15.0, 17.0, 21.0, 11.0, 4.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.287419319152832, -9.924681663513184, -9.561944007873535, -9.199206352233887, -8.836468696594238, -8.47373104095459, -8.110993385314941, -7.748255729675293, -7.3855180740356445, -7.022780418395996, -6.660042762756348, -6.297305107116699, -5.934567451477051, -5.571829795837402, -5.209092140197754, -4.8463544845581055, -4.483616352081299, -4.12087869644165, -3.758141040802002, -3.3954033851623535, -3.032665729522705, -2.6699280738830566, -2.307190179824829, -1.9444525241851807, -1.5817148685455322, -1.2189772129058838, -0.8562394976615906, -0.49350178241729736, -0.13076412677764893, 0.2319735288619995, 0.5947113037109375, 0.9574489593505859, 1.3201866149902344, 1.6829242706298828, 2.0456619262695312, 2.4083995819091797, 2.771137237548828, 3.1338748931884766, 3.496612787246704, 3.8593504428863525, 4.222087860107422, 4.58482551574707, 4.947563171386719, 5.310300827026367, 5.673038482666016, 6.035776138305664, 6.3985137939453125, 6.761251449584961, 7.123989582061768, 7.486727237701416, 7.8494648933410645, 8.212203025817871, 8.57494068145752, 8.937678337097168, 9.300415992736816, 9.663153648376465, 10.025891304016113, 10.388628959655762, 10.75136661529541, 11.114104270935059, 11.476841926574707, 11.839579582214355, 12.202317237854004, 12.565054893493652, 12.9277925491333]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 14.0, 17.0, 18.0, 27.0, 41.0, 69.0, 131.0, 238.0, 473.0, 1324.0, 4325.0, 18215.0, 106174.0, 499588.0, 345263.0, 57204.0, 10898.0, 2825.0, 903.0, 373.0, 186.0, 88.0, 50.0, 26.0, 26.0, 16.0, 15.0, 10.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.129302978515625, -3.03399658203125, -2.938690185546875, -2.8433837890625, -2.748077392578125, -2.65277099609375, -2.557464599609375, -2.462158203125, -2.366851806640625, -2.27154541015625, -2.176239013671875, -2.0809326171875, -1.985626220703125, -1.89031982421875, -1.795013427734375, -1.69970703125, -1.604400634765625, -1.50909423828125, -1.413787841796875, -1.3184814453125, -1.223175048828125, -1.12786865234375, -1.032562255859375, -0.937255859375, -0.841949462890625, -0.74664306640625, -0.651336669921875, -0.5560302734375, -0.460723876953125, -0.36541748046875, -0.270111083984375, -0.1748046875, -0.079498291015625, 0.01580810546875, 0.111114501953125, 0.2064208984375, 0.301727294921875, 0.39703369140625, 0.492340087890625, 0.587646484375, 0.682952880859375, 0.77825927734375, 0.873565673828125, 0.9688720703125, 1.064178466796875, 1.15948486328125, 1.254791259765625, 1.35009765625, 1.445404052734375, 1.54071044921875, 1.636016845703125, 1.7313232421875, 1.826629638671875, 1.92193603515625, 2.017242431640625, 2.112548828125, 2.207855224609375, 2.30316162109375, 2.398468017578125, 2.4937744140625, 2.589080810546875, 2.68438720703125, 2.779693603515625, 2.875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 17.0, 21.0, 25.0, 22.0, 38.0, 39.0, 62.0, 76.0, 69.0, 81.0, 91.0, 86.0, 95.0, 67.0, 51.0, 48.0, 32.0, 28.0, 15.0, 17.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.8292236328125, -8.463134765625, -8.0970458984375, -7.73095703125, -7.3648681640625, -6.998779296875, -6.6326904296875, -6.2666015625, -5.9005126953125, -5.534423828125, -5.1683349609375, -4.80224609375, -4.4361572265625, -4.070068359375, -3.7039794921875, -3.337890625, -2.9718017578125, -2.605712890625, -2.2396240234375, -1.87353515625, -1.5074462890625, -1.141357421875, -0.7752685546875, -0.4091796875, -0.0430908203125, 0.322998046875, 0.6890869140625, 1.05517578125, 1.4212646484375, 1.787353515625, 2.1534423828125, 2.51953125, 2.8856201171875, 3.251708984375, 3.6177978515625, 3.98388671875, 4.3499755859375, 4.716064453125, 5.0821533203125, 5.4482421875, 5.8143310546875, 6.180419921875, 6.5465087890625, 6.91259765625, 7.2786865234375, 7.644775390625, 8.0108642578125, 8.376953125, 8.7430419921875, 9.109130859375, 9.4752197265625, 9.84130859375, 10.2073974609375, 10.573486328125, 10.9395751953125, 11.3056640625, 11.6717529296875, 12.037841796875, 12.4039306640625, 12.77001953125, 13.1361083984375, 13.502197265625, 13.8682861328125, 14.234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 8.0, 21.0, 29.0, 70.0, 109.0, 172.0, 293.0, 520.0, 967.0, 1845.0, 3532.0, 7360.0, 16009.0, 35846.0, 82047.0, 176415.0, 276184.0, 230868.0, 118870.0, 52611.0, 23553.0, 10616.0, 5046.0, 2432.0, 1364.0, 737.0, 446.0, 219.0, 136.0, 75.0, 64.0, 32.0, 21.0, 13.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3115234375, -1.271453857421875, -1.23138427734375, -1.191314697265625, -1.1512451171875, -1.111175537109375, -1.07110595703125, -1.031036376953125, -0.990966796875, -0.950897216796875, -0.91082763671875, -0.870758056640625, -0.8306884765625, -0.790618896484375, -0.75054931640625, -0.710479736328125, -0.67041015625, -0.630340576171875, -0.59027099609375, -0.550201416015625, -0.5101318359375, -0.470062255859375, -0.42999267578125, -0.389923095703125, -0.349853515625, -0.309783935546875, -0.26971435546875, -0.229644775390625, -0.1895751953125, -0.149505615234375, -0.10943603515625, -0.069366455078125, -0.029296875, 0.010772705078125, 0.05084228515625, 0.090911865234375, 0.1309814453125, 0.171051025390625, 0.21112060546875, 0.251190185546875, 0.291259765625, 0.331329345703125, 0.37139892578125, 0.411468505859375, 0.4515380859375, 0.491607666015625, 0.53167724609375, 0.571746826171875, 0.61181640625, 0.651885986328125, 0.69195556640625, 0.732025146484375, 0.7720947265625, 0.812164306640625, 0.85223388671875, 0.892303466796875, 0.932373046875, 0.972442626953125, 1.01251220703125, 1.052581787109375, 1.0926513671875, 1.132720947265625, 1.17279052734375, 1.212860107421875, 1.2529296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 10.0, 14.0, 18.0, 20.0, 15.0, 26.0, 20.0, 42.0, 31.0, 45.0, 39.0, 57.0, 56.0, 55.0, 49.0, 52.0, 55.0, 58.0, 49.0, 52.0, 29.0, 34.0, 17.0, 33.0, 24.0, 19.0, 15.0, 15.0, 13.0, 6.0, 8.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.125, -14.6474609375, -14.169921875, -13.6923828125, -13.21484375, -12.7373046875, -12.259765625, -11.7822265625, -11.3046875, -10.8271484375, -10.349609375, -9.8720703125, -9.39453125, -8.9169921875, -8.439453125, -7.9619140625, -7.484375, -7.0068359375, -6.529296875, -6.0517578125, -5.57421875, -5.0966796875, -4.619140625, -4.1416015625, -3.6640625, -3.1865234375, -2.708984375, -2.2314453125, -1.75390625, -1.2763671875, -0.798828125, -0.3212890625, 0.15625, 0.6337890625, 1.111328125, 1.5888671875, 2.06640625, 2.5439453125, 3.021484375, 3.4990234375, 3.9765625, 4.4541015625, 4.931640625, 5.4091796875, 5.88671875, 6.3642578125, 6.841796875, 7.3193359375, 7.796875, 8.2744140625, 8.751953125, 9.2294921875, 9.70703125, 10.1845703125, 10.662109375, 11.1396484375, 11.6171875, 12.0947265625, 12.572265625, 13.0498046875, 13.52734375, 14.0048828125, 14.482421875, 14.9599609375, 15.4375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 5.0, 7.0, 6.0, 14.0, 10.0, 25.0, 35.0, 46.0, 81.0, 95.0, 152.0, 183.0, 273.0, 434.0, 667.0, 1001.0, 1813.0, 3745.0, 8558.0, 25651.0, 89748.0, 286904.0, 398975.0, 158510.0, 46054.0, 13959.0, 5297.0, 2384.0, 1370.0, 918.0, 512.0, 308.0, 238.0, 173.0, 118.0, 87.0, 51.0, 41.0, 31.0, 19.0, 13.0, 14.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.36328125, -0.35266876220703125, -0.3420562744140625, -0.33144378662109375, -0.320831298828125, -0.31021881103515625, -0.2996063232421875, -0.28899383544921875, -0.27838134765625, -0.26776885986328125, -0.2571563720703125, -0.24654388427734375, -0.235931396484375, -0.22531890869140625, -0.2147064208984375, -0.20409393310546875, -0.1934814453125, -0.18286895751953125, -0.1722564697265625, -0.16164398193359375, -0.151031494140625, -0.14041900634765625, -0.1298065185546875, -0.11919403076171875, -0.10858154296875, -0.09796905517578125, -0.0873565673828125, -0.07674407958984375, -0.066131591796875, -0.05551910400390625, -0.0449066162109375, -0.03429412841796875, -0.023681640625, -0.01306915283203125, -0.0024566650390625, 0.00815582275390625, 0.018768310546875, 0.02938079833984375, 0.0399932861328125, 0.05060577392578125, 0.06121826171875, 0.07183074951171875, 0.0824432373046875, 0.09305572509765625, 0.103668212890625, 0.11428070068359375, 0.1248931884765625, 0.13550567626953125, 0.1461181640625, 0.15673065185546875, 0.1673431396484375, 0.17795562744140625, 0.188568115234375, 0.19918060302734375, 0.2097930908203125, 0.22040557861328125, 0.23101806640625, 0.24163055419921875, 0.2522430419921875, 0.26285552978515625, 0.273468017578125, 0.28408050537109375, 0.2946929931640625, 0.30530548095703125, 0.31591796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 11.0, 12.0, 9.0, 22.0, 30.0, 35.0, 48.0, 73.0, 81.0, 82.0, 80.0, 86.0, 86.0, 61.0, 57.0, 46.0, 35.0, 33.0, 20.0, 22.0, 16.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00016379356384277344, -0.000158797949552536, -0.00015380233526229858, -0.00014880672097206116, -0.00014381110668182373, -0.0001388154923915863, -0.00013381987810134888, -0.00012882426381111145, -0.00012382864952087402, -0.0001188330352306366, -0.00011383742094039917, -0.00010884180665016174, -0.00010384619235992432, -9.885057806968689e-05, -9.385496377944946e-05, -8.885934948921204e-05, -8.386373519897461e-05, -7.886812090873718e-05, -7.387250661849976e-05, -6.887689232826233e-05, -6.38812780380249e-05, -5.8885663747787476e-05, -5.389004945755005e-05, -4.889443516731262e-05, -4.3898820877075195e-05, -3.890320658683777e-05, -3.390759229660034e-05, -2.8911978006362915e-05, -2.3916363716125488e-05, -1.892074942588806e-05, -1.3925135135650635e-05, -8.929520845413208e-06, -3.933906555175781e-06, 1.0617077350616455e-06, 6.057322025299072e-06, 1.1052936315536499e-05, 1.6048550605773926e-05, 2.1044164896011353e-05, 2.603977918624878e-05, 3.1035393476486206e-05, 3.603100776672363e-05, 4.102662205696106e-05, 4.6022236347198486e-05, 5.101785063743591e-05, 5.601346492767334e-05, 6.1009079217910767e-05, 6.60046935081482e-05, 7.100030779838562e-05, 7.599592208862305e-05, 8.099153637886047e-05, 8.59871506690979e-05, 9.098276495933533e-05, 9.597837924957275e-05, 0.00010097399353981018, 0.00010596960783004761, 0.00011096522212028503, 0.00011596083641052246, 0.00012095645070075989, 0.00012595206499099731, 0.00013094767928123474, 0.00013594329357147217, 0.0001409389078617096, 0.00014593452215194702, 0.00015093013644218445, 0.00015592575073242188]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 11.0, 14.0, 38.0, 40.0, 42.0, 63.0, 106.0, 160.0, 260.0, 420.0, 994.0, 2649.0, 8732.0, 31928.0, 117540.0, 335272.0, 361103.0, 136021.0, 37760.0, 9983.0, 2977.0, 1040.0, 502.0, 300.0, 167.0, 109.0, 91.0, 55.0, 31.0, 20.0, 27.0, 20.0, 13.0, 8.0, 6.0, 5.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31884765625, -0.3085823059082031, -0.29831695556640625, -0.2880516052246094, -0.2777862548828125, -0.2675209045410156, -0.25725555419921875, -0.24699020385742188, -0.236724853515625, -0.22645950317382812, -0.21619415283203125, -0.20592880249023438, -0.1956634521484375, -0.18539810180664062, -0.17513275146484375, -0.16486740112304688, -0.15460205078125, -0.14433670043945312, -0.13407135009765625, -0.12380599975585938, -0.1135406494140625, -0.10327529907226562, -0.09300994873046875, -0.08274459838867188, -0.072479248046875, -0.062213897705078125, -0.05194854736328125, -0.041683197021484375, -0.0314178466796875, -0.021152496337890625, -0.01088714599609375, -0.000621795654296875, 0.0096435546875, 0.019908905029296875, 0.03017425537109375, 0.040439605712890625, 0.0507049560546875, 0.060970306396484375, 0.07123565673828125, 0.08150100708007812, 0.091766357421875, 0.10203170776367188, 0.11229705810546875, 0.12256240844726562, 0.1328277587890625, 0.14309310913085938, 0.15335845947265625, 0.16362380981445312, 0.17388916015625, 0.18415451049804688, 0.19441986083984375, 0.20468521118164062, 0.2149505615234375, 0.22521591186523438, 0.23548126220703125, 0.24574661254882812, 0.256011962890625, 0.2662773132324219, 0.27654266357421875, 0.2868080139160156, 0.2970733642578125, 0.3073387145996094, 0.31760406494140625, 0.3278694152832031, 0.338134765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 7.0, 11.0, 8.0, 7.0, 16.0, 15.0, 21.0, 19.0, 20.0, 29.0, 38.0, 51.0, 50.0, 52.0, 57.0, 79.0, 76.0, 62.0, 61.0, 60.0, 45.0, 40.0, 24.0, 31.0, 23.0, 23.0, 17.0, 15.0, 3.0, 11.0, 10.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1065673828125, -0.10317134857177734, -0.09977531433105469, -0.09637928009033203, -0.09298324584960938, -0.08958721160888672, -0.08619117736816406, -0.0827951431274414, -0.07939910888671875, -0.0760030746459961, -0.07260704040527344, -0.06921100616455078, -0.06581497192382812, -0.06241893768310547, -0.05902290344238281, -0.055626869201660156, -0.0522308349609375, -0.048834800720214844, -0.04543876647949219, -0.04204273223876953, -0.038646697998046875, -0.03525066375732422, -0.03185462951660156, -0.028458595275878906, -0.02506256103515625, -0.021666526794433594, -0.018270492553710938, -0.014874458312988281, -0.011478424072265625, -0.008082389831542969, -0.0046863555908203125, -0.0012903213500976562, 0.002105712890625, 0.005501747131347656, 0.008897781372070312, 0.012293815612792969, 0.015689849853515625, 0.01908588409423828, 0.022481918334960938, 0.025877952575683594, 0.02927398681640625, 0.032670021057128906, 0.03606605529785156, 0.03946208953857422, 0.042858123779296875, 0.04625415802001953, 0.04965019226074219, 0.053046226501464844, 0.0564422607421875, 0.059838294982910156, 0.06323432922363281, 0.06663036346435547, 0.07002639770507812, 0.07342243194580078, 0.07681846618652344, 0.0802145004272461, 0.08361053466796875, 0.0870065689086914, 0.09040260314941406, 0.09379863739013672, 0.09719467163085938, 0.10059070587158203, 0.10398674011230469, 0.10738277435302734, 0.11077880859375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 14.0, 59.0, 167.0, 326.0, 273.0, 117.0, 33.0, 12.0, 1.0, 1.0, 2.0, 1.0], "bins": [-53.010353088378906, -52.05902862548828, -51.107704162597656, -50.156375885009766, -49.20505142211914, -48.253726959228516, -47.30240249633789, -46.35107421875, -45.399749755859375, -44.44842529296875, -43.497100830078125, -42.545772552490234, -41.59444808959961, -40.643123626708984, -39.69179916381836, -38.74047088623047, -37.789146423339844, -36.83782196044922, -35.886497497558594, -34.9351692199707, -33.98384475708008, -33.03252029418945, -32.08119583129883, -31.12986946105957, -30.178546905517578, -29.227222442626953, -28.275896072387695, -27.32457160949707, -26.373245239257812, -25.421920776367188, -24.470596313476562, -23.519269943237305, -22.567943572998047, -21.616619110107422, -20.665292739868164, -19.71396827697754, -18.76264190673828, -17.811317443847656, -16.85999298095703, -15.908666610717773, -14.957341194152832, -14.00601577758789, -13.05469036102295, -12.103364944458008, -11.152040481567383, -10.200714111328125, -9.2493896484375, -8.298064231872559, -7.346738815307617, -6.395413398742676, -5.444087982177734, -4.492763042449951, -3.5414376258850098, -2.5901122093200684, -1.6387872695922852, -0.6874618530273438, 0.26386356353759766, 1.2151888608932495, 2.1665141582489014, 3.1178393363952637, 4.069164752960205, 5.0204901695251465, 5.97181510925293, 6.923140525817871, 7.8744659423828125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 19.0, 18.0, 17.0, 24.0, 25.0, 33.0, 46.0, 51.0, 61.0, 71.0, 74.0, 67.0, 87.0, 78.0, 63.0, 58.0, 44.0, 43.0, 32.0, 23.0, 17.0, 17.0, 8.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.420424461364746, -8.113265991210938, -7.806107044219971, -7.498948574066162, -7.1917901039123535, -6.884631156921387, -6.577472686767578, -6.2703142166137695, -5.963155746459961, -5.655997276306152, -5.3488383293151855, -5.041679859161377, -4.734521389007568, -4.427362442016602, -4.120203971862793, -3.8130455017089844, -3.5058865547180176, -3.19872784614563, -2.8915693759918213, -2.5844106674194336, -2.277252197265625, -1.9700934886932373, -1.6629347801208496, -1.355776309967041, -1.0486176013946533, -0.7414590120315552, -0.43430036306381226, -0.12714171409606934, 0.1800168752670288, 0.48717546463012695, 0.7943341732025146, 1.1014926433563232, 1.408651351928711, 1.715809941291809, 2.0229685306549072, 2.330127239227295, 2.6372857093811035, 2.944444417953491, 3.251603126525879, 3.5587615966796875, 3.865920305252075, 4.173079013824463, 4.4802374839782715, 4.787396430969238, 5.094554901123047, 5.4017133712768555, 5.708871841430664, 6.016030311584473, 6.3231892585754395, 6.630347728729248, 6.937506675720215, 7.244665145874023, 7.551823616027832, 7.858982086181641, 8.166141510009766, 8.473299026489258, 8.780458450317383, 9.087616920471191, 9.394775390625, 9.701934814453125, 10.009093284606934, 10.316251754760742, 10.62341022491455, 10.93056869506836, 11.237727165222168]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 12.0, 16.0, 23.0, 24.0, 51.0, 85.0, 117.0, 235.0, 474.0, 1017.0, 2637.0, 7674.0, 25165.0, 89493.0, 328917.0, 417447.0, 124866.0, 34041.0, 10321.0, 3398.0, 1277.0, 555.0, 278.0, 147.0, 83.0, 60.0, 41.0, 12.0, 20.0, 11.0, 13.0, 4.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.74700927734375, -6.5369873046875, -6.32696533203125, -6.116943359375, -5.90692138671875, -5.6968994140625, -5.48687744140625, -5.27685546875, -5.06683349609375, -4.8568115234375, -4.64678955078125, -4.436767578125, -4.22674560546875, -4.0167236328125, -3.80670166015625, -3.5966796875, -3.38665771484375, -3.1766357421875, -2.96661376953125, -2.756591796875, -2.54656982421875, -2.3365478515625, -2.12652587890625, -1.91650390625, -1.70648193359375, -1.4964599609375, -1.28643798828125, -1.076416015625, -0.86639404296875, -0.6563720703125, -0.44635009765625, -0.236328125, -0.02630615234375, 0.1837158203125, 0.39373779296875, 0.603759765625, 0.81378173828125, 1.0238037109375, 1.23382568359375, 1.44384765625, 1.65386962890625, 1.8638916015625, 2.07391357421875, 2.283935546875, 2.49395751953125, 2.7039794921875, 2.91400146484375, 3.1240234375, 3.33404541015625, 3.5440673828125, 3.75408935546875, 3.964111328125, 4.17413330078125, 4.3841552734375, 4.59417724609375, 4.80419921875, 5.01422119140625, 5.2242431640625, 5.43426513671875, 5.644287109375, 5.85430908203125, 6.0643310546875, 6.27435302734375, 6.484375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 2.0, 3.0, 9.0, 13.0, 16.0, 14.0, 19.0, 19.0, 25.0, 32.0, 24.0, 25.0, 32.0, 53.0, 53.0, 46.0, 48.0, 50.0, 42.0, 58.0, 61.0, 40.0, 55.0, 43.0, 32.0, 45.0, 17.0, 25.0, 16.0, 13.0, 14.0, 11.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0], "bins": [-16.921875, -16.4952392578125, -16.068603515625, -15.6419677734375, -15.21533203125, -14.7886962890625, -14.362060546875, -13.9354248046875, -13.5087890625, -13.0821533203125, -12.655517578125, -12.2288818359375, -11.80224609375, -11.3756103515625, -10.948974609375, -10.5223388671875, -10.095703125, -9.6690673828125, -9.242431640625, -8.8157958984375, -8.38916015625, -7.9625244140625, -7.535888671875, -7.1092529296875, -6.6826171875, -6.2559814453125, -5.829345703125, -5.4027099609375, -4.97607421875, -4.5494384765625, -4.122802734375, -3.6961669921875, -3.26953125, -2.8428955078125, -2.416259765625, -1.9896240234375, -1.56298828125, -1.1363525390625, -0.709716796875, -0.2830810546875, 0.1435546875, 0.5701904296875, 0.996826171875, 1.4234619140625, 1.85009765625, 2.2767333984375, 2.703369140625, 3.1300048828125, 3.556640625, 3.9832763671875, 4.409912109375, 4.8365478515625, 5.26318359375, 5.6898193359375, 6.116455078125, 6.5430908203125, 6.9697265625, 7.3963623046875, 7.822998046875, 8.2496337890625, 8.67626953125, 9.1029052734375, 9.529541015625, 9.9561767578125, 10.3828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 8.0, 10.0, 8.0, 15.0, 19.0, 28.0, 50.0, 66.0, 97.0, 118.0, 189.0, 268.0, 574.0, 1700.0, 19331.0, 496658.0, 506548.0, 19613.0, 1807.0, 538.0, 290.0, 195.0, 113.0, 75.0, 74.0, 52.0, 39.0, 24.0, 10.0, 11.0, 5.0, 8.0, 1.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.0269775390625, -12.561767578125, -12.0965576171875, -11.63134765625, -11.1661376953125, -10.700927734375, -10.2357177734375, -9.7705078125, -9.3052978515625, -8.840087890625, -8.3748779296875, -7.90966796875, -7.4444580078125, -6.979248046875, -6.5140380859375, -6.048828125, -5.5836181640625, -5.118408203125, -4.6531982421875, -4.18798828125, -3.7227783203125, -3.257568359375, -2.7923583984375, -2.3271484375, -1.8619384765625, -1.396728515625, -0.9315185546875, -0.46630859375, -0.0010986328125, 0.464111328125, 0.9293212890625, 1.39453125, 1.8597412109375, 2.324951171875, 2.7901611328125, 3.25537109375, 3.7205810546875, 4.185791015625, 4.6510009765625, 5.1162109375, 5.5814208984375, 6.046630859375, 6.5118408203125, 6.97705078125, 7.4422607421875, 7.907470703125, 8.3726806640625, 8.837890625, 9.3031005859375, 9.768310546875, 10.2335205078125, 10.69873046875, 11.1639404296875, 11.629150390625, 12.0943603515625, 12.5595703125, 13.0247802734375, 13.489990234375, 13.9552001953125, 14.42041015625, 14.8856201171875, 15.350830078125, 15.8160400390625, 16.28125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 12.0, 8.0, 16.0, 15.0, 14.0, 16.0, 23.0, 25.0, 16.0, 37.0, 31.0, 46.0, 37.0, 56.0, 49.0, 52.0, 56.0, 49.0, 62.0, 48.0, 42.0, 40.0, 34.0, 32.0, 22.0, 20.0, 19.0, 19.0, 15.0, 16.0, 6.0, 12.0, 6.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.915771484375, -15.39404296875, -14.872314453125, -14.3505859375, -13.828857421875, -13.30712890625, -12.785400390625, -12.263671875, -11.741943359375, -11.22021484375, -10.698486328125, -10.1767578125, -9.655029296875, -9.13330078125, -8.611572265625, -8.08984375, -7.568115234375, -7.04638671875, -6.524658203125, -6.0029296875, -5.481201171875, -4.95947265625, -4.437744140625, -3.916015625, -3.394287109375, -2.87255859375, -2.350830078125, -1.8291015625, -1.307373046875, -0.78564453125, -0.263916015625, 0.2578125, 0.779541015625, 1.30126953125, 1.822998046875, 2.3447265625, 2.866455078125, 3.38818359375, 3.909912109375, 4.431640625, 4.953369140625, 5.47509765625, 5.996826171875, 6.5185546875, 7.040283203125, 7.56201171875, 8.083740234375, 8.60546875, 9.127197265625, 9.64892578125, 10.170654296875, 10.6923828125, 11.214111328125, 11.73583984375, 12.257568359375, 12.779296875, 13.301025390625, 13.82275390625, 14.344482421875, 14.8662109375, 15.387939453125, 15.90966796875, 16.431396484375, 16.953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 4.0, 10.0, 26.0, 43.0, 147.0, 647.0, 4788.0, 879660.0, 160419.0, 2270.0, 369.0, 85.0, 31.0, 22.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8359375, -13.4014892578125, -12.967041015625, -12.5325927734375, -12.09814453125, -11.6636962890625, -11.229248046875, -10.7947998046875, -10.3603515625, -9.9259033203125, -9.491455078125, -9.0570068359375, -8.62255859375, -8.1881103515625, -7.753662109375, -7.3192138671875, -6.884765625, -6.4503173828125, -6.015869140625, -5.5814208984375, -5.14697265625, -4.7125244140625, -4.278076171875, -3.8436279296875, -3.4091796875, -2.9747314453125, -2.540283203125, -2.1058349609375, -1.67138671875, -1.2369384765625, -0.802490234375, -0.3680419921875, 0.06640625, 0.5008544921875, 0.935302734375, 1.3697509765625, 1.80419921875, 2.2386474609375, 2.673095703125, 3.1075439453125, 3.5419921875, 3.9764404296875, 4.410888671875, 4.8453369140625, 5.27978515625, 5.7142333984375, 6.148681640625, 6.5831298828125, 7.017578125, 7.4520263671875, 7.886474609375, 8.3209228515625, 8.75537109375, 9.1898193359375, 9.624267578125, 10.0587158203125, 10.4931640625, 10.9276123046875, 11.362060546875, 11.7965087890625, 12.23095703125, 12.6654052734375, 13.099853515625, 13.5343017578125, 13.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 4.0, 6.0, 8.0, 7.0, 19.0, 28.0, 38.0, 69.0, 91.0, 100.0, 116.0, 112.0, 117.0, 98.0, 62.0, 33.0, 29.0, 23.0, 9.0, 10.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006227493286132812, -0.0006025359034538269, -0.0005823224782943726, -0.0005621090531349182, -0.0005418956279754639, -0.0005216822028160095, -0.0005014687776565552, -0.00048125535249710083, -0.0004610419273376465, -0.00044082850217819214, -0.0004206150770187378, -0.00040040165185928345, -0.0003801882266998291, -0.00035997480154037476, -0.0003397613763809204, -0.00031954795122146606, -0.0002993345260620117, -0.0002791211009025574, -0.00025890767574310303, -0.00023869425058364868, -0.00021848082542419434, -0.00019826740026474, -0.00017805397510528564, -0.0001578405499458313, -0.00013762712478637695, -0.00011741369962692261, -9.720027446746826e-05, -7.698684930801392e-05, -5.677342414855957e-05, -3.6559998989105225e-05, -1.634657382965088e-05, 3.866851329803467e-06, 2.4080276489257812e-05, 4.429370164871216e-05, 6.45071268081665e-05, 8.472055196762085e-05, 0.0001049339771270752, 0.00012514740228652954, 0.0001453608274459839, 0.00016557425260543823, 0.00018578767776489258, 0.00020600110292434692, 0.00022621452808380127, 0.0002464279532432556, 0.00026664137840270996, 0.0002868548035621643, 0.00030706822872161865, 0.000327281653881073, 0.00034749507904052734, 0.0003677085041999817, 0.00038792192935943604, 0.0004081353545188904, 0.0004283487796783447, 0.00044856220483779907, 0.0004687756299972534, 0.0004889890551567078, 0.0005092024803161621, 0.0005294159054756165, 0.0005496293306350708, 0.0005698427557945251, 0.0005900561809539795, 0.0006102696061134338, 0.0006304830312728882, 0.0006506964564323425, 0.0006709098815917969]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 8.0, 14.0, 16.0, 51.0, 91.0, 256.0, 1037.0, 6672.0, 534406.0, 497958.0, 6487.0, 1020.0, 284.0, 103.0, 50.0, 35.0, 19.0, 12.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.9609375, -12.6285400390625, -12.296142578125, -11.9637451171875, -11.63134765625, -11.2989501953125, -10.966552734375, -10.6341552734375, -10.3017578125, -9.9693603515625, -9.636962890625, -9.3045654296875, -8.97216796875, -8.6397705078125, -8.307373046875, -7.9749755859375, -7.642578125, -7.3101806640625, -6.977783203125, -6.6453857421875, -6.31298828125, -5.9805908203125, -5.648193359375, -5.3157958984375, -4.9833984375, -4.6510009765625, -4.318603515625, -3.9862060546875, -3.65380859375, -3.3214111328125, -2.989013671875, -2.6566162109375, -2.32421875, -1.9918212890625, -1.659423828125, -1.3270263671875, -0.99462890625, -0.6622314453125, -0.329833984375, 0.0025634765625, 0.3349609375, 0.6673583984375, 0.999755859375, 1.3321533203125, 1.66455078125, 1.9969482421875, 2.329345703125, 2.6617431640625, 2.994140625, 3.3265380859375, 3.658935546875, 3.9913330078125, 4.32373046875, 4.6561279296875, 4.988525390625, 5.3209228515625, 5.6533203125, 5.9857177734375, 6.318115234375, 6.6505126953125, 6.98291015625, 7.3153076171875, 7.647705078125, 7.9801025390625, 8.3125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 10.0, 13.0, 26.0, 20.0, 66.0, 72.0, 97.0, 127.0, 141.0, 115.0, 102.0, 61.0, 41.0, 33.0, 18.0, 15.0, 10.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.79296875, -1.72528076171875, -1.6575927734375, -1.58990478515625, -1.522216796875, -1.45452880859375, -1.3868408203125, -1.31915283203125, -1.25146484375, -1.18377685546875, -1.1160888671875, -1.04840087890625, -0.980712890625, -0.91302490234375, -0.8453369140625, -0.77764892578125, -0.7099609375, -0.64227294921875, -0.5745849609375, -0.50689697265625, -0.439208984375, -0.37152099609375, -0.3038330078125, -0.23614501953125, -0.16845703125, -0.10076904296875, -0.0330810546875, 0.03460693359375, 0.102294921875, 0.16998291015625, 0.2376708984375, 0.30535888671875, 0.373046875, 0.44073486328125, 0.5084228515625, 0.57611083984375, 0.643798828125, 0.71148681640625, 0.7791748046875, 0.84686279296875, 0.91455078125, 0.98223876953125, 1.0499267578125, 1.11761474609375, 1.185302734375, 1.25299072265625, 1.3206787109375, 1.38836669921875, 1.4560546875, 1.52374267578125, 1.5914306640625, 1.65911865234375, 1.726806640625, 1.79449462890625, 1.8621826171875, 1.92987060546875, 1.99755859375, 2.06524658203125, 2.1329345703125, 2.20062255859375, 2.268310546875, 2.33599853515625, 2.4036865234375, 2.47137451171875, 2.5390625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 12.0, 28.0, 71.0, 137.0, 215.0, 232.0, 164.0, 74.0, 38.0, 14.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.613752365112305, -23.31734275817871, -22.020933151245117, -20.724525451660156, -19.428115844726562, -18.13170623779297, -16.835296630859375, -15.538887977600098, -14.242478370666504, -12.94606876373291, -11.649660110473633, -10.353250503540039, -9.056840896606445, -7.760432243347168, -6.464022636413574, -5.167613983154297, -3.871204376220703, -2.5747952461242676, -1.278385877609253, 0.01802349090576172, 1.3144326210021973, 2.610841751098633, 3.9072513580322266, 5.203660011291504, 6.500069618225098, 7.796478748321533, 9.092887878417969, 10.389297485351562, 11.685707092285156, 12.982115745544434, 14.278525352478027, 15.574934005737305, 16.871341705322266, 18.16775131225586, 19.464160919189453, 20.760570526123047, 22.056978225708008, 23.3533878326416, 24.649797439575195, 25.946205139160156, 27.24261474609375, 28.539024353027344, 29.835433959960938, 31.13184356689453, 32.428253173828125, 33.72466278076172, 35.02107238769531, 36.31747817993164, 37.6138916015625, 38.910301208496094, 40.20671081542969, 41.50312042236328, 42.799530029296875, 44.09593963623047, 45.39234924316406, 46.68875503540039, 47.985164642333984, 49.28157424926758, 50.57798385620117, 51.874393463134766, 53.17080307006836, 54.46720886230469, 55.76361846923828, 57.060028076171875, 58.35643768310547]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 5.0, 8.0, 9.0, 6.0, 9.0, 16.0, 21.0, 21.0, 26.0, 39.0, 25.0, 24.0, 35.0, 32.0, 43.0, 43.0, 50.0, 51.0, 44.0, 36.0, 43.0, 26.0, 43.0, 45.0, 36.0, 41.0, 26.0, 28.0, 20.0, 23.0, 23.0, 14.0, 18.0, 14.0, 17.0, 15.0, 4.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.671180725097656, -27.85697364807129, -27.042768478393555, -26.228561401367188, -25.414356231689453, -24.600149154663086, -23.78594207763672, -22.971736907958984, -22.157529830932617, -21.34332275390625, -20.529117584228516, -19.71491050720215, -18.90070343017578, -18.086498260498047, -17.27229118347168, -16.458084106445312, -15.643878936767578, -14.829672813415527, -14.015466690063477, -13.20125961303711, -12.387053489685059, -11.572847366333008, -10.75864028930664, -9.94443416595459, -9.130228042602539, -8.316021919250488, -7.501815319061279, -6.68760871887207, -5.8734025955200195, -5.059196472167969, -4.24498987197876, -3.430783271789551, -2.616575241088867, -1.8023688793182373, -0.9881625175476074, -0.17395615577697754, 0.6402502059936523, 1.4544563293457031, 2.268662929534912, 3.082869529724121, 3.897075653076172, 4.711281776428223, 5.525488376617432, 6.339694976806641, 7.153901100158691, 7.968107223510742, 8.78231430053711, 9.59652042388916, 10.410726547241211, 11.224932670593262, 12.039138793945312, 12.85334587097168, 13.66755199432373, 14.481758117675781, 15.295965194702148, 16.110172271728516, 16.92437744140625, 17.738584518432617, 18.55278968811035, 19.36699676513672, 20.181201934814453, 20.99540901184082, 21.809616088867188, 22.623821258544922, 23.43802833557129]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 9.0, 10.0, 18.0, 30.0, 42.0, 71.0, 145.0, 297.0, 741.0, 2882.0, 39171.0, 2495223.0, 1625136.0, 27523.0, 1956.0, 511.0, 227.0, 106.0, 57.0, 40.0, 34.0, 15.0, 12.0, 12.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-37.21875, -36.3905029296875, -35.562255859375, -34.7340087890625, -33.90576171875, -33.0775146484375, -32.249267578125, -31.4210205078125, -30.5927734375, -29.7645263671875, -28.936279296875, -28.1080322265625, -27.27978515625, -26.4515380859375, -25.623291015625, -24.7950439453125, -23.966796875, -23.1385498046875, -22.310302734375, -21.4820556640625, -20.65380859375, -19.8255615234375, -18.997314453125, -18.1690673828125, -17.3408203125, -16.5125732421875, -15.684326171875, -14.8560791015625, -14.02783203125, -13.1995849609375, -12.371337890625, -11.5430908203125, -10.71484375, -9.8865966796875, -9.058349609375, -8.2301025390625, -7.40185546875, -6.5736083984375, -5.745361328125, -4.9171142578125, -4.0888671875, -3.2606201171875, -2.432373046875, -1.6041259765625, -0.77587890625, 0.0523681640625, 0.880615234375, 1.7088623046875, 2.537109375, 3.3653564453125, 4.193603515625, 5.0218505859375, 5.85009765625, 6.6783447265625, 7.506591796875, 8.3348388671875, 9.1630859375, 9.9913330078125, 10.819580078125, 11.6478271484375, 12.47607421875, 13.3043212890625, 14.132568359375, 14.9608154296875, 15.7890625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 9.0, 5.0, 6.0, 10.0, 9.0, 14.0, 23.0, 24.0, 28.0, 29.0, 41.0, 46.0, 46.0, 53.0, 67.0, 69.0, 64.0, 57.0, 61.0, 46.0, 56.0, 52.0, 40.0, 25.0, 29.0, 26.0, 18.0, 15.0, 9.0, 8.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5667724609375, -8.250732421875, -7.9346923828125, -7.61865234375, -7.3026123046875, -6.986572265625, -6.6705322265625, -6.3544921875, -6.0384521484375, -5.722412109375, -5.4063720703125, -5.09033203125, -4.7742919921875, -4.458251953125, -4.1422119140625, -3.826171875, -3.5101318359375, -3.194091796875, -2.8780517578125, -2.56201171875, -2.2459716796875, -1.929931640625, -1.6138916015625, -1.2978515625, -0.9818115234375, -0.665771484375, -0.3497314453125, -0.03369140625, 0.2823486328125, 0.598388671875, 0.9144287109375, 1.23046875, 1.5465087890625, 1.862548828125, 2.1785888671875, 2.49462890625, 2.8106689453125, 3.126708984375, 3.4427490234375, 3.7587890625, 4.0748291015625, 4.390869140625, 4.7069091796875, 5.02294921875, 5.3389892578125, 5.655029296875, 5.9710693359375, 6.287109375, 6.6031494140625, 6.919189453125, 7.2352294921875, 7.55126953125, 7.8673095703125, 8.183349609375, 8.4993896484375, 8.8154296875, 9.1314697265625, 9.447509765625, 9.7635498046875, 10.07958984375, 10.3956298828125, 10.711669921875, 11.0277099609375, 11.34375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 12.0, 15.0, 27.0, 33.0, 47.0, 81.0, 125.0, 206.0, 418.0, 732.0, 1675.0, 4915.0, 24656.0, 299745.0, 3252714.0, 561666.0, 37168.0, 6204.0, 1988.0, 816.0, 398.0, 231.0, 148.0, 88.0, 51.0, 31.0, 29.0, 15.0, 13.0, 11.0, 3.0, 8.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.408203125, -8.97265625, -8.537109375, -8.1015625, -7.666015625, -7.23046875, -6.794921875, -6.359375, -5.923828125, -5.48828125, -5.052734375, -4.6171875, -4.181640625, -3.74609375, -3.310546875, -2.875, -2.439453125, -2.00390625, -1.568359375, -1.1328125, -0.697265625, -0.26171875, 0.173828125, 0.609375, 1.044921875, 1.48046875, 1.916015625, 2.3515625, 2.787109375, 3.22265625, 3.658203125, 4.09375, 4.529296875, 4.96484375, 5.400390625, 5.8359375, 6.271484375, 6.70703125, 7.142578125, 7.578125, 8.013671875, 8.44921875, 8.884765625, 9.3203125, 9.755859375, 10.19140625, 10.626953125, 11.0625, 11.498046875, 11.93359375, 12.369140625, 12.8046875, 13.240234375, 13.67578125, 14.111328125, 14.546875, 14.982421875, 15.41796875, 15.853515625, 16.2890625, 16.724609375, 17.16015625, 17.595703125, 18.03125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 9.0, 12.0, 18.0, 24.0, 27.0, 34.0, 45.0, 63.0, 108.0, 114.0, 159.0, 227.0, 288.0, 376.0, 433.0, 445.0, 388.0, 322.0, 240.0, 207.0, 124.0, 98.0, 75.0, 66.0, 33.0, 26.0, 22.0, 10.0, 10.0, 18.0, 7.0, 3.0, 3.0, 8.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.720703125, -2.626922607421875, -2.53314208984375, -2.439361572265625, -2.3455810546875, -2.251800537109375, -2.15802001953125, -2.064239501953125, -1.970458984375, -1.876678466796875, -1.78289794921875, -1.689117431640625, -1.5953369140625, -1.501556396484375, -1.40777587890625, -1.313995361328125, -1.22021484375, -1.126434326171875, -1.03265380859375, -0.938873291015625, -0.8450927734375, -0.751312255859375, -0.65753173828125, -0.563751220703125, -0.469970703125, -0.376190185546875, -0.28240966796875, -0.188629150390625, -0.0948486328125, -0.001068115234375, 0.09271240234375, 0.186492919921875, 0.2802734375, 0.374053955078125, 0.46783447265625, 0.561614990234375, 0.6553955078125, 0.749176025390625, 0.84295654296875, 0.936737060546875, 1.030517578125, 1.124298095703125, 1.21807861328125, 1.311859130859375, 1.4056396484375, 1.499420166015625, 1.59320068359375, 1.686981201171875, 1.78076171875, 1.874542236328125, 1.96832275390625, 2.062103271484375, 2.1558837890625, 2.249664306640625, 2.34344482421875, 2.437225341796875, 2.531005859375, 2.624786376953125, 2.71856689453125, 2.812347412109375, 2.9061279296875, 2.999908447265625, 3.09368896484375, 3.187469482421875, 3.28125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 8.0, 16.0, 36.0, 50.0, 89.0, 103.0, 144.0, 139.0, 135.0, 104.0, 72.0, 34.0, 32.0, 16.0, 9.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.68461799621582, -30.03406524658203, -29.383512496948242, -28.732959747314453, -28.082406997680664, -27.431854248046875, -26.781301498413086, -26.130748748779297, -25.480194091796875, -24.829641342163086, -24.179088592529297, -23.528535842895508, -22.87798309326172, -22.22743034362793, -21.57687759399414, -20.92632293701172, -20.275772094726562, -19.625219345092773, -18.974666595458984, -18.324113845825195, -17.673561096191406, -17.023008346557617, -16.372455596923828, -15.721901893615723, -15.071349143981934, -14.420796394348145, -13.770243644714355, -13.119690895080566, -12.469137191772461, -11.818584442138672, -11.168031692504883, -10.517478942871094, -9.866926193237305, -9.216373443603516, -8.565820693969727, -7.915267467498779, -7.26471471786499, -6.614161968231201, -5.963608741760254, -5.313055992126465, -4.662503242492676, -4.011950492858887, -3.3613975048065186, -2.7108445167541504, -2.0602917671203613, -1.4097390174865723, -0.7591860294342041, -0.10863304138183594, 0.5419197082519531, 1.1924725770950317, 1.8430254459381104, 2.4935784339904785, 3.1441311836242676, 3.7946839332580566, 4.445237159729004, 5.095789909362793, 5.746342658996582, 6.396895408630371, 7.04744815826416, 7.698001384735107, 8.348554611206055, 8.999107360839844, 9.649660110473633, 10.300212860107422, 10.950765609741211]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 14.0, 13.0, 12.0, 21.0, 29.0, 19.0, 32.0, 40.0, 41.0, 46.0, 43.0, 47.0, 44.0, 47.0, 58.0, 51.0, 50.0, 59.0, 45.0, 43.0, 40.0, 45.0, 34.0, 18.0, 21.0, 17.0, 14.0, 15.0, 6.0, 7.0, 7.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.23513412475586, -9.909123420715332, -9.583112716674805, -9.257102966308594, -8.931092262268066, -8.605081558227539, -8.279071807861328, -7.953061103820801, -7.627050399780273, -7.301039695739746, -6.975029468536377, -6.649019241333008, -6.3230085372924805, -5.996997833251953, -5.670987606048584, -5.344977378845215, -5.0189666748046875, -4.69295597076416, -4.366945743560791, -4.040935516357422, -3.7149248123168945, -3.3889143466949463, -3.062903881072998, -2.73689341545105, -2.4108829498291016, -2.0848724842071533, -1.758862018585205, -1.4328515529632568, -1.1068410873413086, -0.7808306217193604, -0.4548201560974121, -0.12880969047546387, 0.19720172882080078, 0.523212194442749, 0.8492226600646973, 1.1752331256866455, 1.5012435913085938, 1.827254056930542, 2.1532645225524902, 2.4792749881744385, 2.8052854537963867, 3.131295919418335, 3.457306385040283, 3.7833168506622314, 4.10932731628418, 4.435338020324707, 4.761348247528076, 5.087358474731445, 5.413369178771973, 5.7393798828125, 6.065390110015869, 6.391400337219238, 6.717411041259766, 7.043421745300293, 7.369431972503662, 7.695442199707031, 8.021452903747559, 8.347463607788086, 8.673473358154297, 8.999484062194824, 9.325494766235352, 9.651505470275879, 9.977516174316406, 10.303525924682617, 10.629536628723145]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 20.0, 28.0, 32.0, 66.0, 94.0, 161.0, 240.0, 533.0, 1327.0, 3599.0, 11184.0, 40228.0, 160381.0, 421453.0, 296293.0, 81782.0, 20804.0, 6315.0, 2183.0, 855.0, 407.0, 183.0, 122.0, 78.0, 54.0, 33.0, 20.0, 11.0, 16.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.9175872802734375, -1.845916748046875, -1.7742462158203125, -1.70257568359375, -1.6309051513671875, -1.559234619140625, -1.4875640869140625, -1.4158935546875, -1.3442230224609375, -1.272552490234375, -1.2008819580078125, -1.12921142578125, -1.0575408935546875, -0.985870361328125, -0.9141998291015625, -0.842529296875, -0.7708587646484375, -0.699188232421875, -0.6275177001953125, -0.55584716796875, -0.4841766357421875, -0.412506103515625, -0.3408355712890625, -0.2691650390625, -0.1974945068359375, -0.125823974609375, -0.0541534423828125, 0.01751708984375, 0.0891876220703125, 0.160858154296875, 0.2325286865234375, 0.30419921875, 0.3758697509765625, 0.447540283203125, 0.5192108154296875, 0.59088134765625, 0.6625518798828125, 0.734222412109375, 0.8058929443359375, 0.8775634765625, 0.9492340087890625, 1.020904541015625, 1.0925750732421875, 1.16424560546875, 1.2359161376953125, 1.307586669921875, 1.3792572021484375, 1.450927734375, 1.5225982666015625, 1.594268798828125, 1.6659393310546875, 1.73760986328125, 1.8092803955078125, 1.880950927734375, 1.9526214599609375, 2.0242919921875, 2.0959625244140625, 2.167633056640625, 2.2393035888671875, 2.31097412109375, 2.3826446533203125, 2.454315185546875, 2.5259857177734375, 2.59765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 9.0, 11.0, 20.0, 17.0, 22.0, 39.0, 49.0, 43.0, 69.0, 59.0, 72.0, 69.0, 86.0, 80.0, 67.0, 63.0, 46.0, 53.0, 32.0, 34.0, 14.0, 15.0, 10.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.912353515625, -10.59033203125, -10.268310546875, -9.9462890625, -9.624267578125, -9.30224609375, -8.980224609375, -8.658203125, -8.336181640625, -8.01416015625, -7.692138671875, -7.3701171875, -7.048095703125, -6.72607421875, -6.404052734375, -6.08203125, -5.760009765625, -5.43798828125, -5.115966796875, -4.7939453125, -4.471923828125, -4.14990234375, -3.827880859375, -3.505859375, -3.183837890625, -2.86181640625, -2.539794921875, -2.2177734375, -1.895751953125, -1.57373046875, -1.251708984375, -0.9296875, -0.607666015625, -0.28564453125, 0.036376953125, 0.3583984375, 0.680419921875, 1.00244140625, 1.324462890625, 1.646484375, 1.968505859375, 2.29052734375, 2.612548828125, 2.9345703125, 3.256591796875, 3.57861328125, 3.900634765625, 4.22265625, 4.544677734375, 4.86669921875, 5.188720703125, 5.5107421875, 5.832763671875, 6.15478515625, 6.476806640625, 6.798828125, 7.120849609375, 7.44287109375, 7.764892578125, 8.0869140625, 8.408935546875, 8.73095703125, 9.052978515625, 9.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 12.0, 17.0, 13.0, 22.0, 34.0, 49.0, 55.0, 97.0, 132.0, 207.0, 329.0, 513.0, 852.0, 1420.0, 2314.0, 3931.0, 7104.0, 12635.0, 23338.0, 43437.0, 78165.0, 130173.0, 184805.0, 196461.0, 151109.0, 94001.0, 52534.0, 28664.0, 15680.0, 8593.0, 4776.0, 2804.0, 1585.0, 981.0, 594.0, 414.0, 235.0, 162.0, 107.0, 64.0, 37.0, 37.0, 15.0, 14.0, 12.0, 12.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.943359375, -0.9149169921875, -0.886474609375, -0.8580322265625, -0.82958984375, -0.8011474609375, -0.772705078125, -0.7442626953125, -0.7158203125, -0.6873779296875, -0.658935546875, -0.6304931640625, -0.60205078125, -0.5736083984375, -0.545166015625, -0.5167236328125, -0.48828125, -0.4598388671875, -0.431396484375, -0.4029541015625, -0.37451171875, -0.3460693359375, -0.317626953125, -0.2891845703125, -0.2607421875, -0.2322998046875, -0.203857421875, -0.1754150390625, -0.14697265625, -0.1185302734375, -0.090087890625, -0.0616455078125, -0.033203125, -0.0047607421875, 0.023681640625, 0.0521240234375, 0.08056640625, 0.1090087890625, 0.137451171875, 0.1658935546875, 0.1943359375, 0.2227783203125, 0.251220703125, 0.2796630859375, 0.30810546875, 0.3365478515625, 0.364990234375, 0.3934326171875, 0.421875, 0.4503173828125, 0.478759765625, 0.5072021484375, 0.53564453125, 0.5640869140625, 0.592529296875, 0.6209716796875, 0.6494140625, 0.6778564453125, 0.706298828125, 0.7347412109375, 0.76318359375, 0.7916259765625, 0.820068359375, 0.8485107421875, 0.876953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 3.0, 7.0, 11.0, 7.0, 11.0, 10.0, 9.0, 17.0, 19.0, 25.0, 29.0, 30.0, 30.0, 36.0, 39.0, 34.0, 33.0, 41.0, 40.0, 61.0, 48.0, 42.0, 55.0, 43.0, 38.0, 43.0, 36.0, 38.0, 30.0, 23.0, 11.0, 19.0, 22.0, 12.0, 6.0, 12.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.5078125, -13.1171875, -12.7265625, -12.3359375, -11.9453125, -11.5546875, -11.1640625, -10.7734375, -10.3828125, -9.9921875, -9.6015625, -9.2109375, -8.8203125, -8.4296875, -8.0390625, -7.6484375, -7.2578125, -6.8671875, -6.4765625, -6.0859375, -5.6953125, -5.3046875, -4.9140625, -4.5234375, -4.1328125, -3.7421875, -3.3515625, -2.9609375, -2.5703125, -2.1796875, -1.7890625, -1.3984375, -1.0078125, -0.6171875, -0.2265625, 0.1640625, 0.5546875, 0.9453125, 1.3359375, 1.7265625, 2.1171875, 2.5078125, 2.8984375, 3.2890625, 3.6796875, 4.0703125, 4.4609375, 4.8515625, 5.2421875, 5.6328125, 6.0234375, 6.4140625, 6.8046875, 7.1953125, 7.5859375, 7.9765625, 8.3671875, 8.7578125, 9.1484375, 9.5390625, 9.9296875, 10.3203125, 10.7109375, 11.1015625, 11.4921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 5.0, 9.0, 5.0, 6.0, 20.0, 30.0, 40.0, 65.0, 76.0, 129.0, 184.0, 252.0, 459.0, 723.0, 1315.0, 2367.0, 5472.0, 14818.0, 46770.0, 155757.0, 355321.0, 301527.0, 110433.0, 33060.0, 10880.0, 4060.0, 1938.0, 1053.0, 605.0, 409.0, 255.0, 136.0, 124.0, 75.0, 42.0, 38.0, 18.0, 27.0, 15.0, 13.0, 9.0, 0.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.31134796142578125, -0.3009185791015625, -0.29048919677734375, -0.280059814453125, -0.26963043212890625, -0.2592010498046875, -0.24877166748046875, -0.23834228515625, -0.22791290283203125, -0.2174835205078125, -0.20705413818359375, -0.196624755859375, -0.18619537353515625, -0.1757659912109375, -0.16533660888671875, -0.1549072265625, -0.14447784423828125, -0.1340484619140625, -0.12361907958984375, -0.113189697265625, -0.10276031494140625, -0.0923309326171875, -0.08190155029296875, -0.07147216796875, -0.06104278564453125, -0.0506134033203125, -0.04018402099609375, -0.029754638671875, -0.01932525634765625, -0.0088958740234375, 0.00153350830078125, 0.011962890625, 0.02239227294921875, 0.0328216552734375, 0.04325103759765625, 0.053680419921875, 0.06410980224609375, 0.0745391845703125, 0.08496856689453125, 0.09539794921875, 0.10582733154296875, 0.1162567138671875, 0.12668609619140625, 0.137115478515625, 0.14754486083984375, 0.1579742431640625, 0.16840362548828125, 0.1788330078125, 0.18926239013671875, 0.1996917724609375, 0.21012115478515625, 0.220550537109375, 0.23097991943359375, 0.2414093017578125, 0.25183868408203125, 0.26226806640625, 0.27269744873046875, 0.2831268310546875, 0.29355621337890625, 0.303985595703125, 0.31441497802734375, 0.3248443603515625, 0.33527374267578125, 0.345703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 11.0, 14.0, 24.0, 43.0, 50.0, 81.0, 98.0, 124.0, 130.0, 125.0, 92.0, 63.0, 52.0, 31.0, 25.0, 20.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026679039001464844, -0.0002580583095550537, -0.000249326229095459, -0.00024059414863586426, -0.00023186206817626953, -0.0002231299877166748, -0.00021439790725708008, -0.00020566582679748535, -0.00019693374633789062, -0.0001882016658782959, -0.00017946958541870117, -0.00017073750495910645, -0.00016200542449951172, -0.000153273344039917, -0.00014454126358032227, -0.00013580918312072754, -0.0001270771026611328, -0.00011834502220153809, -0.00010961294174194336, -0.00010088086128234863, -9.21487808227539e-05, -8.341670036315918e-05, -7.468461990356445e-05, -6.595253944396973e-05, -5.7220458984375e-05, -4.8488378524780273e-05, -3.975629806518555e-05, -3.102421760559082e-05, -2.2292137145996094e-05, -1.3560056686401367e-05, -4.827976226806641e-06, 3.904104232788086e-06, 1.2636184692382812e-05, 2.136826515197754e-05, 3.0100345611572266e-05, 3.883242607116699e-05, 4.756450653076172e-05, 5.6296586990356445e-05, 6.502866744995117e-05, 7.37607479095459e-05, 8.249282836914062e-05, 9.122490882873535e-05, 9.995698928833008e-05, 0.0001086890697479248, 0.00011742115020751953, 0.00012615323066711426, 0.00013488531112670898, 0.0001436173915863037, 0.00015234947204589844, 0.00016108155250549316, 0.0001698136329650879, 0.00017854571342468262, 0.00018727779388427734, 0.00019600987434387207, 0.0002047419548034668, 0.00021347403526306152, 0.00022220611572265625, 0.00023093819618225098, 0.0002396702766418457, 0.00024840235710144043, 0.00025713443756103516, 0.0002658665180206299, 0.0002745985984802246, 0.00028333067893981934, 0.00029206275939941406]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 9.0, 13.0, 16.0, 18.0, 29.0, 33.0, 41.0, 61.0, 101.0, 127.0, 245.0, 362.0, 681.0, 1675.0, 4383.0, 13407.0, 43223.0, 130633.0, 288224.0, 315756.0, 164680.0, 56948.0, 18021.0, 5769.0, 2046.0, 853.0, 414.0, 249.0, 163.0, 102.0, 85.0, 49.0, 34.0, 31.0, 18.0, 14.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.324462890625, -0.3157215118408203, -0.3069801330566406, -0.29823875427246094, -0.28949737548828125, -0.28075599670410156, -0.2720146179199219, -0.2632732391357422, -0.2545318603515625, -0.2457904815673828, -0.23704910278320312, -0.22830772399902344, -0.21956634521484375, -0.21082496643066406, -0.20208358764648438, -0.1933422088623047, -0.184600830078125, -0.1758594512939453, -0.16711807250976562, -0.15837669372558594, -0.14963531494140625, -0.14089393615722656, -0.13215255737304688, -0.12341117858886719, -0.1146697998046875, -0.10592842102050781, -0.09718704223632812, -0.08844566345214844, -0.07970428466796875, -0.07096290588378906, -0.062221527099609375, -0.05348014831542969, -0.04473876953125, -0.03599739074707031, -0.027256011962890625, -0.018514633178710938, -0.00977325439453125, -0.0010318756103515625, 0.007709503173828125, 0.016450881958007812, 0.0251922607421875, 0.03393363952636719, 0.042675018310546875, 0.05141639709472656, 0.06015777587890625, 0.06889915466308594, 0.07764053344726562, 0.08638191223144531, 0.095123291015625, 0.10386466979980469, 0.11260604858398438, 0.12134742736816406, 0.13008880615234375, 0.13883018493652344, 0.14757156372070312, 0.1563129425048828, 0.1650543212890625, 0.1737957000732422, 0.18253707885742188, 0.19127845764160156, 0.20001983642578125, 0.20876121520996094, 0.21750259399414062, 0.2262439727783203, 0.2349853515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 8.0, 17.0, 19.0, 24.0, 12.0, 27.0, 21.0, 35.0, 36.0, 36.0, 41.0, 65.0, 53.0, 63.0, 56.0, 66.0, 37.0, 53.0, 48.0, 39.0, 46.0, 34.0, 21.0, 26.0, 29.0, 24.0, 9.0, 13.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08251953125, -0.07959747314453125, -0.0766754150390625, -0.07375335693359375, -0.070831298828125, -0.06790924072265625, -0.0649871826171875, -0.06206512451171875, -0.05914306640625, -0.05622100830078125, -0.0532989501953125, -0.05037689208984375, -0.047454833984375, -0.04453277587890625, -0.0416107177734375, -0.03868865966796875, -0.0357666015625, -0.03284454345703125, -0.0299224853515625, -0.02700042724609375, -0.024078369140625, -0.02115631103515625, -0.0182342529296875, -0.01531219482421875, -0.01239013671875, -0.00946807861328125, -0.0065460205078125, -0.00362396240234375, -0.000701904296875, 0.00222015380859375, 0.0051422119140625, 0.00806427001953125, 0.010986328125, 0.01390838623046875, 0.0168304443359375, 0.01975250244140625, 0.022674560546875, 0.02559661865234375, 0.0285186767578125, 0.03144073486328125, 0.03436279296875, 0.03728485107421875, 0.0402069091796875, 0.04312896728515625, 0.046051025390625, 0.04897308349609375, 0.0518951416015625, 0.05481719970703125, 0.0577392578125, 0.06066131591796875, 0.0635833740234375, 0.06650543212890625, 0.069427490234375, 0.07234954833984375, 0.0752716064453125, 0.07819366455078125, 0.08111572265625, 0.08403778076171875, 0.0869598388671875, 0.08988189697265625, 0.092803955078125, 0.09572601318359375, 0.0986480712890625, 0.10157012939453125, 0.1044921875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 32.0, 104.0, 244.0, 328.0, 186.0, 69.0, 22.0, 6.0, 5.0, 1.0, 1.0, 2.0], "bins": [-49.059749603271484, -48.172054290771484, -47.28435516357422, -46.39665985107422, -45.50896453857422, -44.62126922607422, -43.73357009887695, -42.84587478637695, -41.95817565917969, -41.07048034667969, -40.18278121948242, -39.29508590698242, -38.40739059448242, -37.519691467285156, -36.631996154785156, -35.744300842285156, -34.856605529785156, -33.968910217285156, -33.08121109008789, -32.19351577758789, -31.30582046508789, -30.418123245239258, -29.530426025390625, -28.642730712890625, -27.755033493041992, -26.86733627319336, -25.97964096069336, -25.091943740844727, -24.204246520996094, -23.316551208496094, -22.42885398864746, -21.541156768798828, -20.653461456298828, -19.765764236450195, -18.878068923950195, -17.990371704101562, -17.102676391601562, -16.21497917175293, -15.327281951904297, -14.43958568572998, -13.551889419555664, -12.664193153381348, -11.776496887207031, -10.888799667358398, -10.001103401184082, -9.113407135009766, -8.225709915161133, -7.338013648986816, -6.4503173828125, -5.562621116638184, -4.674924373626709, -3.7872278690338135, -2.899531364440918, -2.0118350982666016, -1.124138355255127, -0.23644161224365234, 0.6512546539306641, 1.5389511585235596, 2.426647663116455, 3.3143441677093506, 4.202040672302246, 5.0897369384765625, 5.977433681488037, 6.865130424499512, 7.752826690673828]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 9.0, 14.0, 13.0, 18.0, 34.0, 35.0, 42.0, 54.0, 59.0, 69.0, 61.0, 64.0, 87.0, 67.0, 75.0, 60.0, 52.0, 54.0, 33.0, 23.0, 26.0, 16.0, 13.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.054313659667969, -8.752047538757324, -8.449780464172363, -8.147514343261719, -7.845247268676758, -7.542980670928955, -7.240714073181152, -6.938447952270508, -6.636180877685547, -6.333914279937744, -6.031647682189941, -5.729381084442139, -5.427114486694336, -5.124847888946533, -4.8225812911987305, -4.520315170288086, -4.218048572540283, -3.9157819747924805, -3.6135153770446777, -3.311248779296875, -3.0089821815490723, -2.7067155838012695, -2.404449224472046, -2.102182626724243, -1.7999160289764404, -1.4976494312286377, -1.195382833480835, -0.8931163549423218, -0.590849757194519, -0.2885831594467163, 0.013683319091796875, 0.3159499168395996, 0.6182165145874023, 0.9204831123352051, 1.2227497100830078, 1.525016188621521, 1.8272827863693237, 2.129549503326416, 2.4318158626556396, 2.7340824604034424, 3.036349058151245, 3.338615655899048, 3.6408822536468506, 3.943148612976074, 4.245415210723877, 4.54768180847168, 4.849948406219482, 5.152215003967285, 5.454481601715088, 5.756748199462891, 6.059014797210693, 6.361281394958496, 6.663547992706299, 6.965814590454102, 7.268080711364746, 7.570347785949707, 7.872613906860352, 8.174880027770996, 8.477147102355957, 8.779413223266602, 9.081680297851562, 9.383946418762207, 9.686213493347168, 9.988479614257812, 10.290746688842773]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 6.0, 4.0, 3.0, 3.0, 9.0, 11.0, 14.0, 15.0, 35.0, 53.0, 86.0, 176.0, 308.0, 565.0, 1082.0, 2248.0, 4902.0, 11320.0, 27936.0, 70567.0, 205458.0, 451202.0, 170057.0, 60618.0, 23459.0, 9944.0, 4293.0, 2038.0, 920.0, 478.0, 306.0, 157.0, 82.0, 50.0, 46.0, 32.0, 17.0, 13.0, 9.0, 1.0, 7.0, 6.0, 1.0, 9.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.61236572265625, -5.4278564453125, -5.24334716796875, -5.058837890625, -4.87432861328125, -4.6898193359375, -4.50531005859375, -4.32080078125, -4.13629150390625, -3.9517822265625, -3.76727294921875, -3.582763671875, -3.39825439453125, -3.2137451171875, -3.02923583984375, -2.8447265625, -2.66021728515625, -2.4757080078125, -2.29119873046875, -2.106689453125, -1.92218017578125, -1.7376708984375, -1.55316162109375, -1.36865234375, -1.18414306640625, -0.9996337890625, -0.81512451171875, -0.630615234375, -0.44610595703125, -0.2615966796875, -0.07708740234375, 0.107421875, 0.29193115234375, 0.4764404296875, 0.66094970703125, 0.845458984375, 1.02996826171875, 1.2144775390625, 1.39898681640625, 1.58349609375, 1.76800537109375, 1.9525146484375, 2.13702392578125, 2.321533203125, 2.50604248046875, 2.6905517578125, 2.87506103515625, 3.0595703125, 3.24407958984375, 3.4285888671875, 3.61309814453125, 3.797607421875, 3.98211669921875, 4.1666259765625, 4.35113525390625, 4.53564453125, 4.72015380859375, 4.9046630859375, 5.08917236328125, 5.273681640625, 5.45819091796875, 5.6427001953125, 5.82720947265625, 6.01171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 10.0, 5.0, 13.0, 17.0, 15.0, 27.0, 27.0, 35.0, 46.0, 41.0, 46.0, 47.0, 45.0, 49.0, 65.0, 56.0, 56.0, 45.0, 41.0, 53.0, 43.0, 42.0, 27.0, 30.0, 24.0, 18.0, 11.0, 14.0, 14.0, 8.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7265625, -12.31494140625, -11.9033203125, -11.49169921875, -11.080078125, -10.66845703125, -10.2568359375, -9.84521484375, -9.43359375, -9.02197265625, -8.6103515625, -8.19873046875, -7.787109375, -7.37548828125, -6.9638671875, -6.55224609375, -6.140625, -5.72900390625, -5.3173828125, -4.90576171875, -4.494140625, -4.08251953125, -3.6708984375, -3.25927734375, -2.84765625, -2.43603515625, -2.0244140625, -1.61279296875, -1.201171875, -0.78955078125, -0.3779296875, 0.03369140625, 0.4453125, 0.85693359375, 1.2685546875, 1.68017578125, 2.091796875, 2.50341796875, 2.9150390625, 3.32666015625, 3.73828125, 4.14990234375, 4.5615234375, 4.97314453125, 5.384765625, 5.79638671875, 6.2080078125, 6.61962890625, 7.03125, 7.44287109375, 7.8544921875, 8.26611328125, 8.677734375, 9.08935546875, 9.5009765625, 9.91259765625, 10.32421875, 10.73583984375, 11.1474609375, 11.55908203125, 11.970703125, 12.38232421875, 12.7939453125, 13.20556640625, 13.6171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 3.0, 8.0, 6.0, 8.0, 11.0, 16.0, 29.0, 26.0, 26.0, 42.0, 65.0, 57.0, 112.0, 114.0, 193.0, 333.0, 722.0, 2428.0, 13724.0, 113933.0, 741439.0, 152620.0, 17710.0, 2953.0, 861.0, 321.0, 224.0, 149.0, 85.0, 70.0, 51.0, 48.0, 37.0, 33.0, 13.0, 17.0, 15.0, 9.0, 8.0, 8.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.75, -12.381103515625, -12.01220703125, -11.643310546875, -11.2744140625, -10.905517578125, -10.53662109375, -10.167724609375, -9.798828125, -9.429931640625, -9.06103515625, -8.692138671875, -8.3232421875, -7.954345703125, -7.58544921875, -7.216552734375, -6.84765625, -6.478759765625, -6.10986328125, -5.740966796875, -5.3720703125, -5.003173828125, -4.63427734375, -4.265380859375, -3.896484375, -3.527587890625, -3.15869140625, -2.789794921875, -2.4208984375, -2.052001953125, -1.68310546875, -1.314208984375, -0.9453125, -0.576416015625, -0.20751953125, 0.161376953125, 0.5302734375, 0.899169921875, 1.26806640625, 1.636962890625, 2.005859375, 2.374755859375, 2.74365234375, 3.112548828125, 3.4814453125, 3.850341796875, 4.21923828125, 4.588134765625, 4.95703125, 5.325927734375, 5.69482421875, 6.063720703125, 6.4326171875, 6.801513671875, 7.17041015625, 7.539306640625, 7.908203125, 8.277099609375, 8.64599609375, 9.014892578125, 9.3837890625, 9.752685546875, 10.12158203125, 10.490478515625, 10.859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 3.0, 6.0, 7.0, 11.0, 12.0, 8.0, 25.0, 22.0, 27.0, 21.0, 29.0, 34.0, 40.0, 38.0, 34.0, 34.0, 39.0, 53.0, 51.0, 63.0, 52.0, 44.0, 31.0, 37.0, 38.0, 29.0, 27.0, 25.0, 20.0, 23.0, 16.0, 7.0, 11.0, 20.0, 6.0, 12.0, 9.0, 8.0, 8.0, 8.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.09375, -14.6484375, -14.203125, -13.7578125, -13.3125, -12.8671875, -12.421875, -11.9765625, -11.53125, -11.0859375, -10.640625, -10.1953125, -9.75, -9.3046875, -8.859375, -8.4140625, -7.96875, -7.5234375, -7.078125, -6.6328125, -6.1875, -5.7421875, -5.296875, -4.8515625, -4.40625, -3.9609375, -3.515625, -3.0703125, -2.625, -2.1796875, -1.734375, -1.2890625, -0.84375, -0.3984375, 0.046875, 0.4921875, 0.9375, 1.3828125, 1.828125, 2.2734375, 2.71875, 3.1640625, 3.609375, 4.0546875, 4.5, 4.9453125, 5.390625, 5.8359375, 6.28125, 6.7265625, 7.171875, 7.6171875, 8.0625, 8.5078125, 8.953125, 9.3984375, 9.84375, 10.2890625, 10.734375, 11.1796875, 11.625, 12.0703125, 12.515625, 12.9609375, 13.40625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 6.0, 9.0, 14.0, 23.0, 29.0, 71.0, 239.0, 1073.0, 11968.0, 1009556.0, 23773.0, 1373.0, 261.0, 86.0, 26.0, 20.0, 12.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.337158203125, -12.90087890625, -12.464599609375, -12.0283203125, -11.592041015625, -11.15576171875, -10.719482421875, -10.283203125, -9.846923828125, -9.41064453125, -8.974365234375, -8.5380859375, -8.101806640625, -7.66552734375, -7.229248046875, -6.79296875, -6.356689453125, -5.92041015625, -5.484130859375, -5.0478515625, -4.611572265625, -4.17529296875, -3.739013671875, -3.302734375, -2.866455078125, -2.43017578125, -1.993896484375, -1.5576171875, -1.121337890625, -0.68505859375, -0.248779296875, 0.1875, 0.623779296875, 1.06005859375, 1.496337890625, 1.9326171875, 2.368896484375, 2.80517578125, 3.241455078125, 3.677734375, 4.114013671875, 4.55029296875, 4.986572265625, 5.4228515625, 5.859130859375, 6.29541015625, 6.731689453125, 7.16796875, 7.604248046875, 8.04052734375, 8.476806640625, 8.9130859375, 9.349365234375, 9.78564453125, 10.221923828125, 10.658203125, 11.094482421875, 11.53076171875, 11.967041015625, 12.4033203125, 12.839599609375, 13.27587890625, 13.712158203125, 14.1484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 13.0, 19.0, 25.0, 39.0, 59.0, 74.0, 123.0, 189.0, 157.0, 106.0, 64.0, 45.0, 35.0, 17.0, 16.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006299018859863281, -0.0006035193800926208, -0.0005771368741989136, -0.0005507543683052063, -0.000524371862411499, -0.0004979893565177917, -0.00047160685062408447, -0.0004452243447303772, -0.0004188418388366699, -0.00039245933294296265, -0.00036607682704925537, -0.0003396943211555481, -0.0003133118152618408, -0.00028692930936813354, -0.00026054680347442627, -0.000234164297580719, -0.00020778179168701172, -0.00018139928579330444, -0.00015501677989959717, -0.0001286342740058899, -0.00010225176811218262, -7.586926221847534e-05, -4.9486756324768066e-05, -2.310425043106079e-05, 3.2782554626464844e-06, 2.966076135635376e-05, 5.6043267250061035e-05, 8.242577314376831e-05, 0.00010880827903747559, 0.00013519078493118286, 0.00016157329082489014, 0.0001879557967185974, 0.0002143383026123047, 0.00024072080850601196, 0.00026710331439971924, 0.0002934858202934265, 0.0003198683261871338, 0.00034625083208084106, 0.00037263333797454834, 0.0003990158438682556, 0.0004253983497619629, 0.00045178085565567017, 0.00047816336154937744, 0.0005045458674430847, 0.000530928373336792, 0.0005573108792304993, 0.0005836933851242065, 0.0006100758910179138, 0.0006364583969116211, 0.0006628409028053284, 0.0006892234086990356, 0.0007156059145927429, 0.0007419884204864502, 0.0007683709263801575, 0.0007947534322738647, 0.000821135938167572, 0.0008475184440612793, 0.0008739009499549866, 0.0009002834558486938, 0.0009266659617424011, 0.0009530484676361084, 0.0009794309735298157, 0.001005813479423523, 0.0010321959853172302, 0.0010585784912109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 10.0, 18.0, 22.0, 31.0, 74.0, 144.0, 439.0, 1732.0, 13593.0, 937181.0, 90755.0, 3405.0, 722.0, 224.0, 91.0, 38.0, 22.0, 16.0, 9.0, 8.0, 3.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.8515625, -10.4981689453125, -10.144775390625, -9.7913818359375, -9.43798828125, -9.0845947265625, -8.731201171875, -8.3778076171875, -8.0244140625, -7.6710205078125, -7.317626953125, -6.9642333984375, -6.61083984375, -6.2574462890625, -5.904052734375, -5.5506591796875, -5.197265625, -4.8438720703125, -4.490478515625, -4.1370849609375, -3.78369140625, -3.4302978515625, -3.076904296875, -2.7235107421875, -2.3701171875, -2.0167236328125, -1.663330078125, -1.3099365234375, -0.95654296875, -0.6031494140625, -0.249755859375, 0.1036376953125, 0.45703125, 0.8104248046875, 1.163818359375, 1.5172119140625, 1.87060546875, 2.2239990234375, 2.577392578125, 2.9307861328125, 3.2841796875, 3.6375732421875, 3.990966796875, 4.3443603515625, 4.69775390625, 5.0511474609375, 5.404541015625, 5.7579345703125, 6.111328125, 6.4647216796875, 6.818115234375, 7.1715087890625, 7.52490234375, 7.8782958984375, 8.231689453125, 8.5850830078125, 8.9384765625, 9.2918701171875, 9.645263671875, 9.9986572265625, 10.35205078125, 10.7054443359375, 11.058837890625, 11.4122314453125, 11.765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 6.0, 5.0, 22.0, 34.0, 39.0, 54.0, 90.0, 118.0, 158.0, 149.0, 90.0, 73.0, 34.0, 40.0, 28.0, 12.0, 8.0, 8.0, 4.0, 1.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.951171875, -2.87701416015625, -2.8028564453125, -2.72869873046875, -2.654541015625, -2.58038330078125, -2.5062255859375, -2.43206787109375, -2.35791015625, -2.28375244140625, -2.2095947265625, -2.13543701171875, -2.061279296875, -1.98712158203125, -1.9129638671875, -1.83880615234375, -1.7646484375, -1.69049072265625, -1.6163330078125, -1.54217529296875, -1.468017578125, -1.39385986328125, -1.3197021484375, -1.24554443359375, -1.17138671875, -1.09722900390625, -1.0230712890625, -0.94891357421875, -0.874755859375, -0.80059814453125, -0.7264404296875, -0.65228271484375, -0.578125, -0.50396728515625, -0.4298095703125, -0.35565185546875, -0.281494140625, -0.20733642578125, -0.1331787109375, -0.05902099609375, 0.01513671875, 0.08929443359375, 0.1634521484375, 0.23760986328125, 0.311767578125, 0.38592529296875, 0.4600830078125, 0.53424072265625, 0.6083984375, 0.68255615234375, 0.7567138671875, 0.83087158203125, 0.905029296875, 0.97918701171875, 1.0533447265625, 1.12750244140625, 1.20166015625, 1.27581787109375, 1.3499755859375, 1.42413330078125, 1.498291015625, 1.57244873046875, 1.6466064453125, 1.72076416015625, 1.794921875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 23.0, 85.0, 253.0, 343.0, 209.0, 60.0, 16.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.9179801940918, -33.958656311035156, -31.99933624267578, -30.04001235961914, -28.080690383911133, -26.121368408203125, -24.162044525146484, -22.202722549438477, -20.24340057373047, -18.28407859802246, -16.324756622314453, -14.365432739257812, -12.406110763549805, -10.446788787841797, -8.487465858459473, -6.528142929077148, -4.568820953369141, -2.6094985008239746, -0.6501760482788086, 1.3091464042663574, 3.2684688568115234, 5.227790832519531, 7.1871137619018555, 9.14643669128418, 11.105758666992188, 13.065080642700195, 15.02440357208252, 16.983726501464844, 18.94304847717285, 20.90237045288086, 22.8616943359375, 24.821016311645508, 26.78033447265625, 28.739656448364258, 30.698978424072266, 32.658302307128906, 34.61762237548828, 36.57694625854492, 38.53627014160156, 40.49559020996094, 42.45491409301758, 44.41423797607422, 46.373558044433594, 48.332881927490234, 50.292205810546875, 52.25152587890625, 54.21084976196289, 56.17017364501953, 58.129493713378906, 60.08881759643555, 62.04813766479492, 64.00746154785156, 65.96678161621094, 67.92610168457031, 69.88542938232422, 71.8447494506836, 73.8040771484375, 75.76339721679688, 77.72272491455078, 79.68204498291016, 81.64136505126953, 83.60069274902344, 85.56001281738281, 87.51933288574219, 89.47865295410156]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 11.0, 10.0, 8.0, 5.0, 10.0, 17.0, 14.0, 25.0, 18.0, 25.0, 29.0, 20.0, 35.0, 22.0, 35.0, 32.0, 36.0, 31.0, 33.0, 37.0, 41.0, 32.0, 41.0, 47.0, 34.0, 27.0, 49.0, 26.0, 33.0, 20.0, 26.0, 29.0, 23.0, 14.0, 11.0, 18.0, 14.0, 12.0, 7.0, 12.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0], "bins": [-19.992359161376953, -19.370800018310547, -18.74924087524414, -18.1276798248291, -17.506120681762695, -16.88456153869629, -16.263002395629883, -15.641443252563477, -15.019883155822754, -14.398324012756348, -13.776763916015625, -13.155204772949219, -12.533645629882812, -11.91208553314209, -11.290526390075684, -10.668966293334961, -10.047407150268555, -9.425848007202148, -8.804287910461426, -8.18272876739502, -7.561169147491455, -6.939609527587891, -6.318050384521484, -5.69649076461792, -5.0749311447143555, -4.453371524810791, -3.8318121433258057, -3.2102527618408203, -2.588693141937256, -1.9671335220336914, -1.345574140548706, -0.7240147590637207, -0.10245704650878906, 0.5191024541854858, 1.1406619548797607, 1.7622214555740356, 2.3837809562683105, 3.005340576171875, 3.6268999576568604, 4.248459339141846, 4.87001895904541, 5.491578578948975, 6.113138198852539, 6.734697341918945, 7.35625696182251, 7.977816581726074, 8.59937572479248, 9.220935821533203, 9.84249496459961, 10.464054107666016, 11.085614204406738, 11.707173347473145, 12.328733444213867, 12.950292587280273, 13.57185173034668, 14.193410873413086, 14.814970970153809, 15.436530113220215, 16.058090209960938, 16.679649353027344, 17.30120849609375, 17.922767639160156, 18.544328689575195, 19.1658878326416, 19.787446975708008]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 19.0, 31.0, 42.0, 74.0, 108.0, 150.0, 257.0, 549.0, 1512.0, 7812.0, 125710.0, 2901981.0, 1112174.0, 38905.0, 3347.0, 749.0, 347.0, 184.0, 99.0, 70.0, 53.0, 32.0, 26.0, 14.0, 4.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -16.98291015625, -16.3720703125, -15.76123046875, -15.150390625, -14.53955078125, -13.9287109375, -13.31787109375, -12.70703125, -12.09619140625, -11.4853515625, -10.87451171875, -10.263671875, -9.65283203125, -9.0419921875, -8.43115234375, -7.8203125, -7.20947265625, -6.5986328125, -5.98779296875, -5.376953125, -4.76611328125, -4.1552734375, -3.54443359375, -2.93359375, -2.32275390625, -1.7119140625, -1.10107421875, -0.490234375, 0.12060546875, 0.7314453125, 1.34228515625, 1.953125, 2.56396484375, 3.1748046875, 3.78564453125, 4.396484375, 5.00732421875, 5.6181640625, 6.22900390625, 6.83984375, 7.45068359375, 8.0615234375, 8.67236328125, 9.283203125, 9.89404296875, 10.5048828125, 11.11572265625, 11.7265625, 12.33740234375, 12.9482421875, 13.55908203125, 14.169921875, 14.78076171875, 15.3916015625, 16.00244140625, 16.61328125, 17.22412109375, 17.8349609375, 18.44580078125, 19.056640625, 19.66748046875, 20.2783203125, 20.88916015625, 21.5]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 5.0, 6.0, 6.0, 9.0, 6.0, 10.0, 11.0, 13.0, 19.0, 22.0, 33.0, 22.0, 39.0, 29.0, 44.0, 59.0, 59.0, 53.0, 67.0, 51.0, 51.0, 66.0, 55.0, 40.0, 35.0, 31.0, 37.0, 33.0, 27.0, 17.0, 13.0, 9.0, 7.0, 6.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.59375, -8.3145751953125, -8.035400390625, -7.7562255859375, -7.47705078125, -7.1978759765625, -6.918701171875, -6.6395263671875, -6.3603515625, -6.0811767578125, -5.802001953125, -5.5228271484375, -5.24365234375, -4.9644775390625, -4.685302734375, -4.4061279296875, -4.126953125, -3.8477783203125, -3.568603515625, -3.2894287109375, -3.01025390625, -2.7310791015625, -2.451904296875, -2.1727294921875, -1.8935546875, -1.6143798828125, -1.335205078125, -1.0560302734375, -0.77685546875, -0.4976806640625, -0.218505859375, 0.0606689453125, 0.33984375, 0.6190185546875, 0.898193359375, 1.1773681640625, 1.45654296875, 1.7357177734375, 2.014892578125, 2.2940673828125, 2.5732421875, 2.8524169921875, 3.131591796875, 3.4107666015625, 3.68994140625, 3.9691162109375, 4.248291015625, 4.5274658203125, 4.806640625, 5.0858154296875, 5.364990234375, 5.6441650390625, 5.92333984375, 6.2025146484375, 6.481689453125, 6.7608642578125, 7.0400390625, 7.3192138671875, 7.598388671875, 7.8775634765625, 8.15673828125, 8.4359130859375, 8.715087890625, 8.9942626953125, 9.2734375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 3.0, 9.0, 10.0, 14.0, 14.0, 19.0, 26.0, 24.0, 53.0, 95.0, 160.0, 288.0, 514.0, 1189.0, 2758.0, 9842.0, 69991.0, 1732742.0, 2271839.0, 88278.0, 11000.0, 2983.0, 1192.0, 522.0, 297.0, 151.0, 87.0, 57.0, 37.0, 28.0, 11.0, 15.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.872314453125, -11.41650390625, -10.960693359375, -10.5048828125, -10.049072265625, -9.59326171875, -9.137451171875, -8.681640625, -8.225830078125, -7.77001953125, -7.314208984375, -6.8583984375, -6.402587890625, -5.94677734375, -5.490966796875, -5.03515625, -4.579345703125, -4.12353515625, -3.667724609375, -3.2119140625, -2.756103515625, -2.30029296875, -1.844482421875, -1.388671875, -0.932861328125, -0.47705078125, -0.021240234375, 0.4345703125, 0.890380859375, 1.34619140625, 1.802001953125, 2.2578125, 2.713623046875, 3.16943359375, 3.625244140625, 4.0810546875, 4.536865234375, 4.99267578125, 5.448486328125, 5.904296875, 6.360107421875, 6.81591796875, 7.271728515625, 7.7275390625, 8.183349609375, 8.63916015625, 9.094970703125, 9.55078125, 10.006591796875, 10.46240234375, 10.918212890625, 11.3740234375, 11.829833984375, 12.28564453125, 12.741455078125, 13.197265625, 13.653076171875, 14.10888671875, 14.564697265625, 15.0205078125, 15.476318359375, 15.93212890625, 16.387939453125, 16.84375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 19.0, 20.0, 23.0, 48.0, 75.0, 115.0, 168.0, 280.0, 503.0, 620.0, 674.0, 507.0, 378.0, 218.0, 159.0, 93.0, 38.0, 42.0, 22.0, 14.0, 11.0, 5.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.34503173828125, -4.2056884765625, -4.06634521484375, -3.927001953125, -3.78765869140625, -3.6483154296875, -3.50897216796875, -3.36962890625, -3.23028564453125, -3.0909423828125, -2.95159912109375, -2.812255859375, -2.67291259765625, -2.5335693359375, -2.39422607421875, -2.2548828125, -2.11553955078125, -1.9761962890625, -1.83685302734375, -1.697509765625, -1.55816650390625, -1.4188232421875, -1.27947998046875, -1.14013671875, -1.00079345703125, -0.8614501953125, -0.72210693359375, -0.582763671875, -0.44342041015625, -0.3040771484375, -0.16473388671875, -0.025390625, 0.11395263671875, 0.2532958984375, 0.39263916015625, 0.531982421875, 0.67132568359375, 0.8106689453125, 0.95001220703125, 1.08935546875, 1.22869873046875, 1.3680419921875, 1.50738525390625, 1.646728515625, 1.78607177734375, 1.9254150390625, 2.06475830078125, 2.2041015625, 2.34344482421875, 2.4827880859375, 2.62213134765625, 2.761474609375, 2.90081787109375, 3.0401611328125, 3.17950439453125, 3.31884765625, 3.45819091796875, 3.5975341796875, 3.73687744140625, 3.876220703125, 4.01556396484375, 4.1549072265625, 4.29425048828125, 4.43359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 16.0, 20.0, 39.0, 82.0, 107.0, 160.0, 153.0, 160.0, 116.0, 64.0, 42.0, 23.0, 18.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.623897552490234, -32.86772918701172, -32.11155700683594, -31.355388641357422, -30.599220275878906, -29.843050003051758, -29.086881637573242, -28.330711364746094, -27.574542999267578, -26.81837272644043, -26.062204360961914, -25.306034088134766, -24.54986572265625, -23.7936954498291, -23.037527084350586, -22.281356811523438, -21.525188446044922, -20.769018173217773, -20.012849807739258, -19.25667953491211, -18.500511169433594, -17.744340896606445, -16.98817253112793, -16.23200225830078, -15.475831985473633, -14.7196626663208, -13.963493347167969, -13.207324028015137, -12.451154708862305, -11.694985389709473, -10.93881607055664, -10.182645797729492, -9.426477432250977, -8.670308113098145, -7.9141387939453125, -7.1579694747924805, -6.401800155639648, -5.645630836486816, -4.889461040496826, -4.133291721343994, -3.377122402191162, -2.62095308303833, -1.8647836446762085, -1.108614206314087, -0.3524448871612549, 0.40372443199157715, 1.1598939895629883, 1.9160633087158203, 2.6722326278686523, 3.4284019470214844, 4.184571266174316, 4.940740585327148, 5.6969099044799805, 6.4530792236328125, 7.209249019622803, 7.965418338775635, 8.721588134765625, 9.477757453918457, 10.233926773071289, 10.990096092224121, 11.746265411376953, 12.502434730529785, 13.258604049682617, 14.014774322509766, 14.770942687988281]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 2.0, 4.0, 4.0, 3.0, 9.0, 11.0, 12.0, 19.0, 18.0, 24.0, 27.0, 24.0, 25.0, 28.0, 38.0, 41.0, 33.0, 40.0, 45.0, 49.0, 47.0, 38.0, 62.0, 51.0, 31.0, 32.0, 30.0, 29.0, 38.0, 33.0, 28.0, 25.0, 16.0, 10.0, 8.0, 13.0, 14.0, 11.0, 7.0, 7.0, 7.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.811712265014648, -8.543663024902344, -8.275614738464355, -8.00756549835205, -7.739516258239746, -7.4714674949646, -7.203418731689453, -6.935369491577148, -6.667320728302002, -6.3992719650268555, -6.131222724914551, -5.863173961639404, -5.595125198364258, -5.327075958251953, -5.059027194976807, -4.79097843170166, -4.5229291915893555, -4.254880428314209, -3.9868311882019043, -3.718782424926758, -3.4507334232330322, -3.1826844215393066, -2.91463565826416, -2.6465866565704346, -2.378537654876709, -2.1104886531829834, -1.8424397706985474, -1.5743908882141113, -1.3063418865203857, -1.0382928848266602, -0.7702440023422241, -0.5021951198577881, -0.2341461181640625, 0.03390282392501831, 0.3019517660140991, 0.5700007081031799, 0.8380496501922607, 1.1060986518859863, 1.3741475343704224, 1.6421964168548584, 1.910245418548584, 2.1782944202423096, 2.446343421936035, 2.7143921852111816, 2.9824411869049072, 3.250490188598633, 3.5185389518737793, 3.786587953567505, 4.0546369552612305, 4.322685718536377, 4.590734958648682, 4.858783721923828, 5.126832962036133, 5.394881725311279, 5.662930488586426, 5.9309797286987305, 6.199028491973877, 6.467077255249023, 6.735126495361328, 7.003175258636475, 7.271224021911621, 7.539273262023926, 7.807322025299072, 8.075370788574219, 8.343420028686523]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 10.0, 9.0, 15.0, 13.0, 24.0, 30.0, 40.0, 56.0, 91.0, 166.0, 274.0, 471.0, 941.0, 2111.0, 4880.0, 12473.0, 36252.0, 112731.0, 292434.0, 345386.0, 159210.0, 51686.0, 17472.0, 6490.0, 2692.0, 1168.0, 569.0, 311.0, 195.0, 111.0, 85.0, 52.0, 28.0, 15.0, 15.0, 11.0, 8.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.61328125, -1.557952880859375, -1.50262451171875, -1.447296142578125, -1.3919677734375, -1.336639404296875, -1.28131103515625, -1.225982666015625, -1.170654296875, -1.115325927734375, -1.05999755859375, -1.004669189453125, -0.9493408203125, -0.894012451171875, -0.83868408203125, -0.783355712890625, -0.72802734375, -0.672698974609375, -0.61737060546875, -0.562042236328125, -0.5067138671875, -0.451385498046875, -0.39605712890625, -0.340728759765625, -0.285400390625, -0.230072021484375, -0.17474365234375, -0.119415283203125, -0.0640869140625, -0.008758544921875, 0.04656982421875, 0.101898193359375, 0.1572265625, 0.212554931640625, 0.26788330078125, 0.323211669921875, 0.3785400390625, 0.433868408203125, 0.48919677734375, 0.544525146484375, 0.599853515625, 0.655181884765625, 0.71051025390625, 0.765838623046875, 0.8211669921875, 0.876495361328125, 0.93182373046875, 0.987152099609375, 1.04248046875, 1.097808837890625, 1.15313720703125, 1.208465576171875, 1.2637939453125, 1.319122314453125, 1.37445068359375, 1.429779052734375, 1.485107421875, 1.540435791015625, 1.59576416015625, 1.651092529296875, 1.7064208984375, 1.761749267578125, 1.81707763671875, 1.872406005859375, 1.927734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 6.0, 6.0, 15.0, 17.0, 18.0, 20.0, 28.0, 35.0, 35.0, 43.0, 46.0, 48.0, 51.0, 54.0, 60.0, 63.0, 56.0, 43.0, 50.0, 54.0, 41.0, 35.0, 32.0, 27.0, 19.0, 21.0, 14.0, 12.0, 12.0, 15.0, 7.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.3740234375, -7.158203125, -6.9423828125, -6.7265625, -6.5107421875, -6.294921875, -6.0791015625, -5.86328125, -5.6474609375, -5.431640625, -5.2158203125, -5.0, -4.7841796875, -4.568359375, -4.3525390625, -4.13671875, -3.9208984375, -3.705078125, -3.4892578125, -3.2734375, -3.0576171875, -2.841796875, -2.6259765625, -2.41015625, -2.1943359375, -1.978515625, -1.7626953125, -1.546875, -1.3310546875, -1.115234375, -0.8994140625, -0.68359375, -0.4677734375, -0.251953125, -0.0361328125, 0.1796875, 0.3955078125, 0.611328125, 0.8271484375, 1.04296875, 1.2587890625, 1.474609375, 1.6904296875, 1.90625, 2.1220703125, 2.337890625, 2.5537109375, 2.76953125, 2.9853515625, 3.201171875, 3.4169921875, 3.6328125, 3.8486328125, 4.064453125, 4.2802734375, 4.49609375, 4.7119140625, 4.927734375, 5.1435546875, 5.359375, 5.5751953125, 5.791015625, 6.0068359375, 6.22265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 21.0, 26.0, 30.0, 49.0, 67.0, 100.0, 217.0, 369.0, 680.0, 1339.0, 2510.0, 4976.0, 10081.0, 19954.0, 40821.0, 83329.0, 157970.0, 235091.0, 219728.0, 134549.0, 69171.0, 33728.0, 16532.0, 8277.0, 4172.0, 2166.0, 1124.0, 602.0, 339.0, 187.0, 95.0, 79.0, 39.0, 41.0, 29.0, 18.0, 9.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.0727462768554688, -1.0419769287109375, -1.0112075805664062, -0.980438232421875, -0.9496688842773438, -0.9188995361328125, -0.8881301879882812, -0.85736083984375, -0.8265914916992188, -0.7958221435546875, -0.7650527954101562, -0.734283447265625, -0.7035140991210938, -0.6727447509765625, -0.6419754028320312, -0.6112060546875, -0.5804367065429688, -0.5496673583984375, -0.5188980102539062, -0.488128662109375, -0.45735931396484375, -0.4265899658203125, -0.39582061767578125, -0.36505126953125, -0.33428192138671875, -0.3035125732421875, -0.27274322509765625, -0.241973876953125, -0.21120452880859375, -0.1804351806640625, -0.14966583251953125, -0.118896484375, -0.08812713623046875, -0.0573577880859375, -0.02658843994140625, 0.004180908203125, 0.03495025634765625, 0.0657196044921875, 0.09648895263671875, 0.12725830078125, 0.15802764892578125, 0.1887969970703125, 0.21956634521484375, 0.250335693359375, 0.28110504150390625, 0.3118743896484375, 0.34264373779296875, 0.3734130859375, 0.40418243408203125, 0.4349517822265625, 0.46572113037109375, 0.496490478515625, 0.5272598266601562, 0.5580291748046875, 0.5887985229492188, 0.61956787109375, 0.6503372192382812, 0.6811065673828125, 0.7118759155273438, 0.742645263671875, 0.7734146118164062, 0.8041839599609375, 0.8349533081054688, 0.86572265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 1.0, 5.0, 12.0, 9.0, 5.0, 15.0, 10.0, 16.0, 16.0, 18.0, 25.0, 23.0, 22.0, 36.0, 43.0, 36.0, 44.0, 47.0, 39.0, 41.0, 41.0, 43.0, 45.0, 46.0, 46.0, 44.0, 28.0, 25.0, 38.0, 30.0, 16.0, 21.0, 17.0, 19.0, 17.0, 15.0, 9.0, 11.0, 8.0, 10.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.7421875, -12.3944091796875, -12.046630859375, -11.6988525390625, -11.35107421875, -11.0032958984375, -10.655517578125, -10.3077392578125, -9.9599609375, -9.6121826171875, -9.264404296875, -8.9166259765625, -8.56884765625, -8.2210693359375, -7.873291015625, -7.5255126953125, -7.177734375, -6.8299560546875, -6.482177734375, -6.1343994140625, -5.78662109375, -5.4388427734375, -5.091064453125, -4.7432861328125, -4.3955078125, -4.0477294921875, -3.699951171875, -3.3521728515625, -3.00439453125, -2.6566162109375, -2.308837890625, -1.9610595703125, -1.61328125, -1.2655029296875, -0.917724609375, -0.5699462890625, -0.22216796875, 0.1256103515625, 0.473388671875, 0.8211669921875, 1.1689453125, 1.5167236328125, 1.864501953125, 2.2122802734375, 2.56005859375, 2.9078369140625, 3.255615234375, 3.6033935546875, 3.951171875, 4.2989501953125, 4.646728515625, 4.9945068359375, 5.34228515625, 5.6900634765625, 6.037841796875, 6.3856201171875, 6.7333984375, 7.0811767578125, 7.428955078125, 7.7767333984375, 8.12451171875, 8.4722900390625, 8.820068359375, 9.1678466796875, 9.515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 8.0, 6.0, 9.0, 20.0, 23.0, 17.0, 41.0, 42.0, 53.0, 104.0, 120.0, 184.0, 254.0, 374.0, 623.0, 1004.0, 1827.0, 3627.0, 8208.0, 21545.0, 62347.0, 173194.0, 334034.0, 268194.0, 109802.0, 37625.0, 13440.0, 5490.0, 2556.0, 1380.0, 812.0, 497.0, 336.0, 208.0, 135.0, 110.0, 81.0, 42.0, 50.0, 32.0, 28.0, 14.0, 16.0, 12.0, 7.0, 7.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.25439453125, -0.24555206298828125, -0.2367095947265625, -0.22786712646484375, -0.219024658203125, -0.21018218994140625, -0.2013397216796875, -0.19249725341796875, -0.18365478515625, -0.17481231689453125, -0.1659698486328125, -0.15712738037109375, -0.148284912109375, -0.13944244384765625, -0.1305999755859375, -0.12175750732421875, -0.1129150390625, -0.10407257080078125, -0.0952301025390625, -0.08638763427734375, -0.077545166015625, -0.06870269775390625, -0.0598602294921875, -0.05101776123046875, -0.04217529296875, -0.03333282470703125, -0.0244903564453125, -0.01564788818359375, -0.006805419921875, 0.00203704833984375, 0.0108795166015625, 0.01972198486328125, 0.028564453125, 0.03740692138671875, 0.0462493896484375, 0.05509185791015625, 0.063934326171875, 0.07277679443359375, 0.0816192626953125, 0.09046173095703125, 0.09930419921875, 0.10814666748046875, 0.1169891357421875, 0.12583160400390625, 0.134674072265625, 0.14351654052734375, 0.1523590087890625, 0.16120147705078125, 0.1700439453125, 0.17888641357421875, 0.1877288818359375, 0.19657135009765625, 0.205413818359375, 0.21425628662109375, 0.2230987548828125, 0.23194122314453125, 0.24078369140625, 0.24962615966796875, 0.2584686279296875, 0.26731109619140625, 0.276153564453125, 0.28499603271484375, 0.2938385009765625, 0.30268096923828125, 0.3115234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 5.0, 9.0, 16.0, 16.0, 33.0, 39.0, 64.0, 110.0, 107.0, 120.0, 122.0, 109.0, 84.0, 46.0, 40.0, 35.0, 17.0, 13.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016641616821289062, -0.00015875324606895447, -0.0001510903239250183, -0.00014342740178108215, -0.000135764479637146, -0.00012810155749320984, -0.00012043863534927368, -0.00011277571320533752, -0.00010511279106140137, -9.744986891746521e-05, -8.978694677352905e-05, -8.21240246295929e-05, -7.446110248565674e-05, -6.679818034172058e-05, -5.9135258197784424e-05, -5.1472336053848267e-05, -4.380941390991211e-05, -3.614649176597595e-05, -2.8483569622039795e-05, -2.0820647478103638e-05, -1.315772533416748e-05, -5.494803190231323e-06, 2.168118953704834e-06, 9.831041097640991e-06, 1.749396324157715e-05, 2.5156885385513306e-05, 3.281980752944946e-05, 4.048272967338562e-05, 4.814565181732178e-05, 5.5808573961257935e-05, 6.347149610519409e-05, 7.113441824913025e-05, 7.87973403930664e-05, 8.646026253700256e-05, 9.412318468093872e-05, 0.00010178610682487488, 0.00010944902896881104, 0.00011711195111274719, 0.00012477487325668335, 0.0001324377954006195, 0.00014010071754455566, 0.00014776363968849182, 0.00015542656183242798, 0.00016308948397636414, 0.0001707524061203003, 0.00017841532826423645, 0.0001860782504081726, 0.00019374117255210876, 0.00020140409469604492, 0.00020906701683998108, 0.00021672993898391724, 0.0002243928611278534, 0.00023205578327178955, 0.0002397187054157257, 0.00024738162755966187, 0.000255044549703598, 0.0002627074718475342, 0.00027037039399147034, 0.0002780333161354065, 0.00028569623827934265, 0.0002933591604232788, 0.00030102208256721497, 0.0003086850047111511, 0.0003163479268550873, 0.00032401084899902344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 2.0, 3.0, 8.0, 6.0, 20.0, 17.0, 39.0, 62.0, 94.0, 156.0, 298.0, 690.0, 1604.0, 4836.0, 18775.0, 82878.0, 313865.0, 426968.0, 151446.0, 34177.0, 8332.0, 2465.0, 878.0, 392.0, 207.0, 114.0, 79.0, 45.0, 33.0, 27.0, 10.0, 8.0, 8.0, 4.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3779144287109375, -0.366180419921875, -0.3544464111328125, -0.34271240234375, -0.3309783935546875, -0.319244384765625, -0.3075103759765625, -0.2957763671875, -0.2840423583984375, -0.272308349609375, -0.2605743408203125, -0.24884033203125, -0.2371063232421875, -0.225372314453125, -0.2136383056640625, -0.201904296875, -0.1901702880859375, -0.178436279296875, -0.1667022705078125, -0.15496826171875, -0.1432342529296875, -0.131500244140625, -0.1197662353515625, -0.1080322265625, -0.0962982177734375, -0.084564208984375, -0.0728302001953125, -0.06109619140625, -0.0493621826171875, -0.037628173828125, -0.0258941650390625, -0.01416015625, -0.0024261474609375, 0.009307861328125, 0.0210418701171875, 0.03277587890625, 0.0445098876953125, 0.056243896484375, 0.0679779052734375, 0.0797119140625, 0.0914459228515625, 0.103179931640625, 0.1149139404296875, 0.12664794921875, 0.1383819580078125, 0.150115966796875, 0.1618499755859375, 0.173583984375, 0.1853179931640625, 0.197052001953125, 0.2087860107421875, 0.22052001953125, 0.2322540283203125, 0.243988037109375, 0.2557220458984375, 0.2674560546875, 0.2791900634765625, 0.290924072265625, 0.3026580810546875, 0.31439208984375, 0.3261260986328125, 0.337860107421875, 0.3495941162109375, 0.361328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 10.0, 9.0, 13.0, 16.0, 30.0, 25.0, 36.0, 46.0, 47.0, 61.0, 73.0, 82.0, 68.0, 68.0, 75.0, 57.0, 42.0, 45.0, 42.0, 45.0, 21.0, 14.0, 21.0, 14.0, 8.0, 5.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09246826171875, -0.08897113800048828, -0.08547401428222656, -0.08197689056396484, -0.07847976684570312, -0.0749826431274414, -0.07148551940917969, -0.06798839569091797, -0.06449127197265625, -0.06099414825439453, -0.05749702453613281, -0.053999900817871094, -0.050502777099609375, -0.047005653381347656, -0.04350852966308594, -0.04001140594482422, -0.0365142822265625, -0.03301715850830078, -0.029520034790039062, -0.026022911071777344, -0.022525787353515625, -0.019028663635253906, -0.015531539916992188, -0.012034416198730469, -0.00853729248046875, -0.005040168762207031, -0.0015430450439453125, 0.0019540786743164062, 0.005451202392578125, 0.008948326110839844, 0.012445449829101562, 0.01594257354736328, 0.019439697265625, 0.02293682098388672, 0.026433944702148438, 0.029931068420410156, 0.033428192138671875, 0.036925315856933594, 0.04042243957519531, 0.04391956329345703, 0.04741668701171875, 0.05091381072998047, 0.05441093444824219, 0.057908058166503906, 0.061405181884765625, 0.06490230560302734, 0.06839942932128906, 0.07189655303955078, 0.0753936767578125, 0.07889080047607422, 0.08238792419433594, 0.08588504791259766, 0.08938217163085938, 0.0928792953491211, 0.09637641906738281, 0.09987354278564453, 0.10337066650390625, 0.10686779022216797, 0.11036491394042969, 0.1138620376586914, 0.11735916137695312, 0.12085628509521484, 0.12435340881347656, 0.12785053253173828, 0.13134765625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 19.0, 90.0, 220.0, 304.0, 233.0, 104.0, 24.0, 8.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-44.817466735839844, -43.9799919128418, -43.14251708984375, -42.30504608154297, -41.46757125854492, -40.630096435546875, -39.79262161254883, -38.95514678955078, -38.11767578125, -37.28020095825195, -36.442726135253906, -35.605255126953125, -34.76778030395508, -33.93030548095703, -33.092830657958984, -32.25535583496094, -31.41788101196289, -30.580406188964844, -29.74293327331543, -28.905458450317383, -28.06798553466797, -27.230510711669922, -26.393035888671875, -25.555561065673828, -24.718088150024414, -23.880613327026367, -23.043140411376953, -22.205665588378906, -21.36819076538086, -20.530717849731445, -19.6932430267334, -18.855770111083984, -18.018295288085938, -17.18082046508789, -16.343347549438477, -15.50587272644043, -14.6683988571167, -13.830924987792969, -12.993450164794922, -12.155976295471191, -11.318501472473145, -10.481027603149414, -9.643552780151367, -8.806078910827637, -7.968605041503906, -7.131131172180176, -6.293656826019287, -5.456182479858398, -4.618708610534668, -3.7812345027923584, -2.943760395050049, -2.1062862873077393, -1.2688121795654297, -0.4313383102416992, 0.40613603591918945, 1.2436103820800781, 2.0810842514038086, 2.918558359146118, 3.7560324668884277, 4.593506813049316, 5.430980682373047, 6.268454551696777, 7.105928897857666, 7.943403244018555, 8.780877113342285]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 6.0, 9.0, 16.0, 20.0, 22.0, 28.0, 34.0, 26.0, 41.0, 48.0, 57.0, 45.0, 58.0, 67.0, 57.0, 68.0, 57.0, 42.0, 38.0, 45.0, 44.0, 31.0, 34.0, 14.0, 16.0, 17.0, 17.0, 8.0, 7.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6605963706970215, -7.443086624145508, -7.225576877593994, -7.0080671310424805, -6.790557861328125, -6.573048114776611, -6.355538368225098, -6.138028621673584, -5.92051887512207, -5.703009128570557, -5.485499382019043, -5.2679901123046875, -5.050480365753174, -4.83297061920166, -4.6154608726501465, -4.397951126098633, -4.180441856384277, -3.9629321098327637, -3.745422601699829, -3.5279128551483154, -3.310403347015381, -3.092893600463867, -2.8753838539123535, -2.65787410736084, -2.4403645992279053, -2.2228548526763916, -2.005345344543457, -1.7878355979919434, -1.5703259706497192, -1.3528163433074951, -1.1353065967559814, -0.9177969694137573, -0.7002873420715332, -0.4827776849269867, -0.2652680277824402, -0.04775834083557129, 0.16975128650665283, 0.38726091384887695, 0.6047706604003906, 0.8222802877426147, 1.0397899150848389, 1.257299542427063, 1.474809169769287, 1.6923189163208008, 1.909828543663025, 2.127338171005249, 2.3448479175567627, 2.5623574256896973, 2.779867172241211, 2.9973769187927246, 3.214886426925659, 3.432396173477173, 3.6499056816101074, 3.867415428161621, 4.084925174713135, 4.302434921264648, 4.519944190979004, 4.737453937530518, 4.954963684082031, 5.172472953796387, 5.3899827003479, 5.607492446899414, 5.825002193450928, 6.042511940002441, 6.260021686553955]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 9.0, 16.0, 19.0, 48.0, 64.0, 87.0, 167.0, 344.0, 678.0, 1806.0, 5555.0, 20849.0, 93777.0, 713880.0, 166315.0, 32433.0, 8295.0, 2417.0, 892.0, 374.0, 215.0, 115.0, 69.0, 46.0, 28.0, 25.0, 10.0, 9.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.2713623046875, -8.995849609375, -8.7203369140625, -8.44482421875, -8.1693115234375, -7.893798828125, -7.6182861328125, -7.3427734375, -7.0672607421875, -6.791748046875, -6.5162353515625, -6.24072265625, -5.9652099609375, -5.689697265625, -5.4141845703125, -5.138671875, -4.8631591796875, -4.587646484375, -4.3121337890625, -4.03662109375, -3.7611083984375, -3.485595703125, -3.2100830078125, -2.9345703125, -2.6590576171875, -2.383544921875, -2.1080322265625, -1.83251953125, -1.5570068359375, -1.281494140625, -1.0059814453125, -0.73046875, -0.4549560546875, -0.179443359375, 0.0960693359375, 0.37158203125, 0.6470947265625, 0.922607421875, 1.1981201171875, 1.4736328125, 1.7491455078125, 2.024658203125, 2.3001708984375, 2.57568359375, 2.8511962890625, 3.126708984375, 3.4022216796875, 3.677734375, 3.9532470703125, 4.228759765625, 4.5042724609375, 4.77978515625, 5.0552978515625, 5.330810546875, 5.6063232421875, 5.8818359375, 6.1573486328125, 6.432861328125, 6.7083740234375, 6.98388671875, 7.2593994140625, 7.534912109375, 7.8104248046875, 8.0859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 5.0, 6.0, 10.0, 13.0, 17.0, 23.0, 19.0, 26.0, 21.0, 32.0, 25.0, 32.0, 41.0, 45.0, 63.0, 43.0, 51.0, 48.0, 52.0, 48.0, 45.0, 37.0, 44.0, 36.0, 29.0, 26.0, 24.0, 22.0, 27.0, 14.0, 9.0, 14.0, 12.0, 8.0, 11.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.71875, -11.3682861328125, -11.017822265625, -10.6673583984375, -10.31689453125, -9.9664306640625, -9.615966796875, -9.2655029296875, -8.9150390625, -8.5645751953125, -8.214111328125, -7.8636474609375, -7.51318359375, -7.1627197265625, -6.812255859375, -6.4617919921875, -6.111328125, -5.7608642578125, -5.410400390625, -5.0599365234375, -4.70947265625, -4.3590087890625, -4.008544921875, -3.6580810546875, -3.3076171875, -2.9571533203125, -2.606689453125, -2.2562255859375, -1.90576171875, -1.5552978515625, -1.204833984375, -0.8543701171875, -0.50390625, -0.1534423828125, 0.197021484375, 0.5474853515625, 0.89794921875, 1.2484130859375, 1.598876953125, 1.9493408203125, 2.2998046875, 2.6502685546875, 3.000732421875, 3.3511962890625, 3.70166015625, 4.0521240234375, 4.402587890625, 4.7530517578125, 5.103515625, 5.4539794921875, 5.804443359375, 6.1549072265625, 6.50537109375, 6.8558349609375, 7.206298828125, 7.5567626953125, 7.9072265625, 8.2576904296875, 8.608154296875, 8.9586181640625, 9.30908203125, 9.6595458984375, 10.010009765625, 10.3604736328125, 10.7109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 7.0, 9.0, 5.0, 9.0, 19.0, 23.0, 29.0, 45.0, 60.0, 84.0, 122.0, 157.0, 257.0, 378.0, 781.0, 3055.0, 39193.0, 908872.0, 87824.0, 5271.0, 1013.0, 454.0, 278.0, 178.0, 110.0, 78.0, 72.0, 36.0, 34.0, 19.0, 15.0, 11.0, 7.0, 9.0, 11.0, 6.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.703125, -14.1708984375, -13.638671875, -13.1064453125, -12.57421875, -12.0419921875, -11.509765625, -10.9775390625, -10.4453125, -9.9130859375, -9.380859375, -8.8486328125, -8.31640625, -7.7841796875, -7.251953125, -6.7197265625, -6.1875, -5.6552734375, -5.123046875, -4.5908203125, -4.05859375, -3.5263671875, -2.994140625, -2.4619140625, -1.9296875, -1.3974609375, -0.865234375, -0.3330078125, 0.19921875, 0.7314453125, 1.263671875, 1.7958984375, 2.328125, 2.8603515625, 3.392578125, 3.9248046875, 4.45703125, 4.9892578125, 5.521484375, 6.0537109375, 6.5859375, 7.1181640625, 7.650390625, 8.1826171875, 8.71484375, 9.2470703125, 9.779296875, 10.3115234375, 10.84375, 11.3759765625, 11.908203125, 12.4404296875, 12.97265625, 13.5048828125, 14.037109375, 14.5693359375, 15.1015625, 15.6337890625, 16.166015625, 16.6982421875, 17.23046875, 17.7626953125, 18.294921875, 18.8271484375, 19.359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 4.0, 4.0, 5.0, 10.0, 11.0, 16.0, 22.0, 25.0, 20.0, 40.0, 31.0, 36.0, 42.0, 40.0, 49.0, 47.0, 62.0, 67.0, 57.0, 36.0, 49.0, 47.0, 35.0, 39.0, 27.0, 19.0, 27.0, 29.0, 18.0, 19.0, 10.0, 11.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 5.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.9453125, -14.485107421875, -14.02490234375, -13.564697265625, -13.1044921875, -12.644287109375, -12.18408203125, -11.723876953125, -11.263671875, -10.803466796875, -10.34326171875, -9.883056640625, -9.4228515625, -8.962646484375, -8.50244140625, -8.042236328125, -7.58203125, -7.121826171875, -6.66162109375, -6.201416015625, -5.7412109375, -5.281005859375, -4.82080078125, -4.360595703125, -3.900390625, -3.440185546875, -2.97998046875, -2.519775390625, -2.0595703125, -1.599365234375, -1.13916015625, -0.678955078125, -0.21875, 0.241455078125, 0.70166015625, 1.161865234375, 1.6220703125, 2.082275390625, 2.54248046875, 3.002685546875, 3.462890625, 3.923095703125, 4.38330078125, 4.843505859375, 5.3037109375, 5.763916015625, 6.22412109375, 6.684326171875, 7.14453125, 7.604736328125, 8.06494140625, 8.525146484375, 8.9853515625, 9.445556640625, 9.90576171875, 10.365966796875, 10.826171875, 11.286376953125, 11.74658203125, 12.206787109375, 12.6669921875, 13.127197265625, 13.58740234375, 14.047607421875, 14.5078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 10.0, 5.0, 7.0, 15.0, 12.0, 27.0, 51.0, 81.0, 134.0, 257.0, 506.0, 1086.0, 2873.0, 10203.0, 172440.0, 829471.0, 23959.0, 4326.0, 1565.0, 670.0, 371.0, 205.0, 101.0, 63.0, 39.0, 18.0, 16.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.9609375, -7.75250244140625, -7.5440673828125, -7.33563232421875, -7.127197265625, -6.91876220703125, -6.7103271484375, -6.50189208984375, -6.29345703125, -6.08502197265625, -5.8765869140625, -5.66815185546875, -5.459716796875, -5.25128173828125, -5.0428466796875, -4.83441162109375, -4.6259765625, -4.41754150390625, -4.2091064453125, -4.00067138671875, -3.792236328125, -3.58380126953125, -3.3753662109375, -3.16693115234375, -2.95849609375, -2.75006103515625, -2.5416259765625, -2.33319091796875, -2.124755859375, -1.91632080078125, -1.7078857421875, -1.49945068359375, -1.291015625, -1.08258056640625, -0.8741455078125, -0.66571044921875, -0.457275390625, -0.24884033203125, -0.0404052734375, 0.16802978515625, 0.37646484375, 0.58489990234375, 0.7933349609375, 1.00177001953125, 1.210205078125, 1.41864013671875, 1.6270751953125, 1.83551025390625, 2.0439453125, 2.25238037109375, 2.4608154296875, 2.66925048828125, 2.877685546875, 3.08612060546875, 3.2945556640625, 3.50299072265625, 3.71142578125, 3.91986083984375, 4.1282958984375, 4.33673095703125, 4.545166015625, 4.75360107421875, 4.9620361328125, 5.17047119140625, 5.37890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 1.0, 7.0, 11.0, 12.0, 21.0, 35.0, 52.0, 79.0, 171.0, 308.0, 137.0, 59.0, 32.0, 23.0, 22.0, 6.0, 8.0, 4.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009708404541015625, -0.0009425431489944458, -0.0009142458438873291, -0.0008859485387802124, -0.0008576512336730957, -0.000829353928565979, -0.0008010566234588623, -0.0007727593183517456, -0.0007444620132446289, -0.0007161647081375122, -0.0006878674030303955, -0.0006595700979232788, -0.0006312727928161621, -0.0006029754877090454, -0.0005746781826019287, -0.000546380877494812, -0.0005180835723876953, -0.0004897862672805786, -0.0004614889621734619, -0.0004331916570663452, -0.0004048943519592285, -0.0003765970468521118, -0.0003482997417449951, -0.0003200024366378784, -0.0002917051315307617, -0.000263407826423645, -0.00023511052131652832, -0.00020681321620941162, -0.00017851591110229492, -0.00015021860599517822, -0.00012192130088806152, -9.362399578094482e-05, -6.532669067382812e-05, -3.7029385566711426e-05, -8.732080459594727e-06, 1.9565224647521973e-05, 4.786252975463867e-05, 7.615983486175537e-05, 0.00010445713996887207, 0.00013275444507598877, 0.00016105175018310547, 0.00018934905529022217, 0.00021764636039733887, 0.00024594366550445557, 0.00027424097061157227, 0.00030253827571868896, 0.00033083558082580566, 0.00035913288593292236, 0.00038743019104003906, 0.00041572749614715576, 0.00044402480125427246, 0.00047232210636138916, 0.0005006194114685059, 0.0005289167165756226, 0.0005572140216827393, 0.000585511326789856, 0.0006138086318969727, 0.0006421059370040894, 0.0006704032421112061, 0.0006987005472183228, 0.0007269978523254395, 0.0007552951574325562, 0.0007835924625396729, 0.0008118897676467896, 0.0008401870727539062]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 15.0, 18.0, 42.0, 41.0, 72.0, 146.0, 294.0, 473.0, 944.0, 1896.0, 6298.0, 106112.0, 904509.0, 21249.0, 3475.0, 1385.0, 683.0, 378.0, 200.0, 105.0, 65.0, 37.0, 28.0, 15.0, 16.0, 13.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.9296875, -8.653076171875, -8.37646484375, -8.099853515625, -7.8232421875, -7.546630859375, -7.27001953125, -6.993408203125, -6.716796875, -6.440185546875, -6.16357421875, -5.886962890625, -5.6103515625, -5.333740234375, -5.05712890625, -4.780517578125, -4.50390625, -4.227294921875, -3.95068359375, -3.674072265625, -3.3974609375, -3.120849609375, -2.84423828125, -2.567626953125, -2.291015625, -2.014404296875, -1.73779296875, -1.461181640625, -1.1845703125, -0.907958984375, -0.63134765625, -0.354736328125, -0.078125, 0.198486328125, 0.47509765625, 0.751708984375, 1.0283203125, 1.304931640625, 1.58154296875, 1.858154296875, 2.134765625, 2.411376953125, 2.68798828125, 2.964599609375, 3.2412109375, 3.517822265625, 3.79443359375, 4.071044921875, 4.34765625, 4.624267578125, 4.90087890625, 5.177490234375, 5.4541015625, 5.730712890625, 6.00732421875, 6.283935546875, 6.560546875, 6.837158203125, 7.11376953125, 7.390380859375, 7.6669921875, 7.943603515625, 8.22021484375, 8.496826171875, 8.7734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 10.0, 15.0, 28.0, 44.0, 50.0, 123.0, 412.0, 133.0, 67.0, 44.0, 23.0, 20.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.916015625, -2.81396484375, -2.7119140625, -2.60986328125, -2.5078125, -2.40576171875, -2.3037109375, -2.20166015625, -2.099609375, -1.99755859375, -1.8955078125, -1.79345703125, -1.69140625, -1.58935546875, -1.4873046875, -1.38525390625, -1.283203125, -1.18115234375, -1.0791015625, -0.97705078125, -0.875, -0.77294921875, -0.6708984375, -0.56884765625, -0.466796875, -0.36474609375, -0.2626953125, -0.16064453125, -0.05859375, 0.04345703125, 0.1455078125, 0.24755859375, 0.349609375, 0.45166015625, 0.5537109375, 0.65576171875, 0.7578125, 0.85986328125, 0.9619140625, 1.06396484375, 1.166015625, 1.26806640625, 1.3701171875, 1.47216796875, 1.57421875, 1.67626953125, 1.7783203125, 1.88037109375, 1.982421875, 2.08447265625, 2.1865234375, 2.28857421875, 2.390625, 2.49267578125, 2.5947265625, 2.69677734375, 2.798828125, 2.90087890625, 3.0029296875, 3.10498046875, 3.20703125, 3.30908203125, 3.4111328125, 3.51318359375, 3.615234375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 7.0, 78.0, 410.0, 423.0, 81.0, 9.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.859556198120117, -12.686710357666016, -9.513864517211914, -6.3410186767578125, -3.168172836303711, 0.004673004150390625, 3.177518844604492, 6.350364685058594, 9.523210525512695, 12.696056365966797, 15.868902206420898, 19.041748046875, 22.2145938873291, 25.387439727783203, 28.560285568237305, 31.733131408691406, 34.905975341796875, 38.078819274902344, 41.25166702270508, 44.42451477050781, 47.59735870361328, 50.77020263671875, 53.943050384521484, 57.11589813232422, 60.28874206542969, 63.461585998535156, 66.63442993164062, 69.80728149414062, 72.9801254272461, 76.15296936035156, 79.32582092285156, 82.49866485595703, 85.6715087890625, 88.84435272216797, 92.01719665527344, 95.19004821777344, 98.3628921508789, 101.53573608398438, 104.70858764648438, 107.88143157958984, 111.05427551269531, 114.22711944580078, 117.39996337890625, 120.57281494140625, 123.74565887451172, 126.91850280761719, 130.0913543701172, 133.26419067382812, 136.43704223632812, 139.60989379882812, 142.78273010253906, 145.95558166503906, 149.12841796875, 152.30126953125, 155.47412109375, 158.64695739746094, 161.81980895996094, 164.99266052246094, 168.16549682617188, 171.33834838867188, 174.51119995117188, 177.6840362548828, 180.8568878173828, 184.02972412109375, 187.20257568359375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 2.0, 2.0, 6.0, 14.0, 8.0, 11.0, 10.0, 12.0, 20.0, 15.0, 14.0, 22.0, 30.0, 32.0, 26.0, 44.0, 47.0, 43.0, 36.0, 51.0, 37.0, 22.0, 31.0, 55.0, 43.0, 42.0, 36.0, 27.0, 38.0, 29.0, 22.0, 16.0, 22.0, 21.0, 15.0, 17.0, 18.0, 10.0, 10.0, 8.0, 7.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-19.483474731445312, -18.8795108795166, -18.27554702758789, -17.67158317565918, -17.06761932373047, -16.463653564453125, -15.859689712524414, -15.255725860595703, -14.651762008666992, -14.047798156738281, -13.44383430480957, -12.839869499206543, -12.235905647277832, -11.631941795349121, -11.027976989746094, -10.424013137817383, -9.820049285888672, -9.216085433959961, -8.61212158203125, -8.008156776428223, -7.404192924499512, -6.800229072570801, -6.196264743804932, -5.5923004150390625, -4.988336563110352, -4.384372711181641, -3.7804083824157715, -3.1764442920684814, -2.5724802017211914, -1.9685161113739014, -1.3645520210266113, -0.7605876922607422, -0.15662574768066406, 0.447338342666626, 1.051302433013916, 1.655266523361206, 2.259230613708496, 2.863194704055786, 3.467158794403076, 4.071123123168945, 4.675086975097656, 5.279050827026367, 5.883015155792236, 6.4869794845581055, 7.090943336486816, 7.694907188415527, 8.298871994018555, 8.902835845947266, 9.506799697875977, 10.110763549804688, 10.714727401733398, 11.318692207336426, 11.922656059265137, 12.526619911193848, 13.130584716796875, 13.734548568725586, 14.338512420654297, 14.942476272583008, 15.546440124511719, 16.15040397644043, 16.75436782836914, 17.358333587646484, 17.962297439575195, 18.566261291503906, 19.170225143432617]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 9.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 12.0, 15.0, 11.0, 15.0, 10.0, 24.0, 20.0, 29.0, 41.0, 47.0, 56.0, 69.0, 136.0, 261.0, 879.0, 6036.0, 198538.0, 3822733.0, 157898.0, 5640.0, 896.0, 304.0, 167.0, 96.0, 46.0, 45.0, 24.0, 33.0, 26.0, 23.0, 22.0, 14.0, 10.0, 20.0, 12.0, 10.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 2.0, 3.0, 4.0], "bins": [-27.140625, -26.304931640625, -25.46923828125, -24.633544921875, -23.7978515625, -22.962158203125, -22.12646484375, -21.290771484375, -20.455078125, -19.619384765625, -18.78369140625, -17.947998046875, -17.1123046875, -16.276611328125, -15.44091796875, -14.605224609375, -13.76953125, -12.933837890625, -12.09814453125, -11.262451171875, -10.4267578125, -9.591064453125, -8.75537109375, -7.919677734375, -7.083984375, -6.248291015625, -5.41259765625, -4.576904296875, -3.7412109375, -2.905517578125, -2.06982421875, -1.234130859375, -0.3984375, 0.437255859375, 1.27294921875, 2.108642578125, 2.9443359375, 3.780029296875, 4.61572265625, 5.451416015625, 6.287109375, 7.122802734375, 7.95849609375, 8.794189453125, 9.6298828125, 10.465576171875, 11.30126953125, 12.136962890625, 12.97265625, 13.808349609375, 14.64404296875, 15.479736328125, 16.3154296875, 17.151123046875, 17.98681640625, 18.822509765625, 19.658203125, 20.493896484375, 21.32958984375, 22.165283203125, 23.0009765625, 23.836669921875, 24.67236328125, 25.508056640625, 26.34375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 8.0, 11.0, 16.0, 11.0, 20.0, 15.0, 24.0, 39.0, 32.0, 33.0, 50.0, 50.0, 54.0, 51.0, 51.0, 36.0, 59.0, 41.0, 61.0, 39.0, 45.0, 39.0, 28.0, 29.0, 34.0, 24.0, 11.0, 15.0, 15.0, 10.0, 9.0, 9.0, 4.0, 2.0, 3.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.9375, -7.70068359375, -7.4638671875, -7.22705078125, -6.990234375, -6.75341796875, -6.5166015625, -6.27978515625, -6.04296875, -5.80615234375, -5.5693359375, -5.33251953125, -5.095703125, -4.85888671875, -4.6220703125, -4.38525390625, -4.1484375, -3.91162109375, -3.6748046875, -3.43798828125, -3.201171875, -2.96435546875, -2.7275390625, -2.49072265625, -2.25390625, -2.01708984375, -1.7802734375, -1.54345703125, -1.306640625, -1.06982421875, -0.8330078125, -0.59619140625, -0.359375, -0.12255859375, 0.1142578125, 0.35107421875, 0.587890625, 0.82470703125, 1.0615234375, 1.29833984375, 1.53515625, 1.77197265625, 2.0087890625, 2.24560546875, 2.482421875, 2.71923828125, 2.9560546875, 3.19287109375, 3.4296875, 3.66650390625, 3.9033203125, 4.14013671875, 4.376953125, 4.61376953125, 4.8505859375, 5.08740234375, 5.32421875, 5.56103515625, 5.7978515625, 6.03466796875, 6.271484375, 6.50830078125, 6.7451171875, 6.98193359375, 7.21875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 15.0, 17.0, 27.0, 48.0, 104.0, 219.0, 672.0, 2522.0, 21270.0, 2427398.0, 1721950.0, 16907.0, 2130.0, 577.0, 224.0, 100.0, 48.0, 20.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.921875, -22.102294921875, -21.28271484375, -20.463134765625, -19.6435546875, -18.823974609375, -18.00439453125, -17.184814453125, -16.365234375, -15.545654296875, -14.72607421875, -13.906494140625, -13.0869140625, -12.267333984375, -11.44775390625, -10.628173828125, -9.80859375, -8.989013671875, -8.16943359375, -7.349853515625, -6.5302734375, -5.710693359375, -4.89111328125, -4.071533203125, -3.251953125, -2.432373046875, -1.61279296875, -0.793212890625, 0.0263671875, 0.845947265625, 1.66552734375, 2.485107421875, 3.3046875, 4.124267578125, 4.94384765625, 5.763427734375, 6.5830078125, 7.402587890625, 8.22216796875, 9.041748046875, 9.861328125, 10.680908203125, 11.50048828125, 12.320068359375, 13.1396484375, 13.959228515625, 14.77880859375, 15.598388671875, 16.41796875, 17.237548828125, 18.05712890625, 18.876708984375, 19.6962890625, 20.515869140625, 21.33544921875, 22.155029296875, 22.974609375, 23.794189453125, 24.61376953125, 25.433349609375, 26.2529296875, 27.072509765625, 27.89208984375, 28.711669921875, 29.53125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 13.0, 18.0, 27.0, 47.0, 73.0, 110.0, 187.0, 290.0, 442.0, 559.0, 629.0, 566.0, 369.0, 235.0, 155.0, 119.0, 68.0, 41.0, 27.0, 23.0, 13.0, 10.0, 4.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.19140625, -4.065765380859375, -3.94012451171875, -3.814483642578125, -3.6888427734375, -3.563201904296875, -3.43756103515625, -3.311920166015625, -3.186279296875, -3.060638427734375, -2.93499755859375, -2.809356689453125, -2.6837158203125, -2.558074951171875, -2.43243408203125, -2.306793212890625, -2.18115234375, -2.055511474609375, -1.92987060546875, -1.804229736328125, -1.6785888671875, -1.552947998046875, -1.42730712890625, -1.301666259765625, -1.176025390625, -1.050384521484375, -0.92474365234375, -0.799102783203125, -0.6734619140625, -0.547821044921875, -0.42218017578125, -0.296539306640625, -0.1708984375, -0.045257568359375, 0.08038330078125, 0.206024169921875, 0.3316650390625, 0.457305908203125, 0.58294677734375, 0.708587646484375, 0.834228515625, 0.959869384765625, 1.08551025390625, 1.211151123046875, 1.3367919921875, 1.462432861328125, 1.58807373046875, 1.713714599609375, 1.83935546875, 1.964996337890625, 2.09063720703125, 2.216278076171875, 2.3419189453125, 2.467559814453125, 2.59320068359375, 2.718841552734375, 2.844482421875, 2.970123291015625, 3.09576416015625, 3.221405029296875, 3.3470458984375, 3.472686767578125, 3.59832763671875, 3.723968505859375, 3.849609375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 6.0, 8.0, 21.0, 24.0, 39.0, 46.0, 86.0, 78.0, 91.0, 108.0, 117.0, 106.0, 63.0, 65.0, 39.0, 30.0, 24.0, 19.0, 16.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.75612449645996, -16.28530502319336, -15.814485549926758, -15.343666076660156, -14.872845649719238, -14.402026176452637, -13.931206703186035, -13.460387229919434, -12.989566802978516, -12.518747329711914, -12.047927856445312, -11.577108383178711, -11.106287956237793, -10.635468482971191, -10.16464900970459, -9.693829536437988, -9.223010063171387, -8.752190589904785, -8.281371116638184, -7.810551166534424, -7.339731216430664, -6.8689117431640625, -6.398092269897461, -5.927272796630859, -5.4564528465271, -4.985633373260498, -4.514813423156738, -4.043993949890137, -3.573174238204956, -3.1023545265197754, -2.631535053253174, -2.160715341567993, -1.6898956298828125, -1.2190759181976318, -0.7482563257217407, -0.2774367332458496, 0.19338297843933105, 0.6642026901245117, 1.1350221633911133, 1.605841875076294, 2.0766615867614746, 2.5474812984466553, 3.018301010131836, 3.4891204833984375, 3.959940195083618, 4.430759906768799, 4.9015793800354, 5.37239933013916, 5.843218803405762, 6.314038276672363, 6.784858226776123, 7.255677700042725, 7.726497650146484, 8.197317123413086, 8.668136596679688, 9.138956069946289, 9.60977554321289, 10.080595016479492, 10.551414489746094, 11.022233963012695, 11.493054389953613, 11.963873863220215, 12.434693336486816, 12.905512809753418, 13.376333236694336]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 4.0, 6.0, 11.0, 9.0, 8.0, 6.0, 8.0, 9.0, 12.0, 17.0, 32.0, 19.0, 26.0, 24.0, 22.0, 40.0, 39.0, 36.0, 28.0, 48.0, 41.0, 40.0, 42.0, 35.0, 34.0, 30.0, 39.0, 42.0, 32.0, 32.0, 27.0, 26.0, 27.0, 13.0, 14.0, 22.0, 14.0, 21.0, 9.0, 13.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.36999225616455, -8.142390251159668, -7.914788722991943, -7.6871867179870605, -7.459585189819336, -7.231983184814453, -7.00438117980957, -6.7767791748046875, -6.549177646636963, -6.32157564163208, -6.0939741134643555, -5.866372108459473, -5.63877010345459, -5.411168575286865, -5.183566570281982, -4.955965042114258, -4.728363037109375, -4.500761032104492, -4.273159503936768, -4.045557498931885, -3.817955732345581, -3.5903539657592773, -3.3627519607543945, -3.135150194168091, -2.907548427581787, -2.6799466609954834, -2.4523448944091797, -2.224742889404297, -1.9971411228179932, -1.7695393562316895, -1.5419374704360962, -1.314335584640503, -1.0867342948913574, -0.8591324687004089, -0.6315306425094604, -0.40392881631851196, -0.17632699012756348, 0.051274776458740234, 0.2788766622543335, 0.5064785480499268, 0.7340803146362305, 0.961682140827179, 1.1892839670181274, 1.4168858528137207, 1.6444876194000244, 1.8720893859863281, 2.099691390991211, 2.3272931575775146, 2.5548949241638184, 2.782496690750122, 3.010098457336426, 3.2377004623413086, 3.4653022289276123, 3.692903995513916, 3.920506000518799, 4.148107528686523, 4.375709533691406, 4.603311538696289, 4.830913066864014, 5.0585150718688965, 5.286116600036621, 5.513718605041504, 5.741320610046387, 5.9689226150512695, 6.196524143218994]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 16.0, 40.0, 64.0, 93.0, 219.0, 408.0, 1105.0, 4932.0, 45332.0, 508955.0, 444458.0, 36832.0, 4246.0, 1059.0, 391.0, 179.0, 90.0, 56.0, 35.0, 15.0, 8.0, 8.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9429931640625, -4.788330078125, -4.6336669921875, -4.47900390625, -4.3243408203125, -4.169677734375, -4.0150146484375, -3.8603515625, -3.7056884765625, -3.551025390625, -3.3963623046875, -3.24169921875, -3.0870361328125, -2.932373046875, -2.7777099609375, -2.623046875, -2.4683837890625, -2.313720703125, -2.1590576171875, -2.00439453125, -1.8497314453125, -1.695068359375, -1.5404052734375, -1.3857421875, -1.2310791015625, -1.076416015625, -0.9217529296875, -0.76708984375, -0.6124267578125, -0.457763671875, -0.3031005859375, -0.1484375, 0.0062255859375, 0.160888671875, 0.3155517578125, 0.47021484375, 0.6248779296875, 0.779541015625, 0.9342041015625, 1.0888671875, 1.2435302734375, 1.398193359375, 1.5528564453125, 1.70751953125, 1.8621826171875, 2.016845703125, 2.1715087890625, 2.326171875, 2.4808349609375, 2.635498046875, 2.7901611328125, 2.94482421875, 3.0994873046875, 3.254150390625, 3.4088134765625, 3.5634765625, 3.7181396484375, 3.872802734375, 4.0274658203125, 4.18212890625, 4.3367919921875, 4.491455078125, 4.6461181640625, 4.80078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 10.0, 12.0, 16.0, 24.0, 34.0, 51.0, 40.0, 65.0, 62.0, 105.0, 84.0, 77.0, 70.0, 70.0, 64.0, 55.0, 45.0, 36.0, 24.0, 26.0, 12.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0], "bins": [-16.1875, -15.84991455078125, -15.5123291015625, -15.17474365234375, -14.837158203125, -14.49957275390625, -14.1619873046875, -13.82440185546875, -13.48681640625, -13.14923095703125, -12.8116455078125, -12.47406005859375, -12.136474609375, -11.79888916015625, -11.4613037109375, -11.12371826171875, -10.7861328125, -10.44854736328125, -10.1109619140625, -9.77337646484375, -9.435791015625, -9.09820556640625, -8.7606201171875, -8.42303466796875, -8.08544921875, -7.74786376953125, -7.4102783203125, -7.07269287109375, -6.735107421875, -6.39752197265625, -6.0599365234375, -5.72235107421875, -5.384765625, -5.04718017578125, -4.7095947265625, -4.37200927734375, -4.034423828125, -3.69683837890625, -3.3592529296875, -3.02166748046875, -2.68408203125, -2.34649658203125, -2.0089111328125, -1.67132568359375, -1.333740234375, -0.99615478515625, -0.6585693359375, -0.32098388671875, 0.0166015625, 0.35418701171875, 0.6917724609375, 1.02935791015625, 1.366943359375, 1.70452880859375, 2.0421142578125, 2.37969970703125, 2.71728515625, 3.05487060546875, 3.3924560546875, 3.73004150390625, 4.067626953125, 4.40521240234375, 4.7427978515625, 5.08038330078125, 5.41796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 17.0, 12.0, 24.0, 41.0, 41.0, 95.0, 139.0, 223.0, 377.0, 721.0, 1198.0, 2220.0, 4218.0, 8389.0, 16971.0, 34247.0, 69084.0, 129622.0, 204957.0, 224682.0, 163915.0, 92885.0, 47082.0, 23374.0, 11466.0, 5738.0, 2992.0, 1570.0, 961.0, 500.0, 290.0, 178.0, 119.0, 80.0, 39.0, 29.0, 11.0, 8.0, 6.0, 8.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.022796630859375, -0.98895263671875, -0.955108642578125, -0.9212646484375, -0.887420654296875, -0.85357666015625, -0.819732666015625, -0.785888671875, -0.752044677734375, -0.71820068359375, -0.684356689453125, -0.6505126953125, -0.616668701171875, -0.58282470703125, -0.548980712890625, -0.51513671875, -0.481292724609375, -0.44744873046875, -0.413604736328125, -0.3797607421875, -0.345916748046875, -0.31207275390625, -0.278228759765625, -0.244384765625, -0.210540771484375, -0.17669677734375, -0.142852783203125, -0.1090087890625, -0.075164794921875, -0.04132080078125, -0.007476806640625, 0.0263671875, 0.060211181640625, 0.09405517578125, 0.127899169921875, 0.1617431640625, 0.195587158203125, 0.22943115234375, 0.263275146484375, 0.297119140625, 0.330963134765625, 0.36480712890625, 0.398651123046875, 0.4324951171875, 0.466339111328125, 0.50018310546875, 0.534027099609375, 0.56787109375, 0.601715087890625, 0.63555908203125, 0.669403076171875, 0.7032470703125, 0.737091064453125, 0.77093505859375, 0.804779052734375, 0.838623046875, 0.872467041015625, 0.90631103515625, 0.940155029296875, 0.9739990234375, 1.007843017578125, 1.04168701171875, 1.075531005859375, 1.109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 2.0, 9.0, 16.0, 8.0, 18.0, 21.0, 24.0, 14.0, 32.0, 21.0, 36.0, 30.0, 39.0, 60.0, 49.0, 52.0, 40.0, 44.0, 48.0, 41.0, 46.0, 42.0, 41.0, 45.0, 37.0, 38.0, 27.0, 19.0, 17.0, 18.0, 12.0, 10.0, 12.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.3515625, -12.947998046875, -12.54443359375, -12.140869140625, -11.7373046875, -11.333740234375, -10.93017578125, -10.526611328125, -10.123046875, -9.719482421875, -9.31591796875, -8.912353515625, -8.5087890625, -8.105224609375, -7.70166015625, -7.298095703125, -6.89453125, -6.490966796875, -6.08740234375, -5.683837890625, -5.2802734375, -4.876708984375, -4.47314453125, -4.069580078125, -3.666015625, -3.262451171875, -2.85888671875, -2.455322265625, -2.0517578125, -1.648193359375, -1.24462890625, -0.841064453125, -0.4375, -0.033935546875, 0.36962890625, 0.773193359375, 1.1767578125, 1.580322265625, 1.98388671875, 2.387451171875, 2.791015625, 3.194580078125, 3.59814453125, 4.001708984375, 4.4052734375, 4.808837890625, 5.21240234375, 5.615966796875, 6.01953125, 6.423095703125, 6.82666015625, 7.230224609375, 7.6337890625, 8.037353515625, 8.44091796875, 8.844482421875, 9.248046875, 9.651611328125, 10.05517578125, 10.458740234375, 10.8623046875, 11.265869140625, 11.66943359375, 12.072998046875, 12.4765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 17.0, 17.0, 37.0, 43.0, 65.0, 90.0, 134.0, 268.0, 357.0, 656.0, 1139.0, 2295.0, 4774.0, 11374.0, 31488.0, 94491.0, 241968.0, 339361.0, 203083.0, 74212.0, 24824.0, 9272.0, 3988.0, 1956.0, 1058.0, 570.0, 378.0, 216.0, 139.0, 99.0, 68.0, 39.0, 31.0, 17.0, 7.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.351531982421875, -0.34100341796875, -0.330474853515625, -0.3199462890625, -0.309417724609375, -0.29888916015625, -0.288360595703125, -0.27783203125, -0.267303466796875, -0.25677490234375, -0.246246337890625, -0.2357177734375, -0.225189208984375, -0.21466064453125, -0.204132080078125, -0.193603515625, -0.183074951171875, -0.17254638671875, -0.162017822265625, -0.1514892578125, -0.140960693359375, -0.13043212890625, -0.119903564453125, -0.109375, -0.098846435546875, -0.08831787109375, -0.077789306640625, -0.0672607421875, -0.056732177734375, -0.04620361328125, -0.035675048828125, -0.025146484375, -0.014617919921875, -0.00408935546875, 0.006439208984375, 0.0169677734375, 0.027496337890625, 0.03802490234375, 0.048553466796875, 0.05908203125, 0.069610595703125, 0.08013916015625, 0.090667724609375, 0.1011962890625, 0.111724853515625, 0.12225341796875, 0.132781982421875, 0.143310546875, 0.153839111328125, 0.16436767578125, 0.174896240234375, 0.1854248046875, 0.195953369140625, 0.20648193359375, 0.217010498046875, 0.2275390625, 0.238067626953125, 0.24859619140625, 0.259124755859375, 0.2696533203125, 0.280181884765625, 0.29071044921875, 0.301239013671875, 0.311767578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 10.0, 12.0, 23.0, 21.0, 47.0, 44.0, 48.0, 75.0, 82.0, 81.0, 92.0, 98.0, 79.0, 68.0, 55.0, 34.0, 28.0, 19.0, 20.0, 9.0, 10.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021886825561523438, -0.00021162629127502441, -0.00020438432693481445, -0.0001971423625946045, -0.00018990039825439453, -0.00018265843391418457, -0.0001754164695739746, -0.00016817450523376465, -0.0001609325408935547, -0.00015369057655334473, -0.00014644861221313477, -0.0001392066478729248, -0.00013196468353271484, -0.00012472271919250488, -0.00011748075485229492, -0.00011023879051208496, -0.000102996826171875, -9.575486183166504e-05, -8.851289749145508e-05, -8.127093315124512e-05, -7.402896881103516e-05, -6.67870044708252e-05, -5.9545040130615234e-05, -5.2303075790405273e-05, -4.506111145019531e-05, -3.781914710998535e-05, -3.057718276977539e-05, -2.333521842956543e-05, -1.609325408935547e-05, -8.851289749145508e-06, -1.6093254089355469e-06, 5.632638931274414e-06, 1.2874603271484375e-05, 2.0116567611694336e-05, 2.7358531951904297e-05, 3.460049629211426e-05, 4.184246063232422e-05, 4.908442497253418e-05, 5.632638931274414e-05, 6.35683536529541e-05, 7.081031799316406e-05, 7.805228233337402e-05, 8.529424667358398e-05, 9.253621101379395e-05, 9.97781753540039e-05, 0.00010702013969421387, 0.00011426210403442383, 0.00012150406837463379, 0.00012874603271484375, 0.0001359879970550537, 0.00014322996139526367, 0.00015047192573547363, 0.0001577138900756836, 0.00016495585441589355, 0.00017219781875610352, 0.00017943978309631348, 0.00018668174743652344, 0.0001939237117767334, 0.00020116567611694336, 0.00020840764045715332, 0.00021564960479736328, 0.00022289156913757324, 0.0002301335334777832, 0.00023737549781799316, 0.0002446174621582031]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 11.0, 14.0, 28.0, 27.0, 50.0, 61.0, 78.0, 126.0, 176.0, 293.0, 502.0, 1077.0, 2800.0, 8660.0, 30453.0, 104259.0, 272395.0, 351502.0, 189112.0, 61075.0, 17148.0, 5105.0, 1777.0, 693.0, 372.0, 222.0, 147.0, 89.0, 73.0, 52.0, 43.0, 23.0, 22.0, 12.0, 12.0, 8.0, 6.0, 3.0, 8.0, 6.0, 4.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.334716796875, -0.3232841491699219, -0.31185150146484375, -0.3004188537597656, -0.2889862060546875, -0.2775535583496094, -0.26612091064453125, -0.2546882629394531, -0.243255615234375, -0.23182296752929688, -0.22039031982421875, -0.20895767211914062, -0.1975250244140625, -0.18609237670898438, -0.17465972900390625, -0.16322708129882812, -0.15179443359375, -0.14036178588867188, -0.12892913818359375, -0.11749649047851562, -0.1060638427734375, -0.09463119506835938, -0.08319854736328125, -0.07176589965820312, -0.060333251953125, -0.048900604248046875, -0.03746795654296875, -0.026035308837890625, -0.0146026611328125, -0.003170013427734375, 0.00826263427734375, 0.019695281982421875, 0.0311279296875, 0.042560577392578125, 0.05399322509765625, 0.06542587280273438, 0.0768585205078125, 0.08829116821289062, 0.09972381591796875, 0.11115646362304688, 0.122589111328125, 0.13402175903320312, 0.14545440673828125, 0.15688705444335938, 0.1683197021484375, 0.17975234985351562, 0.19118499755859375, 0.20261764526367188, 0.21405029296875, 0.22548294067382812, 0.23691558837890625, 0.24834823608398438, 0.2597808837890625, 0.2712135314941406, 0.28264617919921875, 0.2940788269042969, 0.305511474609375, 0.3169441223144531, 0.32837677001953125, 0.3398094177246094, 0.3512420654296875, 0.3626747131347656, 0.37410736083984375, 0.3855400085449219, 0.39697265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 12.0, 15.0, 11.0, 15.0, 30.0, 26.0, 40.0, 40.0, 47.0, 55.0, 47.0, 51.0, 67.0, 60.0, 39.0, 59.0, 58.0, 46.0, 43.0, 38.0, 39.0, 35.0, 29.0, 18.0, 17.0, 7.0, 14.0, 3.0, 6.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14709854125976562, -0.14331817626953125, -0.13953781127929688, -0.1357574462890625, -0.13197708129882812, -0.12819671630859375, -0.12441635131835938, -0.120635986328125, -0.11685562133789062, -0.11307525634765625, -0.10929489135742188, -0.1055145263671875, -0.10173416137695312, -0.09795379638671875, -0.09417343139648438, -0.09039306640625, -0.08661270141601562, -0.08283233642578125, -0.07905197143554688, -0.0752716064453125, -0.07149124145507812, -0.06771087646484375, -0.06393051147460938, -0.060150146484375, -0.056369781494140625, -0.05258941650390625, -0.048809051513671875, -0.0450286865234375, -0.041248321533203125, -0.03746795654296875, -0.033687591552734375, -0.0299072265625, -0.026126861572265625, -0.02234649658203125, -0.018566131591796875, -0.0147857666015625, -0.011005401611328125, -0.00722503662109375, -0.003444671630859375, 0.000335693359375, 0.004116058349609375, 0.00789642333984375, 0.011676788330078125, 0.0154571533203125, 0.019237518310546875, 0.02301788330078125, 0.026798248291015625, 0.03057861328125, 0.034358978271484375, 0.03813934326171875, 0.041919708251953125, 0.0457000732421875, 0.049480438232421875, 0.05326080322265625, 0.057041168212890625, 0.060821533203125, 0.06460189819335938, 0.06838226318359375, 0.07216262817382812, 0.0759429931640625, 0.07972335815429688, 0.08350372314453125, 0.08728408813476562, 0.091064453125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 15.0, 38.0, 78.0, 147.0, 188.0, 226.0, 164.0, 73.0, 44.0, 23.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.770256042480469, -11.11961555480957, -10.468976020812988, -9.81833553314209, -9.167695999145508, -8.51705551147461, -7.866415500640869, -7.215775489807129, -6.565135478973389, -5.914495468139648, -5.263855457305908, -4.613215446472168, -3.9625751972198486, -3.3119351863861084, -2.661294937133789, -2.010654926300049, -1.3600149154663086, -0.7093748450279236, -0.058734774589538574, 0.5919053554534912, 1.2425453662872314, 1.8931853771209717, 2.543825626373291, 3.1944656372070312, 3.8451056480407715, 4.495745658874512, 5.146385669708252, 5.797025680541992, 6.447666168212891, 7.098305702209473, 7.748946189880371, 8.399585723876953, 9.050226211547852, 9.70086669921875, 10.351506233215332, 11.00214672088623, 11.652786254882812, 12.303426742553711, 12.95406723022461, 13.604706764221191, 14.255346298217773, 14.905986785888672, 15.556626319885254, 16.207265853881836, 16.857906341552734, 17.508546829223633, 18.15918731689453, 18.809825897216797, 19.460468292236328, 20.111108779907227, 20.761749267578125, 21.41238784790039, 22.06302833557129, 22.713668823242188, 23.364309310913086, 24.014949798583984, 24.66558837890625, 25.31622886657715, 25.966869354248047, 26.617507934570312, 27.26814842224121, 27.91878890991211, 28.569429397583008, 29.220069885253906, 29.870708465576172]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 11.0, 12.0, 18.0, 14.0, 21.0, 32.0, 53.0, 54.0, 66.0, 75.0, 86.0, 86.0, 66.0, 64.0, 78.0, 59.0, 48.0, 37.0, 40.0, 30.0, 16.0, 13.0, 11.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-14.457428932189941, -14.147439956665039, -13.83745002746582, -13.527461051940918, -13.2174711227417, -12.907482147216797, -12.597492218017578, -12.287503242492676, -11.977513313293457, -11.667524337768555, -11.357534408569336, -11.047545433044434, -10.737555503845215, -10.427566528320312, -10.117576599121094, -9.807587623596191, -9.497598648071289, -9.187609672546387, -8.877619743347168, -8.567630767822266, -8.257640838623047, -7.947651386260986, -7.637661933898926, -7.327672958374023, -7.017683029174805, -6.707693576812744, -6.397704124450684, -6.087714672088623, -5.7777252197265625, -5.467735767364502, -5.157746315002441, -4.847757339477539, -4.53776741027832, -4.22777795791626, -3.917788505554199, -3.6077990531921387, -3.297809600830078, -2.9878201484680176, -2.677830934524536, -2.3678414821624756, -2.057852029800415, -1.7478625774383545, -1.437873125076294, -1.127883791923523, -0.8178943395614624, -0.5079048871994019, -0.19791555404663086, 0.11207389831542969, 0.42206335067749023, 0.7320528030395508, 1.0420422554016113, 1.3520315885543823, 1.6620210409164429, 1.9720104932785034, 2.2819998264312744, 2.591989278793335, 2.9019787311553955, 3.211968183517456, 3.5219576358795166, 3.831946849822998, 4.141936302185059, 4.451925754547119, 4.76191520690918, 5.07190465927124, 5.381894111633301]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 8.0, 11.0, 21.0, 46.0, 46.0, 97.0, 170.0, 366.0, 907.0, 3082.0, 13831.0, 77195.0, 570219.0, 322279.0, 47832.0, 8954.0, 2112.0, 743.0, 291.0, 157.0, 86.0, 39.0, 16.0, 12.0, 16.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.3575439453125, -11.011962890625, -10.6663818359375, -10.32080078125, -9.9752197265625, -9.629638671875, -9.2840576171875, -8.9384765625, -8.5928955078125, -8.247314453125, -7.9017333984375, -7.55615234375, -7.2105712890625, -6.864990234375, -6.5194091796875, -6.173828125, -5.8282470703125, -5.482666015625, -5.1370849609375, -4.79150390625, -4.4459228515625, -4.100341796875, -3.7547607421875, -3.4091796875, -3.0635986328125, -2.718017578125, -2.3724365234375, -2.02685546875, -1.6812744140625, -1.335693359375, -0.9901123046875, -0.64453125, -0.2989501953125, 0.046630859375, 0.3922119140625, 0.73779296875, 1.0833740234375, 1.428955078125, 1.7745361328125, 2.1201171875, 2.4656982421875, 2.811279296875, 3.1568603515625, 3.50244140625, 3.8480224609375, 4.193603515625, 4.5391845703125, 4.884765625, 5.2303466796875, 5.575927734375, 5.9215087890625, 6.26708984375, 6.6126708984375, 6.958251953125, 7.3038330078125, 7.6494140625, 7.9949951171875, 8.340576171875, 8.6861572265625, 9.03173828125, 9.3773193359375, 9.722900390625, 10.0684814453125, 10.4140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 6.0, 11.0, 13.0, 13.0, 28.0, 20.0, 44.0, 39.0, 53.0, 61.0, 66.0, 79.0, 65.0, 62.0, 78.0, 74.0, 50.0, 60.0, 34.0, 44.0, 31.0, 20.0, 19.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 4.0], "bins": [-24.078125, -23.56298828125, -23.0478515625, -22.53271484375, -22.017578125, -21.50244140625, -20.9873046875, -20.47216796875, -19.95703125, -19.44189453125, -18.9267578125, -18.41162109375, -17.896484375, -17.38134765625, -16.8662109375, -16.35107421875, -15.8359375, -15.32080078125, -14.8056640625, -14.29052734375, -13.775390625, -13.26025390625, -12.7451171875, -12.22998046875, -11.71484375, -11.19970703125, -10.6845703125, -10.16943359375, -9.654296875, -9.13916015625, -8.6240234375, -8.10888671875, -7.59375, -7.07861328125, -6.5634765625, -6.04833984375, -5.533203125, -5.01806640625, -4.5029296875, -3.98779296875, -3.47265625, -2.95751953125, -2.4423828125, -1.92724609375, -1.412109375, -0.89697265625, -0.3818359375, 0.13330078125, 0.6484375, 1.16357421875, 1.6787109375, 2.19384765625, 2.708984375, 3.22412109375, 3.7392578125, 4.25439453125, 4.76953125, 5.28466796875, 5.7998046875, 6.31494140625, 6.830078125, 7.34521484375, 7.8603515625, 8.37548828125, 8.890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 10.0, 17.0, 23.0, 24.0, 31.0, 46.0, 81.0, 128.0, 204.0, 451.0, 1454.0, 17602.0, 853160.0, 169224.0, 4451.0, 826.0, 299.0, 150.0, 104.0, 61.0, 37.0, 42.0, 28.0, 20.0, 12.0, 12.0, 11.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.759521484375, -21.00341796875, -20.247314453125, -19.4912109375, -18.735107421875, -17.97900390625, -17.222900390625, -16.466796875, -15.710693359375, -14.95458984375, -14.198486328125, -13.4423828125, -12.686279296875, -11.93017578125, -11.174072265625, -10.41796875, -9.661865234375, -8.90576171875, -8.149658203125, -7.3935546875, -6.637451171875, -5.88134765625, -5.125244140625, -4.369140625, -3.613037109375, -2.85693359375, -2.100830078125, -1.3447265625, -0.588623046875, 0.16748046875, 0.923583984375, 1.6796875, 2.435791015625, 3.19189453125, 3.947998046875, 4.7041015625, 5.460205078125, 6.21630859375, 6.972412109375, 7.728515625, 8.484619140625, 9.24072265625, 9.996826171875, 10.7529296875, 11.509033203125, 12.26513671875, 13.021240234375, 13.77734375, 14.533447265625, 15.28955078125, 16.045654296875, 16.8017578125, 17.557861328125, 18.31396484375, 19.070068359375, 19.826171875, 20.582275390625, 21.33837890625, 22.094482421875, 22.8505859375, 23.606689453125, 24.36279296875, 25.118896484375, 25.875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 15.0, 9.0, 4.0, 20.0, 21.0, 24.0, 20.0, 26.0, 45.0, 36.0, 30.0, 41.0, 31.0, 55.0, 62.0, 76.0, 48.0, 49.0, 37.0, 52.0, 39.0, 28.0, 26.0, 35.0, 27.0, 25.0, 21.0, 15.0, 15.0, 12.0, 13.0, 11.0, 2.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.84375, -13.38916015625, -12.9345703125, -12.47998046875, -12.025390625, -11.57080078125, -11.1162109375, -10.66162109375, -10.20703125, -9.75244140625, -9.2978515625, -8.84326171875, -8.388671875, -7.93408203125, -7.4794921875, -7.02490234375, -6.5703125, -6.11572265625, -5.6611328125, -5.20654296875, -4.751953125, -4.29736328125, -3.8427734375, -3.38818359375, -2.93359375, -2.47900390625, -2.0244140625, -1.56982421875, -1.115234375, -0.66064453125, -0.2060546875, 0.24853515625, 0.703125, 1.15771484375, 1.6123046875, 2.06689453125, 2.521484375, 2.97607421875, 3.4306640625, 3.88525390625, 4.33984375, 4.79443359375, 5.2490234375, 5.70361328125, 6.158203125, 6.61279296875, 7.0673828125, 7.52197265625, 7.9765625, 8.43115234375, 8.8857421875, 9.34033203125, 9.794921875, 10.24951171875, 10.7041015625, 11.15869140625, 11.61328125, 12.06787109375, 12.5224609375, 12.97705078125, 13.431640625, 13.88623046875, 14.3408203125, 14.79541015625, 15.25]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 8.0, 11.0, 7.0, 15.0, 20.0, 38.0, 67.0, 99.0, 224.0, 558.0, 2307.0, 21707.0, 766875.0, 245797.0, 8690.0, 1319.0, 385.0, 167.0, 68.0, 38.0, 32.0, 19.0, 19.0, 19.0, 10.0, 9.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.20703125, -6.9940185546875, -6.781005859375, -6.5679931640625, -6.35498046875, -6.1419677734375, -5.928955078125, -5.7159423828125, -5.5029296875, -5.2899169921875, -5.076904296875, -4.8638916015625, -4.65087890625, -4.4378662109375, -4.224853515625, -4.0118408203125, -3.798828125, -3.5858154296875, -3.372802734375, -3.1597900390625, -2.94677734375, -2.7337646484375, -2.520751953125, -2.3077392578125, -2.0947265625, -1.8817138671875, -1.668701171875, -1.4556884765625, -1.24267578125, -1.0296630859375, -0.816650390625, -0.6036376953125, -0.390625, -0.1776123046875, 0.035400390625, 0.2484130859375, 0.46142578125, 0.6744384765625, 0.887451171875, 1.1004638671875, 1.3134765625, 1.5264892578125, 1.739501953125, 1.9525146484375, 2.16552734375, 2.3785400390625, 2.591552734375, 2.8045654296875, 3.017578125, 3.2305908203125, 3.443603515625, 3.6566162109375, 3.86962890625, 4.0826416015625, 4.295654296875, 4.5086669921875, 4.7216796875, 4.9346923828125, 5.147705078125, 5.3607177734375, 5.57373046875, 5.7867431640625, 5.999755859375, 6.2127685546875, 6.42578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 9.0, 9.0, 9.0, 14.0, 8.0, 21.0, 25.0, 41.0, 57.0, 79.0, 105.0, 160.0, 129.0, 87.0, 65.0, 43.0, 31.0, 22.0, 18.0, 24.0, 9.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.0007109642028808594, -0.0006926655769348145, -0.0006743669509887695, -0.0006560683250427246, -0.0006377696990966797, -0.0006194710731506348, -0.0006011724472045898, -0.0005828738212585449, -0.0005645751953125, -0.0005462765693664551, -0.0005279779434204102, -0.0005096793174743652, -0.0004913806915283203, -0.0004730820655822754, -0.00045478343963623047, -0.00043648481369018555, -0.0004181861877441406, -0.0003998875617980957, -0.0003815889358520508, -0.00036329030990600586, -0.00034499168395996094, -0.000326693058013916, -0.0003083944320678711, -0.00029009580612182617, -0.00027179718017578125, -0.00025349855422973633, -0.0002351999282836914, -0.00021690130233764648, -0.00019860267639160156, -0.00018030405044555664, -0.00016200542449951172, -0.0001437067985534668, -0.00012540817260742188, -0.00010710954666137695, -8.881092071533203e-05, -7.051229476928711e-05, -5.221366882324219e-05, -3.3915042877197266e-05, -1.5616416931152344e-05, 2.682209014892578e-06, 2.09808349609375e-05, 3.927946090698242e-05, 5.7578086853027344e-05, 7.587671279907227e-05, 9.417533874511719e-05, 0.00011247396469116211, 0.00013077259063720703, 0.00014907121658325195, 0.00016736984252929688, 0.0001856684684753418, 0.00020396709442138672, 0.00022226572036743164, 0.00024056434631347656, 0.0002588629722595215, 0.0002771615982055664, 0.00029546022415161133, 0.00031375885009765625, 0.00033205747604370117, 0.0003503561019897461, 0.000368654727935791, 0.00038695335388183594, 0.00040525197982788086, 0.0004235506057739258, 0.0004418492317199707, 0.0004601478576660156]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 12.0, 14.0, 17.0, 25.0, 49.0, 85.0, 167.0, 362.0, 1034.0, 3359.0, 25910.0, 808551.0, 197440.0, 8385.0, 1868.0, 661.0, 271.0, 125.0, 83.0, 43.0, 27.0, 15.0, 15.0, 4.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.890625, -8.6552734375, -8.419921875, -8.1845703125, -7.94921875, -7.7138671875, -7.478515625, -7.2431640625, -7.0078125, -6.7724609375, -6.537109375, -6.3017578125, -6.06640625, -5.8310546875, -5.595703125, -5.3603515625, -5.125, -4.8896484375, -4.654296875, -4.4189453125, -4.18359375, -3.9482421875, -3.712890625, -3.4775390625, -3.2421875, -3.0068359375, -2.771484375, -2.5361328125, -2.30078125, -2.0654296875, -1.830078125, -1.5947265625, -1.359375, -1.1240234375, -0.888671875, -0.6533203125, -0.41796875, -0.1826171875, 0.052734375, 0.2880859375, 0.5234375, 0.7587890625, 0.994140625, 1.2294921875, 1.46484375, 1.7001953125, 1.935546875, 2.1708984375, 2.40625, 2.6416015625, 2.876953125, 3.1123046875, 3.34765625, 3.5830078125, 3.818359375, 4.0537109375, 4.2890625, 4.5244140625, 4.759765625, 4.9951171875, 5.23046875, 5.4658203125, 5.701171875, 5.9365234375, 6.171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 10.0, 21.0, 43.0, 75.0, 140.0, 286.0, 195.0, 105.0, 50.0, 33.0, 14.0, 13.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76171875, -2.64019775390625, -2.5186767578125, -2.39715576171875, -2.275634765625, -2.15411376953125, -2.0325927734375, -1.91107177734375, -1.78955078125, -1.66802978515625, -1.5465087890625, -1.42498779296875, -1.303466796875, -1.18194580078125, -1.0604248046875, -0.93890380859375, -0.8173828125, -0.69586181640625, -0.5743408203125, -0.45281982421875, -0.331298828125, -0.20977783203125, -0.0882568359375, 0.03326416015625, 0.15478515625, 0.27630615234375, 0.3978271484375, 0.51934814453125, 0.640869140625, 0.76239013671875, 0.8839111328125, 1.00543212890625, 1.126953125, 1.24847412109375, 1.3699951171875, 1.49151611328125, 1.613037109375, 1.73455810546875, 1.8560791015625, 1.97760009765625, 2.09912109375, 2.22064208984375, 2.3421630859375, 2.46368408203125, 2.585205078125, 2.70672607421875, 2.8282470703125, 2.94976806640625, 3.0712890625, 3.19281005859375, 3.3143310546875, 3.43585205078125, 3.557373046875, 3.67889404296875, 3.8004150390625, 3.92193603515625, 4.04345703125, 4.16497802734375, 4.2864990234375, 4.40802001953125, 4.529541015625, 4.65106201171875, 4.7725830078125, 4.89410400390625, 5.015625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 9.0, 55.0, 306.0, 448.0, 177.0, 17.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.826820373535156, -9.848483085632324, -6.870145797729492, -3.89180850982666, -0.9134712219238281, 2.064866065979004, 5.043203353881836, 8.021541595458984, 10.9998779296875, 13.978215217590332, 16.956552505493164, 19.934890747070312, 22.913227081298828, 25.891563415527344, 28.869901657104492, 31.84823989868164, 34.826576232910156, 37.80491256713867, 40.78324890136719, 43.76158905029297, 46.739925384521484, 49.71826171875, 52.69660186767578, 55.6749382019043, 58.65327453613281, 61.63161087036133, 64.60994720458984, 67.58828735351562, 70.56661987304688, 73.54496002197266, 76.52330017089844, 79.50163269042969, 82.47996520996094, 85.45830535888672, 88.43663787841797, 91.41497802734375, 94.393310546875, 97.37165069580078, 100.34999084472656, 103.32832336425781, 106.3066635131836, 109.28500366210938, 112.26333618164062, 115.2416763305664, 118.22001647949219, 121.19834899902344, 124.17668914794922, 127.155029296875, 130.13336181640625, 133.1116943359375, 136.0900421142578, 139.06837463378906, 142.0467071533203, 145.02505493164062, 148.00338745117188, 150.98171997070312, 153.96005249023438, 156.93838500976562, 159.91673278808594, 162.8950653076172, 165.87339782714844, 168.85174560546875, 171.830078125, 174.80841064453125, 177.78675842285156]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 9.0, 11.0, 14.0, 18.0, 22.0, 28.0, 32.0, 32.0, 40.0, 59.0, 57.0, 55.0, 53.0, 63.0, 66.0, 72.0, 54.0, 47.0, 47.0, 40.0, 38.0, 26.0, 25.0, 17.0, 15.0, 15.0, 13.0, 7.0, 5.0, 2.0, 10.0, 3.0, 2.0, 2.0, 1.0], "bins": [-37.90641403198242, -37.00166320800781, -36.0969123840332, -35.19215774536133, -34.28740692138672, -33.38265609741211, -32.4779052734375, -31.573152542114258, -30.668399810791016, -29.763648986816406, -28.858896255493164, -27.954145431518555, -27.049392700195312, -26.144641876220703, -25.239891052246094, -24.33513832092285, -23.430387496948242, -22.525636672973633, -21.62088394165039, -20.71613311767578, -19.81138038635254, -18.90662956237793, -18.001876831054688, -17.097126007080078, -16.19237518310547, -15.287623405456543, -14.382871627807617, -13.478120803833008, -12.573368072509766, -11.668617248535156, -10.76386547088623, -9.859113693237305, -8.954362869262695, -8.04961109161377, -7.144859313964844, -6.240108013153076, -5.33535623550415, -4.430604457855225, -3.525853157043457, -2.6211013793945312, -1.7163496017456055, -0.8115979433059692, 0.09315371513366699, 0.9979052543640137, 1.9026570320129395, 2.8074088096618652, 3.712160110473633, 4.616911888122559, 5.521663665771484, 6.42641544342041, 7.331167221069336, 8.235918045043945, 9.140670776367188, 10.045421600341797, 10.950173377990723, 11.854925155639648, 12.759676933288574, 13.6644287109375, 14.569180488586426, 15.473932266235352, 16.37868309020996, 17.283435821533203, 18.188186645507812, 19.092937469482422, 19.997690200805664]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 7.0, 17.0, 12.0, 36.0, 59.0, 102.0, 189.0, 374.0, 767.0, 1825.0, 5608.0, 24633.0, 225240.0, 2354941.0, 1448378.0, 110069.0, 15284.0, 3958.0, 1480.0, 583.0, 299.0, 183.0, 70.0, 65.0, 26.0, 25.0, 12.0, 15.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1015625, -10.688232421875, -10.27490234375, -9.861572265625, -9.4482421875, -9.034912109375, -8.62158203125, -8.208251953125, -7.794921875, -7.381591796875, -6.96826171875, -6.554931640625, -6.1416015625, -5.728271484375, -5.31494140625, -4.901611328125, -4.48828125, -4.074951171875, -3.66162109375, -3.248291015625, -2.8349609375, -2.421630859375, -2.00830078125, -1.594970703125, -1.181640625, -0.768310546875, -0.35498046875, 0.058349609375, 0.4716796875, 0.885009765625, 1.29833984375, 1.711669921875, 2.125, 2.538330078125, 2.95166015625, 3.364990234375, 3.7783203125, 4.191650390625, 4.60498046875, 5.018310546875, 5.431640625, 5.844970703125, 6.25830078125, 6.671630859375, 7.0849609375, 7.498291015625, 7.91162109375, 8.324951171875, 8.73828125, 9.151611328125, 9.56494140625, 9.978271484375, 10.3916015625, 10.804931640625, 11.21826171875, 11.631591796875, 12.044921875, 12.458251953125, 12.87158203125, 13.284912109375, 13.6982421875, 14.111572265625, 14.52490234375, 14.938232421875, 15.3515625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 12.0, 11.0, 16.0, 15.0, 16.0, 15.0, 16.0, 32.0, 40.0, 30.0, 48.0, 54.0, 53.0, 38.0, 48.0, 53.0, 43.0, 54.0, 50.0, 46.0, 38.0, 46.0, 34.0, 32.0, 30.0, 27.0, 24.0, 14.0, 13.0, 18.0, 8.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.82421875, -6.595703125, -6.3671875, -6.138671875, -5.91015625, -5.681640625, -5.453125, -5.224609375, -4.99609375, -4.767578125, -4.5390625, -4.310546875, -4.08203125, -3.853515625, -3.625, -3.396484375, -3.16796875, -2.939453125, -2.7109375, -2.482421875, -2.25390625, -2.025390625, -1.796875, -1.568359375, -1.33984375, -1.111328125, -0.8828125, -0.654296875, -0.42578125, -0.197265625, 0.03125, 0.259765625, 0.48828125, 0.716796875, 0.9453125, 1.173828125, 1.40234375, 1.630859375, 1.859375, 2.087890625, 2.31640625, 2.544921875, 2.7734375, 3.001953125, 3.23046875, 3.458984375, 3.6875, 3.916015625, 4.14453125, 4.373046875, 4.6015625, 4.830078125, 5.05859375, 5.287109375, 5.515625, 5.744140625, 5.97265625, 6.201171875, 6.4296875, 6.658203125, 6.88671875, 7.115234375, 7.34375, 7.572265625, 7.80078125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 15.0, 17.0, 30.0, 39.0, 67.0, 163.0, 422.0, 1517.0, 10253.0, 476401.0, 3657905.0, 43109.0, 3199.0, 652.0, 239.0, 98.0, 61.0, 24.0, 18.0, 11.0, 4.0, 6.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65625, -25.802978515625, -24.94970703125, -24.096435546875, -23.2431640625, -22.389892578125, -21.53662109375, -20.683349609375, -19.830078125, -18.976806640625, -18.12353515625, -17.270263671875, -16.4169921875, -15.563720703125, -14.71044921875, -13.857177734375, -13.00390625, -12.150634765625, -11.29736328125, -10.444091796875, -9.5908203125, -8.737548828125, -7.88427734375, -7.031005859375, -6.177734375, -5.324462890625, -4.47119140625, -3.617919921875, -2.7646484375, -1.911376953125, -1.05810546875, -0.204833984375, 0.6484375, 1.501708984375, 2.35498046875, 3.208251953125, 4.0615234375, 4.914794921875, 5.76806640625, 6.621337890625, 7.474609375, 8.327880859375, 9.18115234375, 10.034423828125, 10.8876953125, 11.740966796875, 12.59423828125, 13.447509765625, 14.30078125, 15.154052734375, 16.00732421875, 16.860595703125, 17.7138671875, 18.567138671875, 19.42041015625, 20.273681640625, 21.126953125, 21.980224609375, 22.83349609375, 23.686767578125, 24.5400390625, 25.393310546875, 26.24658203125, 27.099853515625, 27.953125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 10.0, 11.0, 15.0, 20.0, 21.0, 32.0, 55.0, 74.0, 116.0, 173.0, 243.0, 383.0, 517.0, 552.0, 552.0, 403.0, 301.0, 210.0, 109.0, 92.0, 38.0, 30.0, 32.0, 15.0, 14.0, 13.0, 8.0, 10.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.08538818359375, -2.9598388671875, -2.83428955078125, -2.708740234375, -2.58319091796875, -2.4576416015625, -2.33209228515625, -2.20654296875, -2.08099365234375, -1.9554443359375, -1.82989501953125, -1.704345703125, -1.57879638671875, -1.4532470703125, -1.32769775390625, -1.2021484375, -1.07659912109375, -0.9510498046875, -0.82550048828125, -0.699951171875, -0.57440185546875, -0.4488525390625, -0.32330322265625, -0.19775390625, -0.07220458984375, 0.0533447265625, 0.17889404296875, 0.304443359375, 0.42999267578125, 0.5555419921875, 0.68109130859375, 0.806640625, 0.93218994140625, 1.0577392578125, 1.18328857421875, 1.308837890625, 1.43438720703125, 1.5599365234375, 1.68548583984375, 1.81103515625, 1.93658447265625, 2.0621337890625, 2.18768310546875, 2.313232421875, 2.43878173828125, 2.5643310546875, 2.68988037109375, 2.8154296875, 2.94097900390625, 3.0665283203125, 3.19207763671875, 3.317626953125, 3.44317626953125, 3.5687255859375, 3.69427490234375, 3.81982421875, 3.94537353515625, 4.0709228515625, 4.19647216796875, 4.322021484375, 4.44757080078125, 4.5731201171875, 4.69866943359375, 4.82421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 14.0, 20.0, 14.0, 21.0, 32.0, 42.0, 44.0, 46.0, 55.0, 64.0, 60.0, 72.0, 69.0, 57.0, 63.0, 62.0, 43.0, 45.0, 32.0, 28.0, 27.0, 25.0, 13.0, 17.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.642107009887695, -13.330656051635742, -13.019205093383789, -12.70775318145752, -12.396302223205566, -12.084851264953613, -11.77340030670166, -11.46194839477539, -11.150497436523438, -10.839046478271484, -10.527595520019531, -10.216143608093262, -9.904692649841309, -9.593241691589355, -9.281790733337402, -8.970338821411133, -8.65888786315918, -8.347436904907227, -8.035985946655273, -7.724534511566162, -7.413083076477051, -7.101632118225098, -6.7901811599731445, -6.478729724884033, -6.167279243469238, -5.855828285217285, -5.544376850128174, -5.232925891876221, -4.921474456787109, -4.610023498535156, -4.298572540283203, -3.987121105194092, -3.6756691932678223, -3.36421799659729, -3.052766799926758, -2.7413158416748047, -2.4298644065856934, -2.1184134483337402, -1.806962251663208, -1.4955110549926758, -1.1840598583221436, -0.8726086616516113, -0.5611575245857239, -0.24970638751983643, 0.0617448091506958, 0.373196005821228, 0.6846470832824707, 0.9960982799530029, 1.3075494766235352, 1.6190006732940674, 1.9304518699645996, 2.2419028282165527, 2.553354263305664, 2.864805221557617, 3.1762564182281494, 3.4877076148986816, 3.799158811569214, 4.110610008239746, 4.422060966491699, 4.7335124015808105, 5.044963359832764, 5.356414794921875, 5.667865753173828, 5.979316711425781, 6.290768146514893]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 8.0, 6.0, 9.0, 8.0, 9.0, 12.0, 13.0, 15.0, 10.0, 22.0, 18.0, 31.0, 26.0, 32.0, 36.0, 47.0, 36.0, 46.0, 47.0, 52.0, 48.0, 43.0, 49.0, 35.0, 44.0, 27.0, 38.0, 36.0, 31.0, 25.0, 24.0, 18.0, 16.0, 15.0, 13.0, 13.0, 10.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.139963150024414, -7.894216060638428, -7.648468971252441, -7.402721881866455, -7.156974792480469, -6.911227703094482, -6.665480613708496, -6.419734001159668, -6.173986434936523, -5.928239345550537, -5.682492256164551, -5.4367451667785645, -5.190998077392578, -4.945250988006592, -4.6995038986206055, -4.453757286071777, -4.208010196685791, -3.9622631072998047, -3.7165160179138184, -3.470768928527832, -3.2250218391418457, -2.9792747497558594, -2.733527898788452, -2.487780809402466, -2.2420337200164795, -1.9962866306304932, -1.7505395412445068, -1.50479257106781, -1.2590454816818237, -1.0132983922958374, -0.7675514221191406, -0.5218043327331543, -0.27605676651000977, -0.030309706926345825, 0.21543735265731812, 0.46118438243865967, 0.706931471824646, 0.9526785612106323, 1.198425531387329, 1.4441726207733154, 1.6899197101593018, 1.935666799545288, 2.1814138889312744, 2.4271607398986816, 2.672907829284668, 2.9186549186706543, 3.1644020080566406, 3.410149097442627, 3.6558961868286133, 3.9016432762145996, 4.147390365600586, 4.393137454986572, 4.638884544372559, 4.884631633758545, 5.130378723144531, 5.376125335693359, 5.621872901916504, 5.86761999130249, 6.113367080688477, 6.359114170074463, 6.604861259460449, 6.8506083488464355, 7.096355438232422, 7.34210205078125, 7.587849140167236]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 6.0, 6.0, 11.0, 18.0, 11.0, 31.0, 32.0, 66.0, 67.0, 131.0, 190.0, 349.0, 682.0, 1345.0, 3038.0, 7614.0, 21083.0, 65759.0, 201549.0, 383008.0, 241562.0, 80404.0, 25660.0, 9086.0, 3566.0, 1580.0, 697.0, 399.0, 208.0, 124.0, 82.0, 55.0, 33.0, 25.0, 23.0, 11.0, 13.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.9632415771484375, -1.901092529296875, -1.8389434814453125, -1.77679443359375, -1.7146453857421875, -1.652496337890625, -1.5903472900390625, -1.5281982421875, -1.4660491943359375, -1.403900146484375, -1.3417510986328125, -1.27960205078125, -1.2174530029296875, -1.155303955078125, -1.0931549072265625, -1.031005859375, -0.9688568115234375, -0.906707763671875, -0.8445587158203125, -0.78240966796875, -0.7202606201171875, -0.658111572265625, -0.5959625244140625, -0.5338134765625, -0.4716644287109375, -0.409515380859375, -0.3473663330078125, -0.28521728515625, -0.2230682373046875, -0.160919189453125, -0.0987701416015625, -0.03662109375, 0.0255279541015625, 0.087677001953125, 0.1498260498046875, 0.21197509765625, 0.2741241455078125, 0.336273193359375, 0.3984222412109375, 0.4605712890625, 0.5227203369140625, 0.584869384765625, 0.6470184326171875, 0.70916748046875, 0.7713165283203125, 0.833465576171875, 0.8956146240234375, 0.957763671875, 1.0199127197265625, 1.082061767578125, 1.1442108154296875, 1.20635986328125, 1.2685089111328125, 1.330657958984375, 1.3928070068359375, 1.4549560546875, 1.5171051025390625, 1.579254150390625, 1.6414031982421875, 1.70355224609375, 1.7657012939453125, 1.827850341796875, 1.8899993896484375, 1.9521484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 9.0, 8.0, 6.0, 12.0, 11.0, 19.0, 9.0, 18.0, 30.0, 34.0, 31.0, 39.0, 46.0, 46.0, 40.0, 54.0, 52.0, 48.0, 67.0, 50.0, 39.0, 41.0, 38.0, 42.0, 33.0, 37.0, 20.0, 30.0, 11.0, 15.0, 12.0, 9.0, 12.0, 9.0, 6.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.20147705078125, -5.0357666015625, -4.87005615234375, -4.704345703125, -4.53863525390625, -4.3729248046875, -4.20721435546875, -4.04150390625, -3.87579345703125, -3.7100830078125, -3.54437255859375, -3.378662109375, -3.21295166015625, -3.0472412109375, -2.88153076171875, -2.7158203125, -2.55010986328125, -2.3843994140625, -2.21868896484375, -2.052978515625, -1.88726806640625, -1.7215576171875, -1.55584716796875, -1.39013671875, -1.22442626953125, -1.0587158203125, -0.89300537109375, -0.727294921875, -0.56158447265625, -0.3958740234375, -0.23016357421875, -0.064453125, 0.10125732421875, 0.2669677734375, 0.43267822265625, 0.598388671875, 0.76409912109375, 0.9298095703125, 1.09552001953125, 1.26123046875, 1.42694091796875, 1.5926513671875, 1.75836181640625, 1.924072265625, 2.08978271484375, 2.2554931640625, 2.42120361328125, 2.5869140625, 2.75262451171875, 2.9183349609375, 3.08404541015625, 3.249755859375, 3.41546630859375, 3.5811767578125, 3.74688720703125, 3.91259765625, 4.07830810546875, 4.2440185546875, 4.40972900390625, 4.575439453125, 4.74114990234375, 4.9068603515625, 5.07257080078125, 5.23828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 5.0, 20.0, 20.0, 31.0, 47.0, 66.0, 76.0, 129.0, 213.0, 350.0, 499.0, 872.0, 1411.0, 2288.0, 3986.0, 6568.0, 10975.0, 18984.0, 31909.0, 53986.0, 87309.0, 131767.0, 172186.0, 171464.0, 132441.0, 88001.0, 53762.0, 32254.0, 19066.0, 11215.0, 6508.0, 3949.0, 2366.0, 1405.0, 825.0, 532.0, 372.0, 214.0, 149.0, 110.0, 75.0, 44.0, 32.0, 23.0, 11.0, 5.0, 7.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.7333984375, -0.7111740112304688, -0.6889495849609375, -0.6667251586914062, -0.644500732421875, -0.6222763061523438, -0.6000518798828125, -0.5778274536132812, -0.55560302734375, -0.5333786010742188, -0.5111541748046875, -0.48892974853515625, -0.466705322265625, -0.44448089599609375, -0.4222564697265625, -0.40003204345703125, -0.3778076171875, -0.35558319091796875, -0.3333587646484375, -0.31113433837890625, -0.288909912109375, -0.26668548583984375, -0.2444610595703125, -0.22223663330078125, -0.20001220703125, -0.17778778076171875, -0.1555633544921875, -0.13333892822265625, -0.111114501953125, -0.08889007568359375, -0.0666656494140625, -0.04444122314453125, -0.022216796875, 7.62939453125e-06, 0.0222320556640625, 0.04445648193359375, 0.066680908203125, 0.08890533447265625, 0.1111297607421875, 0.13335418701171875, 0.15557861328125, 0.17780303955078125, 0.2000274658203125, 0.22225189208984375, 0.244476318359375, 0.26670074462890625, 0.2889251708984375, 0.31114959716796875, 0.3333740234375, 0.35559844970703125, 0.3778228759765625, 0.40004730224609375, 0.422271728515625, 0.44449615478515625, 0.4667205810546875, 0.48894500732421875, 0.51116943359375, 0.5333938598632812, 0.5556182861328125, 0.5778427124023438, 0.600067138671875, 0.6222915649414062, 0.6445159912109375, 0.6667404174804688, 0.68896484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 6.0, 7.0, 9.0, 7.0, 9.0, 6.0, 9.0, 23.0, 17.0, 15.0, 20.0, 27.0, 24.0, 24.0, 34.0, 34.0, 48.0, 46.0, 45.0, 41.0, 41.0, 38.0, 44.0, 38.0, 38.0, 48.0, 45.0, 28.0, 22.0, 30.0, 23.0, 26.0, 21.0, 23.0, 13.0, 9.0, 10.0, 5.0, 7.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.0625, -8.7767333984375, -8.490966796875, -8.2052001953125, -7.91943359375, -7.6336669921875, -7.347900390625, -7.0621337890625, -6.7763671875, -6.4906005859375, -6.204833984375, -5.9190673828125, -5.63330078125, -5.3475341796875, -5.061767578125, -4.7760009765625, -4.490234375, -4.2044677734375, -3.918701171875, -3.6329345703125, -3.34716796875, -3.0614013671875, -2.775634765625, -2.4898681640625, -2.2041015625, -1.9183349609375, -1.632568359375, -1.3468017578125, -1.06103515625, -0.7752685546875, -0.489501953125, -0.2037353515625, 0.08203125, 0.3677978515625, 0.653564453125, 0.9393310546875, 1.22509765625, 1.5108642578125, 1.796630859375, 2.0823974609375, 2.3681640625, 2.6539306640625, 2.939697265625, 3.2254638671875, 3.51123046875, 3.7969970703125, 4.082763671875, 4.3685302734375, 4.654296875, 4.9400634765625, 5.225830078125, 5.5115966796875, 5.79736328125, 6.0831298828125, 6.368896484375, 6.6546630859375, 6.9404296875, 7.2261962890625, 7.511962890625, 7.7977294921875, 8.08349609375, 8.3692626953125, 8.655029296875, 8.9407958984375, 9.2265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 12.0, 9.0, 12.0, 27.0, 28.0, 32.0, 66.0, 95.0, 135.0, 222.0, 339.0, 564.0, 1099.0, 2089.0, 5043.0, 14248.0, 47114.0, 162654.0, 393373.0, 285834.0, 93260.0, 26809.0, 8639.0, 3341.0, 1495.0, 765.0, 419.0, 270.0, 170.0, 102.0, 78.0, 48.0, 53.0, 31.0, 26.0, 11.0, 11.0, 9.0, 4.0, 6.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0], "bins": [-0.418212890625, -0.4061851501464844, -0.39415740966796875, -0.3821296691894531, -0.3701019287109375, -0.3580741882324219, -0.34604644775390625, -0.3340187072753906, -0.321990966796875, -0.3099632263183594, -0.29793548583984375, -0.2859077453613281, -0.2738800048828125, -0.2618522644042969, -0.24982452392578125, -0.23779678344726562, -0.22576904296875, -0.21374130249023438, -0.20171356201171875, -0.18968582153320312, -0.1776580810546875, -0.16563034057617188, -0.15360260009765625, -0.14157485961914062, -0.129547119140625, -0.11751937866210938, -0.10549163818359375, -0.09346389770507812, -0.0814361572265625, -0.06940841674804688, -0.05738067626953125, -0.045352935791015625, -0.0333251953125, -0.021297454833984375, -0.00926971435546875, 0.002758026123046875, 0.0147857666015625, 0.026813507080078125, 0.03884124755859375, 0.050868988037109375, 0.062896728515625, 0.07492446899414062, 0.08695220947265625, 0.09897994995117188, 0.1110076904296875, 0.12303543090820312, 0.13506317138671875, 0.14709091186523438, 0.15911865234375, 0.17114639282226562, 0.18317413330078125, 0.19520187377929688, 0.2072296142578125, 0.21925735473632812, 0.23128509521484375, 0.24331283569335938, 0.255340576171875, 0.2673683166503906, 0.27939605712890625, 0.2914237976074219, 0.3034515380859375, 0.3154792785644531, 0.32750701904296875, 0.3395347595214844, 0.3515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 8.0, 6.0, 7.0, 11.0, 15.0, 24.0, 20.0, 30.0, 48.0, 63.0, 74.0, 91.0, 98.0, 92.0, 81.0, 63.0, 67.0, 43.0, 49.0, 30.0, 17.0, 15.0, 15.0, 6.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021239742636680603, -0.00020544975996017456, -0.0001985020935535431, -0.00019155442714691162, -0.00018460676074028015, -0.00017765909433364868, -0.0001707114279270172, -0.00016376376152038574, -0.00015681609511375427, -0.0001498684287071228, -0.00014292076230049133, -0.00013597309589385986, -0.0001290254294872284, -0.00012207776308059692, -0.00011513009667396545, -0.00010818243026733398, -0.00010123476386070251, -9.428709745407104e-05, -8.733943104743958e-05, -8.03917646408081e-05, -7.344409823417664e-05, -6.649643182754517e-05, -5.9548765420913696e-05, -5.2601099014282227e-05, -4.565343260765076e-05, -3.870576620101929e-05, -3.175809979438782e-05, -2.4810433387756348e-05, -1.7862766981124878e-05, -1.0915100574493408e-05, -3.9674341678619385e-06, 2.9802322387695312e-06, 9.927898645401001e-06, 1.687556505203247e-05, 2.382323145866394e-05, 3.077089786529541e-05, 3.771856427192688e-05, 4.466623067855835e-05, 5.161389708518982e-05, 5.856156349182129e-05, 6.550922989845276e-05, 7.245689630508423e-05, 7.94045627117157e-05, 8.635222911834717e-05, 9.329989552497864e-05, 0.00010024756193161011, 0.00010719522833824158, 0.00011414289474487305, 0.00012109056115150452, 0.00012803822755813599, 0.00013498589396476746, 0.00014193356037139893, 0.0001488812267780304, 0.00015582889318466187, 0.00016277655959129333, 0.0001697242259979248, 0.00017667189240455627, 0.00018361955881118774, 0.00019056722521781921, 0.00019751489162445068, 0.00020446255803108215, 0.00021141022443771362, 0.0002183578908443451, 0.00022530555725097656]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 4.0, 12.0, 21.0, 10.0, 27.0, 30.0, 43.0, 54.0, 72.0, 110.0, 166.0, 296.0, 507.0, 1104.0, 2590.0, 6688.0, 18452.0, 50655.0, 136715.0, 296146.0, 305020.0, 144121.0, 54133.0, 19396.0, 6986.0, 2667.0, 1175.0, 541.0, 311.0, 154.0, 97.0, 56.0, 31.0, 28.0, 32.0, 17.0, 20.0, 10.0, 3.0, 9.0, 3.0, 1.0, 7.0, 3.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.380859375, -0.36966705322265625, -0.3584747314453125, -0.34728240966796875, -0.336090087890625, -0.32489776611328125, -0.3137054443359375, -0.30251312255859375, -0.29132080078125, -0.28012847900390625, -0.2689361572265625, -0.25774383544921875, -0.246551513671875, -0.23535919189453125, -0.2241668701171875, -0.21297454833984375, -0.2017822265625, -0.19058990478515625, -0.1793975830078125, -0.16820526123046875, -0.157012939453125, -0.14582061767578125, -0.1346282958984375, -0.12343597412109375, -0.11224365234375, -0.10105133056640625, -0.0898590087890625, -0.07866668701171875, -0.067474365234375, -0.05628204345703125, -0.0450897216796875, -0.03389739990234375, -0.022705078125, -0.01151275634765625, -0.0003204345703125, 0.01087188720703125, 0.022064208984375, 0.03325653076171875, 0.0444488525390625, 0.05564117431640625, 0.06683349609375, 0.07802581787109375, 0.0892181396484375, 0.10041046142578125, 0.111602783203125, 0.12279510498046875, 0.1339874267578125, 0.14517974853515625, 0.1563720703125, 0.16756439208984375, 0.1787567138671875, 0.18994903564453125, 0.201141357421875, 0.21233367919921875, 0.2235260009765625, 0.23471832275390625, 0.24591064453125, 0.25710296630859375, 0.2682952880859375, 0.27948760986328125, 0.290679931640625, 0.30187225341796875, 0.3130645751953125, 0.32425689697265625, 0.33544921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 13.0, 8.0, 11.0, 15.0, 22.0, 24.0, 25.0, 22.0, 27.0, 39.0, 39.0, 47.0, 52.0, 64.0, 50.0, 58.0, 62.0, 47.0, 50.0, 45.0, 29.0, 28.0, 26.0, 23.0, 20.0, 22.0, 24.0, 14.0, 10.0, 19.0, 7.0, 7.0, 9.0, 4.0, 8.0, 1.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08428955078125, -0.08140945434570312, -0.07852935791015625, -0.07564926147460938, -0.0727691650390625, -0.06988906860351562, -0.06700897216796875, -0.06412887573242188, -0.061248779296875, -0.058368682861328125, -0.05548858642578125, -0.052608489990234375, -0.0497283935546875, -0.046848297119140625, -0.04396820068359375, -0.041088104248046875, -0.0382080078125, -0.035327911376953125, -0.03244781494140625, -0.029567718505859375, -0.0266876220703125, -0.023807525634765625, -0.02092742919921875, -0.018047332763671875, -0.015167236328125, -0.012287139892578125, -0.00940704345703125, -0.006526947021484375, -0.0036468505859375, -0.000766754150390625, 0.00211334228515625, 0.004993438720703125, 0.00787353515625, 0.010753631591796875, 0.01363372802734375, 0.016513824462890625, 0.0193939208984375, 0.022274017333984375, 0.02515411376953125, 0.028034210205078125, 0.030914306640625, 0.033794403076171875, 0.03667449951171875, 0.039554595947265625, 0.0424346923828125, 0.045314788818359375, 0.04819488525390625, 0.051074981689453125, 0.053955078125, 0.056835174560546875, 0.05971527099609375, 0.06259536743164062, 0.0654754638671875, 0.06835556030273438, 0.07123565673828125, 0.07411575317382812, 0.076995849609375, 0.07987594604492188, 0.08275604248046875, 0.08563613891601562, 0.0885162353515625, 0.09139633178710938, 0.09427642822265625, 0.09715652465820312, 0.10003662109375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 9.0, 10.0, 16.0, 25.0, 27.0, 65.0, 79.0, 60.0, 80.0, 100.0, 91.0, 82.0, 85.0, 72.0, 46.0, 53.0, 36.0, 27.0, 19.0, 10.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78955364227295, -8.540498733520508, -8.291443824768066, -8.042389869689941, -7.7933349609375, -7.544280052185059, -7.295225143432617, -7.046170711517334, -6.797116279602051, -6.548061370849609, -6.299006938934326, -6.049952030181885, -5.800897598266602, -5.55184268951416, -5.302787780761719, -5.0537333488464355, -4.804678440093994, -4.555623531341553, -4.3065690994262695, -4.057514190673828, -3.808459758758545, -3.5594048500061035, -3.310350179672241, -3.061295509338379, -2.8122408390045166, -2.5631861686706543, -2.314131498336792, -2.0650768280029297, -1.8160220384597778, -1.5669673681259155, -1.3179125785827637, -1.0688579082489014, -0.8198027610778809, -0.5707480907440186, -0.3216933608055115, -0.0726386308670044, 0.1764160394668579, 0.4254707098007202, 0.6745254993438721, 0.9235801696777344, 1.1726348400115967, 1.421689510345459, 1.6707441806793213, 1.9197989702224731, 2.168853759765625, 2.417908191680908, 2.6669631004333496, 2.916017770767212, 3.165072441101074, 3.4141271114349365, 3.663181781768799, 3.9122366905212402, 4.161291122436523, 4.410346031188965, 4.659400939941406, 4.9084553718566895, 5.157509803771973, 5.406564712524414, 5.655619144439697, 5.904674053192139, 6.153728485107422, 6.402783393859863, 6.651838302612305, 6.900892734527588, 7.149947643280029]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 7.0, 8.0, 13.0, 13.0, 15.0, 16.0, 15.0, 16.0, 32.0, 30.0, 32.0, 39.0, 45.0, 41.0, 51.0, 53.0, 57.0, 45.0, 45.0, 38.0, 50.0, 42.0, 37.0, 33.0, 40.0, 22.0, 27.0, 20.0, 22.0, 16.0, 15.0, 11.0, 11.0, 7.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.284720420837402, -5.133851051330566, -4.9829816818237305, -4.832111835479736, -4.6812424659729, -4.5303730964660645, -4.37950325012207, -4.228633880615234, -4.077764511108398, -3.9268951416015625, -3.7760255336761475, -3.6251559257507324, -3.4742865562438965, -3.3234171867370605, -3.1725475788116455, -3.0216779708862305, -2.8708086013793945, -2.7199392318725586, -2.5690696239471436, -2.4182000160217285, -2.2673306465148926, -2.1164612770080566, -1.9655916690826416, -1.8147221803665161, -1.6638526916503906, -1.5129832029342651, -1.3621137142181396, -1.2112442255020142, -1.0603747367858887, -0.9095052480697632, -0.7586357593536377, -0.6077662706375122, -0.4568963050842285, -0.306026816368103, -0.15515732765197754, -0.004287838935852051, 0.14658164978027344, 0.2974511384963989, 0.4483206272125244, 0.5991901159286499, 0.7500596046447754, 0.9009290933609009, 1.0517985820770264, 1.2026680707931519, 1.3535375595092773, 1.5044070482254028, 1.6552765369415283, 1.8061460256576538, 1.9570155143737793, 2.1078848838806152, 2.2587544918060303, 2.4096240997314453, 2.5604934692382812, 2.711362838745117, 2.8622324466705322, 3.0131020545959473, 3.163971424102783, 3.314840793609619, 3.465710401535034, 3.616580009460449, 3.767449378967285, 3.918318748474121, 4.069188117980957, 4.220057964324951, 4.370927333831787]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 6.0, 8.0, 15.0, 34.0, 46.0, 66.0, 102.0, 208.0, 351.0, 723.0, 1457.0, 2992.0, 7000.0, 16453.0, 42377.0, 118589.0, 320943.0, 336486.0, 124812.0, 44875.0, 17607.0, 7256.0, 3182.0, 1456.0, 681.0, 371.0, 165.0, 103.0, 84.0, 49.0, 16.0, 21.0, 11.0, 5.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3203125, -7.11712646484375, -6.9139404296875, -6.71075439453125, -6.507568359375, -6.30438232421875, -6.1011962890625, -5.89801025390625, -5.69482421875, -5.49163818359375, -5.2884521484375, -5.08526611328125, -4.882080078125, -4.67889404296875, -4.4757080078125, -4.27252197265625, -4.0693359375, -3.86614990234375, -3.6629638671875, -3.45977783203125, -3.256591796875, -3.05340576171875, -2.8502197265625, -2.64703369140625, -2.44384765625, -2.24066162109375, -2.0374755859375, -1.83428955078125, -1.631103515625, -1.42791748046875, -1.2247314453125, -1.02154541015625, -0.818359375, -0.61517333984375, -0.4119873046875, -0.20880126953125, -0.005615234375, 0.19757080078125, 0.4007568359375, 0.60394287109375, 0.80712890625, 1.01031494140625, 1.2135009765625, 1.41668701171875, 1.619873046875, 1.82305908203125, 2.0262451171875, 2.22943115234375, 2.4326171875, 2.63580322265625, 2.8389892578125, 3.04217529296875, 3.245361328125, 3.44854736328125, 3.6517333984375, 3.85491943359375, 4.05810546875, 4.26129150390625, 4.4644775390625, 4.66766357421875, 4.870849609375, 5.07403564453125, 5.2772216796875, 5.48040771484375, 5.68359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 2.0, 8.0, 6.0, 5.0, 6.0, 10.0, 19.0, 17.0, 7.0, 20.0, 22.0, 34.0, 29.0, 38.0, 49.0, 51.0, 51.0, 32.0, 54.0, 41.0, 59.0, 45.0, 41.0, 48.0, 30.0, 45.0, 32.0, 31.0, 28.0, 26.0, 25.0, 16.0, 19.0, 13.0, 7.0, 4.0, 5.0, 5.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.4921875, -10.188720703125, -9.88525390625, -9.581787109375, -9.2783203125, -8.974853515625, -8.67138671875, -8.367919921875, -8.064453125, -7.760986328125, -7.45751953125, -7.154052734375, -6.8505859375, -6.547119140625, -6.24365234375, -5.940185546875, -5.63671875, -5.333251953125, -5.02978515625, -4.726318359375, -4.4228515625, -4.119384765625, -3.81591796875, -3.512451171875, -3.208984375, -2.905517578125, -2.60205078125, -2.298583984375, -1.9951171875, -1.691650390625, -1.38818359375, -1.084716796875, -0.78125, -0.477783203125, -0.17431640625, 0.129150390625, 0.4326171875, 0.736083984375, 1.03955078125, 1.343017578125, 1.646484375, 1.949951171875, 2.25341796875, 2.556884765625, 2.8603515625, 3.163818359375, 3.46728515625, 3.770751953125, 4.07421875, 4.377685546875, 4.68115234375, 4.984619140625, 5.2880859375, 5.591552734375, 5.89501953125, 6.198486328125, 6.501953125, 6.805419921875, 7.10888671875, 7.412353515625, 7.7158203125, 8.019287109375, 8.32275390625, 8.626220703125, 8.9296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 13.0, 14.0, 18.0, 29.0, 25.0, 50.0, 65.0, 132.0, 233.0, 415.0, 1073.0, 4840.0, 37563.0, 422039.0, 525648.0, 48093.0, 5994.0, 1255.0, 435.0, 231.0, 131.0, 69.0, 61.0, 32.0, 16.0, 19.0, 15.0, 7.0, 14.0, 8.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.171875, -15.6826171875, -15.193359375, -14.7041015625, -14.21484375, -13.7255859375, -13.236328125, -12.7470703125, -12.2578125, -11.7685546875, -11.279296875, -10.7900390625, -10.30078125, -9.8115234375, -9.322265625, -8.8330078125, -8.34375, -7.8544921875, -7.365234375, -6.8759765625, -6.38671875, -5.8974609375, -5.408203125, -4.9189453125, -4.4296875, -3.9404296875, -3.451171875, -2.9619140625, -2.47265625, -1.9833984375, -1.494140625, -1.0048828125, -0.515625, -0.0263671875, 0.462890625, 0.9521484375, 1.44140625, 1.9306640625, 2.419921875, 2.9091796875, 3.3984375, 3.8876953125, 4.376953125, 4.8662109375, 5.35546875, 5.8447265625, 6.333984375, 6.8232421875, 7.3125, 7.8017578125, 8.291015625, 8.7802734375, 9.26953125, 9.7587890625, 10.248046875, 10.7373046875, 11.2265625, 11.7158203125, 12.205078125, 12.6943359375, 13.18359375, 13.6728515625, 14.162109375, 14.6513671875, 15.140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 10.0, 8.0, 14.0, 12.0, 20.0, 20.0, 28.0, 30.0, 28.0, 58.0, 50.0, 46.0, 60.0, 58.0, 54.0, 48.0, 69.0, 46.0, 42.0, 36.0, 39.0, 30.0, 33.0, 28.0, 31.0, 21.0, 14.0, 13.0, 11.0, 8.0, 5.0, 5.0, 4.0, 1.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.03125, -13.5941162109375, -13.156982421875, -12.7198486328125, -12.28271484375, -11.8455810546875, -11.408447265625, -10.9713134765625, -10.5341796875, -10.0970458984375, -9.659912109375, -9.2227783203125, -8.78564453125, -8.3485107421875, -7.911376953125, -7.4742431640625, -7.037109375, -6.5999755859375, -6.162841796875, -5.7257080078125, -5.28857421875, -4.8514404296875, -4.414306640625, -3.9771728515625, -3.5400390625, -3.1029052734375, -2.665771484375, -2.2286376953125, -1.79150390625, -1.3543701171875, -0.917236328125, -0.4801025390625, -0.04296875, 0.3941650390625, 0.831298828125, 1.2684326171875, 1.70556640625, 2.1427001953125, 2.579833984375, 3.0169677734375, 3.4541015625, 3.8912353515625, 4.328369140625, 4.7655029296875, 5.20263671875, 5.6397705078125, 6.076904296875, 6.5140380859375, 6.951171875, 7.3883056640625, 7.825439453125, 8.2625732421875, 8.69970703125, 9.1368408203125, 9.573974609375, 10.0111083984375, 10.4482421875, 10.8853759765625, 11.322509765625, 11.7596435546875, 12.19677734375, 12.6339111328125, 13.071044921875, 13.5081787109375, 13.9453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 11.0, 11.0, 25.0, 28.0, 59.0, 105.0, 286.0, 1042.0, 5934.0, 146504.0, 846847.0, 43453.0, 3101.0, 715.0, 221.0, 95.0, 37.0, 26.0, 15.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.09375, -5.89288330078125, -5.6920166015625, -5.49114990234375, -5.290283203125, -5.08941650390625, -4.8885498046875, -4.68768310546875, -4.48681640625, -4.28594970703125, -4.0850830078125, -3.88421630859375, -3.683349609375, -3.48248291015625, -3.2816162109375, -3.08074951171875, -2.8798828125, -2.67901611328125, -2.4781494140625, -2.27728271484375, -2.076416015625, -1.87554931640625, -1.6746826171875, -1.47381591796875, -1.27294921875, -1.07208251953125, -0.8712158203125, -0.67034912109375, -0.469482421875, -0.26861572265625, -0.0677490234375, 0.13311767578125, 0.333984375, 0.53485107421875, 0.7357177734375, 0.93658447265625, 1.137451171875, 1.33831787109375, 1.5391845703125, 1.74005126953125, 1.94091796875, 2.14178466796875, 2.3426513671875, 2.54351806640625, 2.744384765625, 2.94525146484375, 3.1461181640625, 3.34698486328125, 3.5478515625, 3.74871826171875, 3.9495849609375, 4.15045166015625, 4.351318359375, 4.55218505859375, 4.7530517578125, 4.95391845703125, 5.15478515625, 5.35565185546875, 5.5565185546875, 5.75738525390625, 5.958251953125, 6.15911865234375, 6.3599853515625, 6.56085205078125, 6.76171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 8.0, 10.0, 20.0, 18.0, 33.0, 46.0, 60.0, 66.0, 103.0, 101.0, 116.0, 106.0, 79.0, 45.0, 43.0, 37.0, 27.0, 18.0, 17.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005817413330078125, -0.0005652531981468201, -0.0005487650632858276, -0.0005322769284248352, -0.0005157887935638428, -0.0004993006587028503, -0.0004828125238418579, -0.0004663243889808655, -0.00044983625411987305, -0.0004333481192588806, -0.0004168599843978882, -0.00040037184953689575, -0.0003838837146759033, -0.0003673955798149109, -0.00035090744495391846, -0.000334419310092926, -0.0003179311752319336, -0.00030144304037094116, -0.00028495490550994873, -0.0002684667706489563, -0.00025197863578796387, -0.00023549050092697144, -0.000219002366065979, -0.00020251423120498657, -0.00018602609634399414, -0.0001695379614830017, -0.00015304982662200928, -0.00013656169176101685, -0.00012007355690002441, -0.00010358542203903198, -8.709728717803955e-05, -7.060915231704712e-05, -5.412101745605469e-05, -3.7632882595062256e-05, -2.1144747734069824e-05, -4.656612873077393e-06, 1.1831521987915039e-05, 2.831965684890747e-05, 4.48077917098999e-05, 6.129592657089233e-05, 7.778406143188477e-05, 9.42721962928772e-05, 0.00011076033115386963, 0.00012724846601486206, 0.0001437366008758545, 0.00016022473573684692, 0.00017671287059783936, 0.0001932010054588318, 0.00020968914031982422, 0.00022617727518081665, 0.00024266541004180908, 0.0002591535449028015, 0.00027564167976379395, 0.0002921298146247864, 0.0003086179494857788, 0.00032510608434677124, 0.00034159421920776367, 0.0003580823540687561, 0.00037457048892974854, 0.00039105862379074097, 0.0004075467586517334, 0.00042403489351272583, 0.00044052302837371826, 0.0004570111632347107, 0.0004734992980957031]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 2.0, 8.0, 19.0, 35.0, 85.0, 186.0, 527.0, 1534.0, 6410.0, 140489.0, 843718.0, 49888.0, 3895.0, 1135.0, 330.0, 142.0, 62.0, 22.0, 20.0, 7.0, 11.0, 3.0, 10.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.015625, -6.79193115234375, -6.5682373046875, -6.34454345703125, -6.120849609375, -5.89715576171875, -5.6734619140625, -5.44976806640625, -5.22607421875, -5.00238037109375, -4.7786865234375, -4.55499267578125, -4.331298828125, -4.10760498046875, -3.8839111328125, -3.66021728515625, -3.4365234375, -3.21282958984375, -2.9891357421875, -2.76544189453125, -2.541748046875, -2.31805419921875, -2.0943603515625, -1.87066650390625, -1.64697265625, -1.42327880859375, -1.1995849609375, -0.97589111328125, -0.752197265625, -0.52850341796875, -0.3048095703125, -0.08111572265625, 0.142578125, 0.36627197265625, 0.5899658203125, 0.81365966796875, 1.037353515625, 1.26104736328125, 1.4847412109375, 1.70843505859375, 1.93212890625, 2.15582275390625, 2.3795166015625, 2.60321044921875, 2.826904296875, 3.05059814453125, 3.2742919921875, 3.49798583984375, 3.7216796875, 3.94537353515625, 4.1690673828125, 4.39276123046875, 4.616455078125, 4.84014892578125, 5.0638427734375, 5.28753662109375, 5.51123046875, 5.73492431640625, 5.9586181640625, 6.18231201171875, 6.406005859375, 6.62969970703125, 6.8533935546875, 7.07708740234375, 7.30078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 13.0, 16.0, 23.0, 42.0, 78.0, 112.0, 169.0, 158.0, 118.0, 92.0, 60.0, 42.0, 20.0, 21.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.681640625, -2.602691650390625, -2.52374267578125, -2.444793701171875, -2.3658447265625, -2.286895751953125, -2.20794677734375, -2.128997802734375, -2.050048828125, -1.971099853515625, -1.89215087890625, -1.813201904296875, -1.7342529296875, -1.655303955078125, -1.57635498046875, -1.497406005859375, -1.41845703125, -1.339508056640625, -1.26055908203125, -1.181610107421875, -1.1026611328125, -1.023712158203125, -0.94476318359375, -0.865814208984375, -0.786865234375, -0.707916259765625, -0.62896728515625, -0.550018310546875, -0.4710693359375, -0.392120361328125, -0.31317138671875, -0.234222412109375, -0.1552734375, -0.076324462890625, 0.00262451171875, 0.081573486328125, 0.1605224609375, 0.239471435546875, 0.31842041015625, 0.397369384765625, 0.476318359375, 0.555267333984375, 0.63421630859375, 0.713165283203125, 0.7921142578125, 0.871063232421875, 0.95001220703125, 1.028961181640625, 1.10791015625, 1.186859130859375, 1.26580810546875, 1.344757080078125, 1.4237060546875, 1.502655029296875, 1.58160400390625, 1.660552978515625, 1.739501953125, 1.818450927734375, 1.89739990234375, 1.976348876953125, 2.0552978515625, 2.134246826171875, 2.21319580078125, 2.292144775390625, 2.37109375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 33.0, 451.0, 476.0, 51.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.840049743652344, -11.911993026733398, -7.983936309814453, -4.055879592895508, -0.1278228759765625, 3.800233840942383, 7.728290557861328, 11.656347274780273, 15.584403991699219, 19.512460708618164, 23.44051742553711, 27.368574142456055, 31.296630859375, 35.22468566894531, 39.15274429321289, 43.08080291748047, 47.00885772705078, 50.936912536621094, 54.86497116088867, 58.79302978515625, 62.72108459472656, 66.64913940429688, 70.57719421386719, 74.50525665283203, 78.43331146240234, 82.36136627197266, 86.2894287109375, 90.21748352050781, 94.14553833007812, 98.07359313964844, 102.00164794921875, 105.9297103881836, 109.85777282714844, 113.78582763671875, 117.71388244628906, 121.6419448852539, 125.56999969482422, 129.49806213378906, 133.42611694335938, 137.3541717529297, 141.2822265625, 145.2102813720703, 149.13833618164062, 153.06639099121094, 156.99444580078125, 160.92251586914062, 164.85057067871094, 168.77862548828125, 172.70668029785156, 176.63473510742188, 180.5627899169922, 184.4908447265625, 188.41891479492188, 192.3469696044922, 196.2750244140625, 200.2030792236328, 204.13113403320312, 208.05918884277344, 211.98724365234375, 215.91529846191406, 219.84335327148438, 223.77142333984375, 227.69947814941406, 231.62753295898438, 235.5555877685547]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 10.0, 9.0, 13.0, 20.0, 23.0, 28.0, 29.0, 33.0, 27.0, 34.0, 45.0, 52.0, 55.0, 52.0, 59.0, 49.0, 48.0, 50.0, 54.0, 38.0, 42.0, 31.0, 22.0, 31.0, 27.0, 18.0, 22.0, 16.0, 16.0, 8.0, 7.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.034082412719727, -22.359458923339844, -21.68483543395996, -21.010211944580078, -20.335586547851562, -19.66096305847168, -18.986339569091797, -18.311716079711914, -17.63709259033203, -16.96246910095215, -16.287845611572266, -15.613221168518066, -14.938596725463867, -14.263973236083984, -13.589349746704102, -12.914726257324219, -12.240100860595703, -11.56547737121582, -10.890852928161621, -10.216229438781738, -9.541604995727539, -8.866981506347656, -8.192358016967773, -7.517734050750732, -6.843110084533691, -6.16848611831665, -5.493862152099609, -4.819238662719727, -4.1446146965026855, -3.4699907302856445, -2.7953672409057617, -2.1207432746887207, -1.4461193084716797, -0.7714954614639282, -0.09687161445617676, 0.5777521133422852, 1.2523760795593262, 1.9270000457763672, 2.60162353515625, 3.276247501373291, 3.950871467590332, 4.625495433807373, 5.300119400024414, 5.974742889404297, 6.649366855621338, 7.323990821838379, 7.998614311218262, 8.673238754272461, 9.347862243652344, 10.022485733032227, 10.697110176086426, 11.371733665466309, 12.046358108520508, 12.72098159790039, 13.395605087280273, 14.070228576660156, 14.744853019714355, 15.419476509094238, 16.094100952148438, 16.76872444152832, 17.443347930908203, 18.11797332763672, 18.79259490966797, 19.467220306396484, 20.141843795776367]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 17.0, 25.0, 28.0, 50.0, 90.0, 185.0, 332.0, 933.0, 4172.0, 38824.0, 1634016.0, 2441749.0, 66036.0, 5702.0, 1229.0, 456.0, 173.0, 74.0, 56.0, 30.0, 29.0, 24.0, 11.0, 10.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3046875, -12.7020263671875, -12.099365234375, -11.4967041015625, -10.89404296875, -10.2913818359375, -9.688720703125, -9.0860595703125, -8.4833984375, -7.8807373046875, -7.278076171875, -6.6754150390625, -6.07275390625, -5.4700927734375, -4.867431640625, -4.2647705078125, -3.662109375, -3.0594482421875, -2.456787109375, -1.8541259765625, -1.25146484375, -0.6488037109375, -0.046142578125, 0.5565185546875, 1.1591796875, 1.7618408203125, 2.364501953125, 2.9671630859375, 3.56982421875, 4.1724853515625, 4.775146484375, 5.3778076171875, 5.98046875, 6.5831298828125, 7.185791015625, 7.7884521484375, 8.39111328125, 8.9937744140625, 9.596435546875, 10.1990966796875, 10.8017578125, 11.4044189453125, 12.007080078125, 12.6097412109375, 13.21240234375, 13.8150634765625, 14.417724609375, 15.0203857421875, 15.623046875, 16.2257080078125, 16.828369140625, 17.4310302734375, 18.03369140625, 18.6363525390625, 19.239013671875, 19.8416748046875, 20.4443359375, 21.0469970703125, 21.649658203125, 22.2523193359375, 22.85498046875, 23.4576416015625, 24.060302734375, 24.6629638671875, 25.265625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 7.0, 16.0, 11.0, 11.0, 19.0, 19.0, 30.0, 36.0, 35.0, 28.0, 34.0, 49.0, 37.0, 50.0, 47.0, 55.0, 49.0, 45.0, 46.0, 46.0, 40.0, 24.0, 29.0, 30.0, 29.0, 18.0, 27.0, 24.0, 14.0, 13.0, 12.0, 8.0, 6.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6297607421875, -5.447021484375, -5.2642822265625, -5.08154296875, -4.8988037109375, -4.716064453125, -4.5333251953125, -4.3505859375, -4.1678466796875, -3.985107421875, -3.8023681640625, -3.61962890625, -3.4368896484375, -3.254150390625, -3.0714111328125, -2.888671875, -2.7059326171875, -2.523193359375, -2.3404541015625, -2.15771484375, -1.9749755859375, -1.792236328125, -1.6094970703125, -1.4267578125, -1.2440185546875, -1.061279296875, -0.8785400390625, -0.69580078125, -0.5130615234375, -0.330322265625, -0.1475830078125, 0.03515625, 0.2178955078125, 0.400634765625, 0.5833740234375, 0.76611328125, 0.9488525390625, 1.131591796875, 1.3143310546875, 1.4970703125, 1.6798095703125, 1.862548828125, 2.0452880859375, 2.22802734375, 2.4107666015625, 2.593505859375, 2.7762451171875, 2.958984375, 3.1417236328125, 3.324462890625, 3.5072021484375, 3.68994140625, 3.8726806640625, 4.055419921875, 4.2381591796875, 4.4208984375, 4.6036376953125, 4.786376953125, 4.9691162109375, 5.15185546875, 5.3345947265625, 5.517333984375, 5.7000732421875, 5.8828125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 12.0, 22.0, 39.0, 54.0, 133.0, 441.0, 1592.0, 14050.0, 3498369.0, 671653.0, 6350.0, 1042.0, 298.0, 111.0, 44.0, 25.0, 18.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.4375, -35.361328125, -34.28515625, -33.208984375, -32.1328125, -31.056640625, -29.98046875, -28.904296875, -27.828125, -26.751953125, -25.67578125, -24.599609375, -23.5234375, -22.447265625, -21.37109375, -20.294921875, -19.21875, -18.142578125, -17.06640625, -15.990234375, -14.9140625, -13.837890625, -12.76171875, -11.685546875, -10.609375, -9.533203125, -8.45703125, -7.380859375, -6.3046875, -5.228515625, -4.15234375, -3.076171875, -2.0, -0.923828125, 0.15234375, 1.228515625, 2.3046875, 3.380859375, 4.45703125, 5.533203125, 6.609375, 7.685546875, 8.76171875, 9.837890625, 10.9140625, 11.990234375, 13.06640625, 14.142578125, 15.21875, 16.294921875, 17.37109375, 18.447265625, 19.5234375, 20.599609375, 21.67578125, 22.751953125, 23.828125, 24.904296875, 25.98046875, 27.056640625, 28.1328125, 29.208984375, 30.28515625, 31.361328125, 32.4375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 15.0, 21.0, 33.0, 65.0, 124.0, 257.0, 411.0, 681.0, 852.0, 677.0, 413.0, 217.0, 126.0, 62.0, 39.0, 18.0, 15.0, 14.0, 8.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.46484375, -6.28277587890625, -6.1007080078125, -5.91864013671875, -5.736572265625, -5.55450439453125, -5.3724365234375, -5.19036865234375, -5.00830078125, -4.82623291015625, -4.6441650390625, -4.46209716796875, -4.280029296875, -4.09796142578125, -3.9158935546875, -3.73382568359375, -3.5517578125, -3.36968994140625, -3.1876220703125, -3.00555419921875, -2.823486328125, -2.64141845703125, -2.4593505859375, -2.27728271484375, -2.09521484375, -1.91314697265625, -1.7310791015625, -1.54901123046875, -1.366943359375, -1.18487548828125, -1.0028076171875, -0.82073974609375, -0.638671875, -0.45660400390625, -0.2745361328125, -0.09246826171875, 0.089599609375, 0.27166748046875, 0.4537353515625, 0.63580322265625, 0.81787109375, 0.99993896484375, 1.1820068359375, 1.36407470703125, 1.546142578125, 1.72821044921875, 1.9102783203125, 2.09234619140625, 2.2744140625, 2.45648193359375, 2.6385498046875, 2.82061767578125, 3.002685546875, 3.18475341796875, 3.3668212890625, 3.54888916015625, 3.73095703125, 3.91302490234375, 4.0950927734375, 4.27716064453125, 4.459228515625, 4.64129638671875, 4.8233642578125, 5.00543212890625, 5.1875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 3.0, 3.0, 9.0, 6.0, 13.0, 11.0, 23.0, 30.0, 24.0, 26.0, 33.0, 41.0, 43.0, 50.0, 48.0, 52.0, 55.0, 53.0, 48.0, 44.0, 61.0, 46.0, 42.0, 37.0, 40.0, 30.0, 26.0, 22.0, 22.0, 14.0, 8.0, 9.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.916438102722168, -7.67176628112793, -7.427093982696533, -7.182422161102295, -6.937749862670898, -6.69307804107666, -6.448406219482422, -6.203734397888184, -5.959062099456787, -5.714390277862549, -5.469717979431152, -5.225046157836914, -4.980374336242676, -4.735702037811279, -4.491030216217041, -4.2463579177856445, -4.001686096191406, -3.757014036178589, -3.5123419761657715, -3.267670154571533, -3.022998094558716, -2.7783260345458984, -2.53365421295166, -2.2889821529388428, -2.0443100929260254, -1.799638032913208, -1.5549660921096802, -1.3102941513061523, -1.065622091293335, -0.8209500312805176, -0.5762780904769897, -0.3316061496734619, -0.08693408966064453, 0.15773791074752808, 0.4024099111557007, 0.6470819115638733, 0.8917539119720459, 1.1364259719848633, 1.3810979127883911, 1.625769853591919, 1.8704419136047363, 2.1151139736175537, 2.359786033630371, 2.6044578552246094, 2.8491299152374268, 3.093801975250244, 3.3384737968444824, 3.5831458568573, 3.827817916870117, 4.0724897384643555, 4.317162036895752, 4.56183385848999, 4.806506156921387, 5.051177978515625, 5.295849800109863, 5.540521621704102, 5.785193920135498, 6.029865741729736, 6.274538040161133, 6.519209861755371, 6.763881683349609, 7.008553981781006, 7.253225803375244, 7.497898101806641, 7.742569923400879]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 12.0, 8.0, 10.0, 10.0, 19.0, 23.0, 19.0, 20.0, 24.0, 27.0, 35.0, 54.0, 43.0, 50.0, 50.0, 42.0, 43.0, 40.0, 44.0, 43.0, 42.0, 41.0, 43.0, 24.0, 41.0, 22.0, 23.0, 24.0, 16.0, 18.0, 11.0, 11.0, 10.0, 12.0, 11.0, 5.0, 11.0, 3.0, 8.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.820923805236816, -9.570987701416016, -9.321051597595215, -9.071115493774414, -8.821179389953613, -8.571243286132812, -8.321308135986328, -8.071372032165527, -7.821435928344727, -7.571499824523926, -7.321563720703125, -7.071627616882324, -6.821691989898682, -6.571755886077881, -6.32181978225708, -6.071883678436279, -5.8219475746154785, -5.572011470794678, -5.322075366973877, -5.072139739990234, -4.822203636169434, -4.572267532348633, -4.322331428527832, -4.072395324707031, -3.8224594593048096, -3.572523355484009, -3.322587490081787, -3.0726513862609863, -2.8227152824401855, -2.572779417037964, -2.322843313217163, -2.0729074478149414, -1.8229713439941406, -1.5730353593826294, -1.3230993747711182, -1.0731632709503174, -0.8232272863388062, -0.5732913017272949, -0.32335519790649414, -0.07341921329498291, 0.17651677131652832, 0.42645278573036194, 0.6763888001441956, 0.9263248443603516, 1.1762608289718628, 1.426196813583374, 1.6761329174041748, 1.926068902015686, 2.1760048866271973, 2.425940990447998, 2.6758768558502197, 2.9258129596710205, 3.175748825073242, 3.425684928894043, 3.6756210327148438, 3.9255571365356445, 4.175493240356445, 4.425429344177246, 4.675365447998047, 4.925301551818848, 5.17523717880249, 5.425173282623291, 5.675109386444092, 5.925045490264893, 6.174981117248535]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 11.0, 11.0, 18.0, 8.0, 25.0, 34.0, 41.0, 45.0, 72.0, 92.0, 141.0, 198.0, 292.0, 543.0, 1308.0, 4649.0, 24789.0, 159994.0, 552150.0, 253317.0, 40225.0, 7195.0, 1670.0, 663.0, 325.0, 213.0, 150.0, 96.0, 87.0, 42.0, 34.0, 33.0, 22.0, 13.0, 12.0, 9.0, 4.0, 10.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.57421875, -2.473785400390625, -2.37335205078125, -2.272918701171875, -2.1724853515625, -2.072052001953125, -1.97161865234375, -1.871185302734375, -1.770751953125, -1.670318603515625, -1.56988525390625, -1.469451904296875, -1.3690185546875, -1.268585205078125, -1.16815185546875, -1.067718505859375, -0.96728515625, -0.866851806640625, -0.76641845703125, -0.665985107421875, -0.5655517578125, -0.465118408203125, -0.36468505859375, -0.264251708984375, -0.163818359375, -0.063385009765625, 0.03704833984375, 0.137481689453125, 0.2379150390625, 0.338348388671875, 0.43878173828125, 0.539215087890625, 0.6396484375, 0.740081787109375, 0.84051513671875, 0.940948486328125, 1.0413818359375, 1.141815185546875, 1.24224853515625, 1.342681884765625, 1.443115234375, 1.543548583984375, 1.64398193359375, 1.744415283203125, 1.8448486328125, 1.945281982421875, 2.04571533203125, 2.146148681640625, 2.24658203125, 2.347015380859375, 2.44744873046875, 2.547882080078125, 2.6483154296875, 2.748748779296875, 2.84918212890625, 2.949615478515625, 3.050048828125, 3.150482177734375, 3.25091552734375, 3.351348876953125, 3.4517822265625, 3.552215576171875, 3.65264892578125, 3.753082275390625, 3.853515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 1.0, 8.0, 8.0, 12.0, 8.0, 17.0, 14.0, 22.0, 24.0, 24.0, 30.0, 42.0, 37.0, 42.0, 56.0, 59.0, 53.0, 48.0, 54.0, 41.0, 54.0, 49.0, 29.0, 32.0, 28.0, 33.0, 31.0, 21.0, 18.0, 11.0, 18.0, 19.0, 10.0, 10.0, 15.0, 7.0, 3.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0], "bins": [-6.54296875, -6.37481689453125, -6.2066650390625, -6.03851318359375, -5.870361328125, -5.70220947265625, -5.5340576171875, -5.36590576171875, -5.19775390625, -5.02960205078125, -4.8614501953125, -4.69329833984375, -4.525146484375, -4.35699462890625, -4.1888427734375, -4.02069091796875, -3.8525390625, -3.68438720703125, -3.5162353515625, -3.34808349609375, -3.179931640625, -3.01177978515625, -2.8436279296875, -2.67547607421875, -2.50732421875, -2.33917236328125, -2.1710205078125, -2.00286865234375, -1.834716796875, -1.66656494140625, -1.4984130859375, -1.33026123046875, -1.162109375, -0.99395751953125, -0.8258056640625, -0.65765380859375, -0.489501953125, -0.32135009765625, -0.1531982421875, 0.01495361328125, 0.18310546875, 0.35125732421875, 0.5194091796875, 0.68756103515625, 0.855712890625, 1.02386474609375, 1.1920166015625, 1.36016845703125, 1.5283203125, 1.69647216796875, 1.8646240234375, 2.03277587890625, 2.200927734375, 2.36907958984375, 2.5372314453125, 2.70538330078125, 2.87353515625, 3.04168701171875, 3.2098388671875, 3.37799072265625, 3.546142578125, 3.71429443359375, 3.8824462890625, 4.05059814453125, 4.21875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 23.0, 25.0, 44.0, 66.0, 93.0, 157.0, 255.0, 417.0, 713.0, 1205.0, 2250.0, 4161.0, 7568.0, 14089.0, 26717.0, 50339.0, 91752.0, 152320.0, 202914.0, 192205.0, 133439.0, 77849.0, 41962.0, 22198.0, 11659.0, 6191.0, 3409.0, 1835.0, 1070.0, 612.0, 364.0, 207.0, 144.0, 86.0, 62.0, 46.0, 23.0, 18.0, 8.0, 9.0, 4.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.1220703125, -1.089874267578125, -1.05767822265625, -1.025482177734375, -0.9932861328125, -0.961090087890625, -0.92889404296875, -0.896697998046875, -0.864501953125, -0.832305908203125, -0.80010986328125, -0.767913818359375, -0.7357177734375, -0.703521728515625, -0.67132568359375, -0.639129638671875, -0.60693359375, -0.574737548828125, -0.54254150390625, -0.510345458984375, -0.4781494140625, -0.445953369140625, -0.41375732421875, -0.381561279296875, -0.349365234375, -0.317169189453125, -0.28497314453125, -0.252777099609375, -0.2205810546875, -0.188385009765625, -0.15618896484375, -0.123992919921875, -0.091796875, -0.059600830078125, -0.02740478515625, 0.004791259765625, 0.0369873046875, 0.069183349609375, 0.10137939453125, 0.133575439453125, 0.165771484375, 0.197967529296875, 0.23016357421875, 0.262359619140625, 0.2945556640625, 0.326751708984375, 0.35894775390625, 0.391143798828125, 0.42333984375, 0.455535888671875, 0.48773193359375, 0.519927978515625, 0.5521240234375, 0.584320068359375, 0.61651611328125, 0.648712158203125, 0.680908203125, 0.713104248046875, 0.74530029296875, 0.777496337890625, 0.8096923828125, 0.841888427734375, 0.87408447265625, 0.906280517578125, 0.9384765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 10.0, 7.0, 15.0, 20.0, 17.0, 18.0, 20.0, 19.0, 26.0, 23.0, 33.0, 38.0, 48.0, 55.0, 31.0, 44.0, 43.0, 42.0, 34.0, 49.0, 49.0, 37.0, 49.0, 33.0, 27.0, 28.0, 24.0, 23.0, 20.0, 24.0, 17.0, 12.0, 13.0, 5.0, 11.0, 3.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-14.6875, -14.27978515625, -13.8720703125, -13.46435546875, -13.056640625, -12.64892578125, -12.2412109375, -11.83349609375, -11.42578125, -11.01806640625, -10.6103515625, -10.20263671875, -9.794921875, -9.38720703125, -8.9794921875, -8.57177734375, -8.1640625, -7.75634765625, -7.3486328125, -6.94091796875, -6.533203125, -6.12548828125, -5.7177734375, -5.31005859375, -4.90234375, -4.49462890625, -4.0869140625, -3.67919921875, -3.271484375, -2.86376953125, -2.4560546875, -2.04833984375, -1.640625, -1.23291015625, -0.8251953125, -0.41748046875, -0.009765625, 0.39794921875, 0.8056640625, 1.21337890625, 1.62109375, 2.02880859375, 2.4365234375, 2.84423828125, 3.251953125, 3.65966796875, 4.0673828125, 4.47509765625, 4.8828125, 5.29052734375, 5.6982421875, 6.10595703125, 6.513671875, 6.92138671875, 7.3291015625, 7.73681640625, 8.14453125, 8.55224609375, 8.9599609375, 9.36767578125, 9.775390625, 10.18310546875, 10.5908203125, 10.99853515625, 11.40625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 11.0, 8.0, 19.0, 24.0, 32.0, 52.0, 56.0, 95.0, 112.0, 146.0, 234.0, 315.0, 446.0, 622.0, 932.0, 1558.0, 2788.0, 5945.0, 14591.0, 44457.0, 142935.0, 321629.0, 311234.0, 132828.0, 41212.0, 13599.0, 5474.0, 2660.0, 1515.0, 886.0, 642.0, 427.0, 289.0, 186.0, 175.0, 126.0, 85.0, 50.0, 46.0, 30.0, 25.0, 13.0, 12.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4130859375, -0.3997459411621094, -0.38640594482421875, -0.3730659484863281, -0.3597259521484375, -0.3463859558105469, -0.33304595947265625, -0.3197059631347656, -0.306365966796875, -0.2930259704589844, -0.27968597412109375, -0.2663459777832031, -0.2530059814453125, -0.23966598510742188, -0.22632598876953125, -0.21298599243164062, -0.19964599609375, -0.18630599975585938, -0.17296600341796875, -0.15962600708007812, -0.1462860107421875, -0.13294601440429688, -0.11960601806640625, -0.10626602172851562, -0.092926025390625, -0.07958602905273438, -0.06624603271484375, -0.052906036376953125, -0.0395660400390625, -0.026226043701171875, -0.01288604736328125, 0.000453948974609375, 0.0137939453125, 0.027133941650390625, 0.04047393798828125, 0.053813934326171875, 0.0671539306640625, 0.08049392700195312, 0.09383392333984375, 0.10717391967773438, 0.120513916015625, 0.13385391235351562, 0.14719390869140625, 0.16053390502929688, 0.1738739013671875, 0.18721389770507812, 0.20055389404296875, 0.21389389038085938, 0.22723388671875, 0.24057388305664062, 0.25391387939453125, 0.2672538757324219, 0.2805938720703125, 0.2939338684082031, 0.30727386474609375, 0.3206138610839844, 0.333953857421875, 0.3472938537597656, 0.36063385009765625, 0.3739738464355469, 0.3873138427734375, 0.4006538391113281, 0.41399383544921875, 0.4273338317871094, 0.440673828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 8.0, 19.0, 37.0, 42.0, 62.0, 85.0, 101.0, 134.0, 138.0, 96.0, 100.0, 53.0, 44.0, 20.0, 15.0, 5.0, 8.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020694732666015625, -0.00019535422325134277, -0.0001837611198425293, -0.00017216801643371582, -0.00016057491302490234, -0.00014898180961608887, -0.0001373887062072754, -0.00012579560279846191, -0.00011420249938964844, -0.00010260939598083496, -9.101629257202148e-05, -7.942318916320801e-05, -6.783008575439453e-05, -5.6236982345581055e-05, -4.464387893676758e-05, -3.30507755279541e-05, -2.1457672119140625e-05, -9.864568710327148e-06, 1.7285346984863281e-06, 1.3321638107299805e-05, 2.491474151611328e-05, 3.650784492492676e-05, 4.8100948333740234e-05, 5.969405174255371e-05, 7.128715515136719e-05, 8.288025856018066e-05, 9.447336196899414e-05, 0.00010606646537780762, 0.0001176595687866211, 0.00012925267219543457, 0.00014084577560424805, 0.00015243887901306152, 0.000164031982421875, 0.00017562508583068848, 0.00018721818923950195, 0.00019881129264831543, 0.0002104043960571289, 0.00022199749946594238, 0.00023359060287475586, 0.00024518370628356934, 0.0002567768096923828, 0.0002683699131011963, 0.00027996301651000977, 0.00029155611991882324, 0.0003031492233276367, 0.0003147423267364502, 0.00032633543014526367, 0.00033792853355407715, 0.0003495216369628906, 0.0003611147403717041, 0.0003727078437805176, 0.00038430094718933105, 0.00039589405059814453, 0.000407487154006958, 0.0004190802574157715, 0.00043067336082458496, 0.00044226646423339844, 0.0004538595676422119, 0.0004654526710510254, 0.00047704577445983887, 0.0004886388778686523, 0.0005002319812774658, 0.0005118250846862793, 0.0005234181880950928, 0.0005350112915039062]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 9.0, 18.0, 43.0, 49.0, 76.0, 133.0, 205.0, 337.0, 608.0, 1093.0, 1916.0, 3598.0, 6806.0, 12995.0, 24760.0, 46911.0, 85314.0, 138769.0, 187102.0, 189771.0, 147637.0, 92413.0, 50872.0, 26924.0, 14100.0, 7185.0, 3952.0, 2033.0, 1198.0, 700.0, 387.0, 231.0, 126.0, 96.0, 56.0, 41.0, 17.0, 20.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.250244140625, -0.24219512939453125, -0.2341461181640625, -0.22609710693359375, -0.218048095703125, -0.20999908447265625, -0.2019500732421875, -0.19390106201171875, -0.18585205078125, -0.17780303955078125, -0.1697540283203125, -0.16170501708984375, -0.153656005859375, -0.14560699462890625, -0.1375579833984375, -0.12950897216796875, -0.1214599609375, -0.11341094970703125, -0.1053619384765625, -0.09731292724609375, -0.089263916015625, -0.08121490478515625, -0.0731658935546875, -0.06511688232421875, -0.05706787109375, -0.04901885986328125, -0.0409698486328125, -0.03292083740234375, -0.024871826171875, -0.01682281494140625, -0.0087738037109375, -0.00072479248046875, 0.00732421875, 0.01537322998046875, 0.0234222412109375, 0.03147125244140625, 0.039520263671875, 0.04756927490234375, 0.0556182861328125, 0.06366729736328125, 0.07171630859375, 0.07976531982421875, 0.0878143310546875, 0.09586334228515625, 0.103912353515625, 0.11196136474609375, 0.1200103759765625, 0.12805938720703125, 0.1361083984375, 0.14415740966796875, 0.1522064208984375, 0.16025543212890625, 0.168304443359375, 0.17635345458984375, 0.1844024658203125, 0.19245147705078125, 0.20050048828125, 0.20854949951171875, 0.2165985107421875, 0.22464752197265625, 0.232696533203125, 0.24074554443359375, 0.2487945556640625, 0.25684356689453125, 0.264892578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 10.0, 7.0, 8.0, 10.0, 8.0, 10.0, 10.0, 25.0, 19.0, 20.0, 35.0, 31.0, 36.0, 37.0, 47.0, 43.0, 38.0, 42.0, 61.0, 53.0, 41.0, 65.0, 46.0, 45.0, 38.0, 35.0, 25.0, 33.0, 20.0, 17.0, 11.0, 14.0, 11.0, 9.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12042236328125, -0.11678504943847656, -0.11314773559570312, -0.10951042175292969, -0.10587310791015625, -0.10223579406738281, -0.09859848022460938, -0.09496116638183594, -0.0913238525390625, -0.08768653869628906, -0.08404922485351562, -0.08041191101074219, -0.07677459716796875, -0.07313728332519531, -0.06949996948242188, -0.06586265563964844, -0.062225341796875, -0.05858802795410156, -0.054950714111328125, -0.05131340026855469, -0.04767608642578125, -0.04403877258300781, -0.040401458740234375, -0.03676414489746094, -0.0331268310546875, -0.029489517211914062, -0.025852203369140625, -0.022214889526367188, -0.01857757568359375, -0.014940261840820312, -0.011302947998046875, -0.0076656341552734375, -0.0040283203125, -0.0003910064697265625, 0.003246307373046875, 0.0068836212158203125, 0.01052093505859375, 0.014158248901367188, 0.017795562744140625, 0.021432876586914062, 0.0250701904296875, 0.028707504272460938, 0.032344818115234375, 0.03598213195800781, 0.03961944580078125, 0.04325675964355469, 0.046894073486328125, 0.05053138732910156, 0.054168701171875, 0.05780601501464844, 0.061443328857421875, 0.06508064270019531, 0.06871795654296875, 0.07235527038574219, 0.07599258422851562, 0.07962989807128906, 0.0832672119140625, 0.08690452575683594, 0.09054183959960938, 0.09417915344238281, 0.09781646728515625, 0.10145378112792969, 0.10509109497070312, 0.10872840881347656, 0.11236572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 4.0, 3.0, 2.0, 7.0, 7.0, 6.0, 13.0, 9.0, 25.0, 25.0, 20.0, 26.0, 32.0, 36.0, 36.0, 40.0, 55.0, 33.0, 54.0, 48.0, 41.0, 56.0, 42.0, 41.0, 40.0, 36.0, 38.0, 44.0, 29.0, 29.0, 16.0, 21.0, 21.0, 11.0, 9.0, 11.0, 8.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.880415916442871, -3.7494759559631348, -3.6185359954833984, -3.487596035003662, -3.356656074523926, -3.2257161140441895, -3.094776153564453, -2.963836193084717, -2.8328962326049805, -2.701956272125244, -2.571016311645508, -2.4400763511657715, -2.309136390686035, -2.178196430206299, -2.0472564697265625, -1.9163165092468262, -1.7853765487670898, -1.6544365882873535, -1.5234966278076172, -1.3925566673278809, -1.2616167068481445, -1.1306767463684082, -0.9997367858886719, -0.8687968254089355, -0.7378568649291992, -0.6069169044494629, -0.47597694396972656, -0.34503698348999023, -0.2140970230102539, -0.08315706253051758, 0.04778289794921875, 0.17872285842895508, 0.3096632957458496, 0.44060325622558594, 0.5715432167053223, 0.7024831771850586, 0.8334231376647949, 0.9643630981445312, 1.0953030586242676, 1.226243019104004, 1.3571829795837402, 1.4881229400634766, 1.619062900543213, 1.7500028610229492, 1.8809428215026855, 2.011882781982422, 2.142822742462158, 2.2737627029418945, 2.404702663421631, 2.535642623901367, 2.6665825843811035, 2.79752254486084, 2.928462505340576, 3.0594024658203125, 3.190342426300049, 3.321282386779785, 3.4522223472595215, 3.583162307739258, 3.714102268218994, 3.8450422286987305, 3.975982189178467, 4.106922149658203, 4.2378621101379395, 4.368802070617676, 4.499742031097412]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 8.0, 19.0, 18.0, 16.0, 25.0, 21.0, 35.0, 30.0, 36.0, 51.0, 46.0, 44.0, 47.0, 34.0, 42.0, 43.0, 35.0, 49.0, 32.0, 37.0, 46.0, 30.0, 38.0, 21.0, 25.0, 22.0, 15.0, 14.0, 16.0, 15.0, 8.0, 8.0, 8.0, 10.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 4.0], "bins": [-5.612306118011475, -5.4637346267700195, -5.315162658691406, -5.166590690612793, -5.018019199371338, -4.869447708129883, -4.7208757400512695, -4.572303771972656, -4.423732280731201, -4.275160789489746, -4.126588821411133, -3.9780170917510986, -3.8294453620910645, -3.6808736324310303, -3.532301902770996, -3.383730173110962, -3.2351584434509277, -3.0865867137908936, -2.9380149841308594, -2.789443254470825, -2.640871524810791, -2.492299795150757, -2.3437280654907227, -2.1951563358306885, -2.0465846061706543, -1.8980128765106201, -1.749441146850586, -1.6008694171905518, -1.4522976875305176, -1.3037259578704834, -1.1551542282104492, -1.006582498550415, -0.85801100730896, -0.7094392776489258, -0.5608675479888916, -0.4122958183288574, -0.26372408866882324, -0.11515235900878906, 0.03341937065124512, 0.1819911003112793, 0.3305628299713135, 0.47913455963134766, 0.6277062892913818, 0.776278018951416, 0.9248497486114502, 1.0734214782714844, 1.2219932079315186, 1.3705649375915527, 1.519136667251587, 1.667708396911621, 1.8162801265716553, 1.9648518562316895, 2.1134235858917236, 2.261995315551758, 2.410567045211792, 2.559138774871826, 2.7077105045318604, 2.8562822341918945, 3.0048539638519287, 3.153425693511963, 3.301997423171997, 3.4505691528320312, 3.5991408824920654, 3.7477126121520996, 3.896284341812134]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 14.0, 15.0, 25.0, 41.0, 50.0, 94.0, 127.0, 159.0, 250.0, 377.0, 666.0, 1113.0, 1890.0, 3430.0, 6477.0, 12170.0, 23700.0, 49122.0, 103288.0, 192374.0, 255700.0, 193087.0, 104178.0, 49262.0, 23841.0, 12179.0, 6485.0, 3457.0, 2035.0, 1089.0, 682.0, 400.0, 259.0, 157.0, 97.0, 69.0, 54.0, 44.0, 24.0, 25.0, 15.0, 10.0, 6.0, 2.0, 9.0, 2.0, 1.0, 1.0, 2.0], "bins": [-6.69140625, -6.5029296875, -6.314453125, -6.1259765625, -5.9375, -5.7490234375, -5.560546875, -5.3720703125, -5.18359375, -4.9951171875, -4.806640625, -4.6181640625, -4.4296875, -4.2412109375, -4.052734375, -3.8642578125, -3.67578125, -3.4873046875, -3.298828125, -3.1103515625, -2.921875, -2.7333984375, -2.544921875, -2.3564453125, -2.16796875, -1.9794921875, -1.791015625, -1.6025390625, -1.4140625, -1.2255859375, -1.037109375, -0.8486328125, -0.66015625, -0.4716796875, -0.283203125, -0.0947265625, 0.09375, 0.2822265625, 0.470703125, 0.6591796875, 0.84765625, 1.0361328125, 1.224609375, 1.4130859375, 1.6015625, 1.7900390625, 1.978515625, 2.1669921875, 2.35546875, 2.5439453125, 2.732421875, 2.9208984375, 3.109375, 3.2978515625, 3.486328125, 3.6748046875, 3.86328125, 4.0517578125, 4.240234375, 4.4287109375, 4.6171875, 4.8056640625, 4.994140625, 5.1826171875, 5.37109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 8.0, 6.0, 8.0, 7.0, 19.0, 14.0, 13.0, 21.0, 30.0, 21.0, 30.0, 22.0, 37.0, 43.0, 41.0, 37.0, 43.0, 42.0, 39.0, 44.0, 31.0, 49.0, 40.0, 33.0, 30.0, 19.0, 32.0, 43.0, 22.0, 27.0, 20.0, 21.0, 19.0, 7.0, 15.0, 11.0, 11.0, 5.0, 6.0, 3.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0], "bins": [-8.4375, -8.20477294921875, -7.9720458984375, -7.73931884765625, -7.506591796875, -7.27386474609375, -7.0411376953125, -6.80841064453125, -6.57568359375, -6.34295654296875, -6.1102294921875, -5.87750244140625, -5.644775390625, -5.41204833984375, -5.1793212890625, -4.94659423828125, -4.7138671875, -4.48114013671875, -4.2484130859375, -4.01568603515625, -3.782958984375, -3.55023193359375, -3.3175048828125, -3.08477783203125, -2.85205078125, -2.61932373046875, -2.3865966796875, -2.15386962890625, -1.921142578125, -1.68841552734375, -1.4556884765625, -1.22296142578125, -0.990234375, -0.75750732421875, -0.5247802734375, -0.29205322265625, -0.059326171875, 0.17340087890625, 0.4061279296875, 0.63885498046875, 0.87158203125, 1.10430908203125, 1.3370361328125, 1.56976318359375, 1.802490234375, 2.03521728515625, 2.2679443359375, 2.50067138671875, 2.7333984375, 2.96612548828125, 3.1988525390625, 3.43157958984375, 3.664306640625, 3.89703369140625, 4.1297607421875, 4.36248779296875, 4.59521484375, 4.82794189453125, 5.0606689453125, 5.29339599609375, 5.526123046875, 5.75885009765625, 5.9915771484375, 6.22430419921875, 6.45703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 7.0, 11.0, 9.0, 7.0, 19.0, 24.0, 33.0, 53.0, 69.0, 119.0, 167.0, 267.0, 424.0, 1048.0, 2364.0, 6113.0, 17717.0, 56096.0, 181665.0, 397305.0, 259984.0, 83810.0, 26506.0, 8807.0, 3141.0, 1258.0, 591.0, 342.0, 184.0, 113.0, 95.0, 57.0, 43.0, 28.0, 21.0, 15.0, 14.0, 9.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.2861328125, -9.939453125, -9.5927734375, -9.24609375, -8.8994140625, -8.552734375, -8.2060546875, -7.859375, -7.5126953125, -7.166015625, -6.8193359375, -6.47265625, -6.1259765625, -5.779296875, -5.4326171875, -5.0859375, -4.7392578125, -4.392578125, -4.0458984375, -3.69921875, -3.3525390625, -3.005859375, -2.6591796875, -2.3125, -1.9658203125, -1.619140625, -1.2724609375, -0.92578125, -0.5791015625, -0.232421875, 0.1142578125, 0.4609375, 0.8076171875, 1.154296875, 1.5009765625, 1.84765625, 2.1943359375, 2.541015625, 2.8876953125, 3.234375, 3.5810546875, 3.927734375, 4.2744140625, 4.62109375, 4.9677734375, 5.314453125, 5.6611328125, 6.0078125, 6.3544921875, 6.701171875, 7.0478515625, 7.39453125, 7.7412109375, 8.087890625, 8.4345703125, 8.78125, 9.1279296875, 9.474609375, 9.8212890625, 10.16796875, 10.5146484375, 10.861328125, 11.2080078125, 11.5546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 11.0, 10.0, 24.0, 21.0, 29.0, 32.0, 34.0, 29.0, 48.0, 52.0, 57.0, 54.0, 47.0, 48.0, 46.0, 47.0, 59.0, 50.0, 45.0, 38.0, 32.0, 23.0, 34.0, 26.0, 23.0, 15.0, 11.0, 14.0, 8.0, 4.0, 8.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-14.4765625, -14.1214599609375, -13.766357421875, -13.4112548828125, -13.05615234375, -12.7010498046875, -12.345947265625, -11.9908447265625, -11.6357421875, -11.2806396484375, -10.925537109375, -10.5704345703125, -10.21533203125, -9.8602294921875, -9.505126953125, -9.1500244140625, -8.794921875, -8.4398193359375, -8.084716796875, -7.7296142578125, -7.37451171875, -7.0194091796875, -6.664306640625, -6.3092041015625, -5.9541015625, -5.5989990234375, -5.243896484375, -4.8887939453125, -4.53369140625, -4.1785888671875, -3.823486328125, -3.4683837890625, -3.11328125, -2.7581787109375, -2.403076171875, -2.0479736328125, -1.69287109375, -1.3377685546875, -0.982666015625, -0.6275634765625, -0.2724609375, 0.0826416015625, 0.437744140625, 0.7928466796875, 1.14794921875, 1.5030517578125, 1.858154296875, 2.2132568359375, 2.568359375, 2.9234619140625, 3.278564453125, 3.6336669921875, 3.98876953125, 4.3438720703125, 4.698974609375, 5.0540771484375, 5.4091796875, 5.7642822265625, 6.119384765625, 6.4744873046875, 6.82958984375, 7.1846923828125, 7.539794921875, 7.8948974609375, 8.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 8.0, 15.0, 14.0, 26.0, 45.0, 50.0, 73.0, 97.0, 178.0, 236.0, 383.0, 650.0, 1174.0, 2478.0, 5917.0, 16911.0, 56562.0, 194155.0, 468752.0, 209216.0, 61719.0, 18315.0, 6164.0, 2509.0, 1139.0, 639.0, 338.0, 225.0, 175.0, 119.0, 72.0, 55.0, 38.0, 29.0, 18.0, 17.0, 14.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.356414794921875, -2.27923583984375, -2.202056884765625, -2.1248779296875, -2.047698974609375, -1.97052001953125, -1.893341064453125, -1.816162109375, -1.738983154296875, -1.66180419921875, -1.584625244140625, -1.5074462890625, -1.430267333984375, -1.35308837890625, -1.275909423828125, -1.19873046875, -1.121551513671875, -1.04437255859375, -0.967193603515625, -0.8900146484375, -0.812835693359375, -0.73565673828125, -0.658477783203125, -0.581298828125, -0.504119873046875, -0.42694091796875, -0.349761962890625, -0.2725830078125, -0.195404052734375, -0.11822509765625, -0.041046142578125, 0.0361328125, 0.113311767578125, 0.19049072265625, 0.267669677734375, 0.3448486328125, 0.422027587890625, 0.49920654296875, 0.576385498046875, 0.653564453125, 0.730743408203125, 0.80792236328125, 0.885101318359375, 0.9622802734375, 1.039459228515625, 1.11663818359375, 1.193817138671875, 1.27099609375, 1.348175048828125, 1.42535400390625, 1.502532958984375, 1.5797119140625, 1.656890869140625, 1.73406982421875, 1.811248779296875, 1.888427734375, 1.965606689453125, 2.04278564453125, 2.119964599609375, 2.1971435546875, 2.274322509765625, 2.35150146484375, 2.428680419921875, 2.505859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 11.0, 5.0, 7.0, 16.0, 15.0, 19.0, 28.0, 36.0, 49.0, 64.0, 82.0, 90.0, 160.0, 85.0, 73.0, 63.0, 53.0, 33.0, 33.0, 24.0, 18.0, 14.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006289482116699219, -0.0006138086318969727, -0.0005986690521240234, -0.0005835294723510742, -0.000568389892578125, -0.0005532503128051758, -0.0005381107330322266, -0.0005229711532592773, -0.0005078315734863281, -0.0004926919937133789, -0.0004775524139404297, -0.00046241283416748047, -0.00044727325439453125, -0.00043213367462158203, -0.0004169940948486328, -0.0004018545150756836, -0.0003867149353027344, -0.00037157535552978516, -0.00035643577575683594, -0.0003412961959838867, -0.0003261566162109375, -0.0003110170364379883, -0.00029587745666503906, -0.00028073787689208984, -0.0002655982971191406, -0.0002504587173461914, -0.0002353191375732422, -0.00022017955780029297, -0.00020503997802734375, -0.00018990039825439453, -0.0001747608184814453, -0.0001596212387084961, -0.00014448165893554688, -0.00012934207916259766, -0.00011420249938964844, -9.906291961669922e-05, -8.392333984375e-05, -6.878376007080078e-05, -5.364418029785156e-05, -3.8504600524902344e-05, -2.3365020751953125e-05, -8.225440979003906e-06, 6.9141387939453125e-06, 2.205371856689453e-05, 3.719329833984375e-05, 5.233287811279297e-05, 6.747245788574219e-05, 8.26120376586914e-05, 9.775161743164062e-05, 0.00011289119720458984, 0.00012803077697753906, 0.00014317035675048828, 0.0001583099365234375, 0.00017344951629638672, 0.00018858909606933594, 0.00020372867584228516, 0.00021886825561523438, 0.0002340078353881836, 0.0002491474151611328, 0.00026428699493408203, 0.00027942657470703125, 0.00029456615447998047, 0.0003097057342529297, 0.0003248453140258789, 0.0003399848937988281]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 3.0, 12.0, 10.0, 12.0, 14.0, 23.0, 41.0, 47.0, 57.0, 108.0, 144.0, 203.0, 303.0, 384.0, 652.0, 1067.0, 1560.0, 2782.0, 4955.0, 9684.0, 22496.0, 63233.0, 187380.0, 422519.0, 210382.0, 71626.0, 25087.0, 10535.0, 5346.0, 2987.0, 1754.0, 1106.0, 650.0, 430.0, 293.0, 220.0, 115.0, 91.0, 61.0, 56.0, 29.0, 29.0, 16.0, 9.0, 12.0, 5.0, 7.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.31640625, -2.2406005859375, -2.164794921875, -2.0889892578125, -2.01318359375, -1.9373779296875, -1.861572265625, -1.7857666015625, -1.7099609375, -1.6341552734375, -1.558349609375, -1.4825439453125, -1.40673828125, -1.3309326171875, -1.255126953125, -1.1793212890625, -1.103515625, -1.0277099609375, -0.951904296875, -0.8760986328125, -0.80029296875, -0.7244873046875, -0.648681640625, -0.5728759765625, -0.4970703125, -0.4212646484375, -0.345458984375, -0.2696533203125, -0.19384765625, -0.1180419921875, -0.042236328125, 0.0335693359375, 0.109375, 0.1851806640625, 0.260986328125, 0.3367919921875, 0.41259765625, 0.4884033203125, 0.564208984375, 0.6400146484375, 0.7158203125, 0.7916259765625, 0.867431640625, 0.9432373046875, 1.01904296875, 1.0948486328125, 1.170654296875, 1.2464599609375, 1.322265625, 1.3980712890625, 1.473876953125, 1.5496826171875, 1.62548828125, 1.7012939453125, 1.777099609375, 1.8529052734375, 1.9287109375, 2.0045166015625, 2.080322265625, 2.1561279296875, 2.23193359375, 2.3077392578125, 2.383544921875, 2.4593505859375, 2.53515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 2.0, 8.0, 13.0, 14.0, 24.0, 17.0, 24.0, 39.0, 49.0, 72.0, 78.0, 104.0, 149.0, 81.0, 56.0, 58.0, 33.0, 35.0, 39.0, 23.0, 17.0, 13.0, 9.0, 13.0, 3.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.681640625, -1.6279449462890625, -1.574249267578125, -1.5205535888671875, -1.46685791015625, -1.4131622314453125, -1.359466552734375, -1.3057708740234375, -1.2520751953125, -1.1983795166015625, -1.144683837890625, -1.0909881591796875, -1.03729248046875, -0.9835968017578125, -0.929901123046875, -0.8762054443359375, -0.822509765625, -0.7688140869140625, -0.715118408203125, -0.6614227294921875, -0.60772705078125, -0.5540313720703125, -0.500335693359375, -0.4466400146484375, -0.3929443359375, -0.3392486572265625, -0.285552978515625, -0.2318572998046875, -0.17816162109375, -0.1244659423828125, -0.070770263671875, -0.0170745849609375, 0.03662109375, 0.0903167724609375, 0.144012451171875, 0.1977081298828125, 0.25140380859375, 0.3050994873046875, 0.358795166015625, 0.4124908447265625, 0.4661865234375, 0.5198822021484375, 0.573577880859375, 0.6272735595703125, 0.68096923828125, 0.7346649169921875, 0.788360595703125, 0.8420562744140625, 0.895751953125, 0.9494476318359375, 1.003143310546875, 1.0568389892578125, 1.11053466796875, 1.1642303466796875, 1.217926025390625, 1.2716217041015625, 1.3253173828125, 1.3790130615234375, 1.432708740234375, 1.4864044189453125, 1.54010009765625, 1.5937957763671875, 1.647491455078125, 1.7011871337890625, 1.7548828125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 20.0, 27.0, 70.0, 116.0, 168.0, 159.0, 141.0, 113.0, 82.0, 41.0, 23.0, 14.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.465322494506836, -17.573015213012695, -16.680707931518555, -15.788400650024414, -14.896093368530273, -14.003786087036133, -13.111478805541992, -12.219171524047852, -11.326864242553711, -10.43455696105957, -9.54224967956543, -8.649942398071289, -7.757635116577148, -6.865327835083008, -5.973020553588867, -5.080713272094727, -4.188405990600586, -3.2960987091064453, -2.4037914276123047, -1.511484146118164, -0.6191768646240234, 0.2731304168701172, 1.1654376983642578, 2.0577449798583984, 2.950052261352539, 3.8423595428466797, 4.73466682434082, 5.626974105834961, 6.519281387329102, 7.411588668823242, 8.303895950317383, 9.196203231811523, 10.088512420654297, 10.980819702148438, 11.873126983642578, 12.765434265136719, 13.65774154663086, 14.550048828125, 15.44235610961914, 16.33466339111328, 17.226970672607422, 18.119277954101562, 19.011585235595703, 19.903892517089844, 20.796199798583984, 21.688507080078125, 22.580814361572266, 23.473121643066406, 24.365428924560547, 25.257736206054688, 26.150043487548828, 27.04235076904297, 27.93465805053711, 28.82696533203125, 29.71927261352539, 30.61157989501953, 31.503887176513672, 32.39619445800781, 33.28850173950195, 34.180809020996094, 35.073116302490234, 35.965423583984375, 36.857730865478516, 37.750038146972656, 38.6423454284668]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 9.0, 8.0, 11.0, 12.0, 3.0, 12.0, 14.0, 20.0, 20.0, 17.0, 19.0, 22.0, 23.0, 25.0, 28.0, 28.0, 25.0, 43.0, 34.0, 34.0, 45.0, 35.0, 46.0, 35.0, 34.0, 34.0, 34.0, 40.0, 23.0, 29.0, 16.0, 12.0, 32.0, 22.0, 11.0, 20.0, 18.0, 15.0, 16.0, 12.0, 9.0, 8.0, 7.0, 3.0, 5.0, 8.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0], "bins": [-13.604690551757812, -13.202754020690918, -12.800816535949707, -12.398880004882812, -11.996943473815918, -11.595005989074707, -11.193069458007812, -10.791131973266602, -10.389195442199707, -9.987258911132812, -9.585321426391602, -9.183384895324707, -8.781448364257812, -8.379510879516602, -7.977574348449707, -7.575637340545654, -7.17370080947876, -6.771763801574707, -6.3698272705078125, -5.96789026260376, -5.565953254699707, -5.1640167236328125, -4.76207971572876, -4.360142707824707, -3.9582059383392334, -3.5562691688537598, -3.154332160949707, -2.7523953914642334, -2.3504586219787598, -1.948521614074707, -1.5465848445892334, -1.1446478366851807, -0.742711067199707, -0.34077420830726624, 0.06116265058517456, 0.46309947967529297, 0.8650363683700562, 1.2669732570648193, 1.668910026550293, 2.0708470344543457, 2.4727838039398193, 2.874720573425293, 3.2766575813293457, 3.6785943508148193, 4.080531120300293, 4.482468128204346, 4.884405136108398, 5.286341667175293, 5.688278675079346, 6.090215682983398, 6.492152214050293, 6.894089221954346, 7.296026229858398, 7.697962760925293, 8.099899291992188, 8.501836776733398, 8.903773307800293, 9.305709838867188, 9.707647323608398, 10.109583854675293, 10.511520385742188, 10.913457870483398, 11.315394401550293, 11.717330932617188, 12.119268417358398]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 8.0, 8.0, 9.0, 12.0, 13.0, 16.0, 31.0, 31.0, 38.0, 48.0, 65.0, 91.0, 107.0, 148.0, 197.0, 284.0, 374.0, 493.0, 657.0, 901.0, 1239.0, 1783.0, 2570.0, 3626.0, 5107.0, 9537.0, 1002931.0, 6088.0, 4049.0, 2851.0, 2041.0, 1409.0, 982.0, 719.0, 517.0, 394.0, 292.0, 221.0, 150.0, 148.0, 100.0, 72.0, 61.0, 44.0, 44.0, 32.0, 11.0, 15.0, 13.0, 13.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-10.43497085571289, -10.11055850982666, -9.78614616394043, -9.4617338180542, -9.137321472167969, -8.812908172607422, -8.488495826721191, -8.164083480834961, -7.8396711349487305, -7.5152587890625, -7.1908464431762695, -6.866433620452881, -6.54202127456665, -6.21760892868042, -5.893196105957031, -5.568783760070801, -5.24437141418457, -4.91995906829834, -4.595546722412109, -4.271133899688721, -3.9467215538024902, -3.6223092079162598, -3.29789662361145, -2.9734840393066406, -2.64907169342041, -2.3246593475341797, -2.00024676322937, -1.67583429813385, -1.35142183303833, -1.02700936794281, -0.70259690284729, -0.37818431854248047, -0.053771018981933594, 0.2706414461135864, 0.5950539112091064, 0.9194663763046265, 1.2438788414001465, 1.5682913064956665, 1.8927037715911865, 2.217116355895996, 2.5415287017822266, 2.865941047668457, 3.1903536319732666, 3.514766216278076, 3.8391785621643066, 4.163590908050537, 4.488003730773926, 4.812416076660156, 5.136828422546387, 5.461240768432617, 5.785653114318848, 6.110065937042236, 6.434478282928467, 6.758890628814697, 7.083303451538086, 7.407715797424316, 7.732128143310547, 8.056540489196777, 8.380952835083008, 8.705365180969238, 9.029777526855469, 9.354190826416016, 9.678603172302246, 10.003015518188477, 10.327427864074707]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 21.0, 25.0, 82.0, 149.0, 414.0, 2145.0, 25360.0, 51373192.0, 63102.0, 4641.0, 724.0, 246.0, 104.0, 48.0, 30.0, 15.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.755859375, -66.43700408935547, -64.11814880371094, -61.79930114746094, -59.480445861816406, -57.161590576171875, -54.84273910522461, -52.523887634277344, -50.20503234863281, -47.88617706298828, -45.567325592041016, -43.24847412109375, -40.92961883544922, -38.61076354980469, -36.29191207885742, -33.973060607910156, -31.654205322265625, -29.335351943969727, -27.016498565673828, -24.69764518737793, -22.37879180908203, -20.059938430786133, -17.741085052490234, -15.422231674194336, -13.103378295898438, -10.784524917602539, -8.46567153930664, -6.146818161010742, -3.8279647827148438, -1.5091114044189453, 0.8097419738769531, 3.1285953521728516, 5.447456359863281, 7.76630973815918, 10.085163116455078, 12.404016494750977, 14.722869873046875, 17.041723251342773, 19.360576629638672, 21.67943000793457, 23.99828338623047, 26.317136764526367, 28.635990142822266, 30.954843521118164, 33.27369689941406, 35.592552185058594, 37.91140365600586, 40.230255126953125, 42.549110412597656, 44.86796569824219, 47.18681716918945, 49.50566864013672, 51.82452392578125, 54.14337921142578, 56.46223068237305, 58.78108215332031, 61.099937438964844, 63.418792724609375, 65.73764038085938, 68.0564956665039, 70.37535095214844, 72.69420623779297, 75.0130615234375, 77.3319091796875, 79.65076446533203]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 10.0, 9.0, 22.0, 31.0, 44.0, 62.0, 90.0, 104.0, 168.0, 225.0, 365.0, 579.0, 878.0, 1420.0, 2544.0, 4556.0, 8495.0, 16414.0, 32349.0, 64145.0, 123843.0, 228760.0, 375571.0, 614330.0, 3583894.0, 496965.0, 329835.0, 193343.0, 102699.0, 52361.0, 26613.0, 13753.0, 7179.0, 3952.0, 2187.0, 1326.0, 780.0, 493.0, 310.0, 223.0, 138.0, 97.0, 67.0, 59.0, 41.0, 34.0, 16.0, 21.0, 12.0, 8.0, 11.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-6.15234375, -5.95611572265625, -5.7598876953125, -5.56365966796875, -5.367431640625, -5.17120361328125, -4.9749755859375, -4.77874755859375, -4.58251953125, -4.38629150390625, -4.1900634765625, -3.99383544921875, -3.797607421875, -3.60137939453125, -3.4051513671875, -3.20892333984375, -3.0126953125, -2.81646728515625, -2.6202392578125, -2.42401123046875, -2.227783203125, -2.03155517578125, -1.8353271484375, -1.63909912109375, -1.44287109375, -1.24664306640625, -1.0504150390625, -0.85418701171875, -0.657958984375, -0.46173095703125, -0.2655029296875, -0.06927490234375, 0.126953125, 0.32318115234375, 0.5194091796875, 0.71563720703125, 0.911865234375, 1.10809326171875, 1.3043212890625, 1.50054931640625, 1.69677734375, 1.89300537109375, 2.0892333984375, 2.28546142578125, 2.481689453125, 2.67791748046875, 2.8741455078125, 3.07037353515625, 3.2666015625, 3.46282958984375, 3.6590576171875, 3.85528564453125, 4.051513671875, 4.24774169921875, 4.4439697265625, 4.64019775390625, 4.83642578125, 5.03265380859375, 5.2288818359375, 5.42510986328125, 5.621337890625, 5.81756591796875, 6.0137939453125, 6.21002197265625, 6.40625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 14.0, 11.0, 12.0, 12.0, 14.0, 13.0, 18.0, 27.0, 38.0, 30.0, 41.0, 29.0, 29.0, 37.0, 45.0, 104.0, 990.0, 78.0, 37.0, 53.0, 46.0, 27.0, 44.0, 37.0, 24.0, 25.0, 28.0, 21.0, 21.0, 27.0, 29.0, 6.0, 13.0, 8.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-62.375, -60.39453125, -58.4140625, -56.43359375, -54.453125, -52.47265625, -50.4921875, -48.51171875, -46.53125, -44.55078125, -42.5703125, -40.58984375, -38.609375, -36.62890625, -34.6484375, -32.66796875, -30.6875, -28.70703125, -26.7265625, -24.74609375, -22.765625, -20.78515625, -18.8046875, -16.82421875, -14.84375, -12.86328125, -10.8828125, -8.90234375, -6.921875, -4.94140625, -2.9609375, -0.98046875, 1.0, 2.98046875, 4.9609375, 6.94140625, 8.921875, 10.90234375, 12.8828125, 14.86328125, 16.84375, 18.82421875, 20.8046875, 22.78515625, 24.765625, 26.74609375, 28.7265625, 30.70703125, 32.6875, 34.66796875, 36.6484375, 38.62890625, 40.609375, 42.58984375, 44.5703125, 46.55078125, 48.53125, 50.51171875, 52.4921875, 54.47265625, 56.453125, 58.43359375, 60.4140625, 62.39453125, 64.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 14.0, 13.0, 27.0, 53.0, 68.0, 71.0, 107.0, 176.0, 264.0, 391.0, 569.0, 891.0, 1450.0, 2175.0, 3610.0, 5563.0, 8642.0, 13651.0, 21329.0, 33514.0, 50963.0, 77677.0, 112450.0, 157021.0, 208145.0, 260549.0, 312245.0, 2082887.0, 1698998.0, 304747.0, 254628.0, 202646.0, 152065.0, 109926.0, 74693.0, 49935.0, 32458.0, 20626.0, 13077.0, 8398.0, 5201.0, 3497.0, 2168.0, 1406.0, 873.0, 603.0, 370.0, 226.0, 138.0, 82.0, 66.0, 46.0, 21.0, 13.0, 7.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.033203125, -2.928466796875, -2.82373046875, -2.718994140625, -2.6142578125, -2.509521484375, -2.40478515625, -2.300048828125, -2.1953125, -2.090576171875, -1.98583984375, -1.881103515625, -1.7763671875, -1.671630859375, -1.56689453125, -1.462158203125, -1.357421875, -1.252685546875, -1.14794921875, -1.043212890625, -0.9384765625, -0.833740234375, -0.72900390625, -0.624267578125, -0.51953125, -0.414794921875, -0.31005859375, -0.205322265625, -0.1005859375, 0.004150390625, 0.10888671875, 0.213623046875, 0.318359375, 0.423095703125, 0.52783203125, 0.632568359375, 0.7373046875, 0.842041015625, 0.94677734375, 1.051513671875, 1.15625, 1.260986328125, 1.36572265625, 1.470458984375, 1.5751953125, 1.679931640625, 1.78466796875, 1.889404296875, 1.994140625, 2.098876953125, 2.20361328125, 2.308349609375, 2.4130859375, 2.517822265625, 2.62255859375, 2.727294921875, 2.83203125, 2.936767578125, 3.04150390625, 3.146240234375, 3.2509765625, 3.355712890625, 3.46044921875, 3.565185546875, 3.669921875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 8.0, 2.0, 7.0, 10.0, 7.0, 10.0, 14.0, 12.0, 20.0, 25.0, 33.0, 39.0, 36.0, 38.0, 40.0, 35.0, 41.0, 50.0, 43.0, 882.0, 226.0, 48.0, 32.0, 48.0, 31.0, 30.0, 39.0, 31.0, 33.0, 22.0, 33.0, 20.0, 12.0, 15.0, 10.0, 13.0, 6.0, 6.0, 5.0, 1.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-61.6875, -59.966796875, -58.24609375, -56.525390625, -54.8046875, -53.083984375, -51.36328125, -49.642578125, -47.921875, -46.201171875, -44.48046875, -42.759765625, -41.0390625, -39.318359375, -37.59765625, -35.876953125, -34.15625, -32.435546875, -30.71484375, -28.994140625, -27.2734375, -25.552734375, -23.83203125, -22.111328125, -20.390625, -18.669921875, -16.94921875, -15.228515625, -13.5078125, -11.787109375, -10.06640625, -8.345703125, -6.625, -4.904296875, -3.18359375, -1.462890625, 0.2578125, 1.978515625, 3.69921875, 5.419921875, 7.140625, 8.861328125, 10.58203125, 12.302734375, 14.0234375, 15.744140625, 17.46484375, 19.185546875, 20.90625, 22.626953125, 24.34765625, 26.068359375, 27.7890625, 29.509765625, 31.23046875, 32.951171875, 34.671875, 36.392578125, 38.11328125, 39.833984375, 41.5546875, 43.275390625, 44.99609375, 46.716796875, 48.4375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 0.0, 10.0, 1.0, 10.0, 13.0, 12.0, 33.0, 38.0, 41.0, 81.0, 91.0, 106.0, 154.0, 231.0, 282.0, 371.0, 587.0, 859.0, 1442.0, 2414.0, 4291.0, 8222.0, 16536.0, 34862.0, 69864.0, 141886.0, 5665748.0, 178223.0, 82144.0, 41064.0, 19764.0, 9538.0, 5006.0, 2736.0, 1615.0, 935.0, 685.0, 453.0, 253.0, 211.0, 188.0, 128.0, 83.0, 78.0, 35.0, 30.0, 26.0, 17.0, 23.0, 4.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.8046875, -11.4190673828125, -11.033447265625, -10.6478271484375, -10.26220703125, -9.8765869140625, -9.490966796875, -9.1053466796875, -8.7197265625, -8.3341064453125, -7.948486328125, -7.5628662109375, -7.17724609375, -6.7916259765625, -6.406005859375, -6.0203857421875, -5.634765625, -5.2491455078125, -4.863525390625, -4.4779052734375, -4.09228515625, -3.7066650390625, -3.321044921875, -2.9354248046875, -2.5498046875, -2.1641845703125, -1.778564453125, -1.3929443359375, -1.00732421875, -0.6217041015625, -0.236083984375, 0.1495361328125, 0.53515625, 0.9207763671875, 1.306396484375, 1.6920166015625, 2.07763671875, 2.4632568359375, 2.848876953125, 3.2344970703125, 3.6201171875, 4.0057373046875, 4.391357421875, 4.7769775390625, 5.16259765625, 5.5482177734375, 5.933837890625, 6.3194580078125, 6.705078125, 7.0906982421875, 7.476318359375, 7.8619384765625, 8.24755859375, 8.6331787109375, 9.018798828125, 9.4044189453125, 9.7900390625, 10.1756591796875, 10.561279296875, 10.9468994140625, 11.33251953125, 11.7181396484375, 12.103759765625, 12.4893798828125, 12.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 17.0, 11.0, 7.0, 12.0, 16.0, 21.0, 22.0, 34.0, 28.0, 30.0, 34.0, 26.0, 35.0, 32.0, 29.0, 41.0, 221.0, 884.0, 54.0, 44.0, 45.0, 40.0, 25.0, 42.0, 38.0, 30.0, 35.0, 24.0, 22.0, 20.0, 14.0, 18.0, 13.0, 7.0, 6.0, 5.0, 8.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-51.5625, -50.06005859375, -48.5576171875, -47.05517578125, -45.552734375, -44.05029296875, -42.5478515625, -41.04541015625, -39.54296875, -38.04052734375, -36.5380859375, -35.03564453125, -33.533203125, -32.03076171875, -30.5283203125, -29.02587890625, -27.5234375, -26.02099609375, -24.5185546875, -23.01611328125, -21.513671875, -20.01123046875, -18.5087890625, -17.00634765625, -15.50390625, -14.00146484375, -12.4990234375, -10.99658203125, -9.494140625, -7.99169921875, -6.4892578125, -4.98681640625, -3.484375, -1.98193359375, -0.4794921875, 1.02294921875, 2.525390625, 4.02783203125, 5.5302734375, 7.03271484375, 8.53515625, 10.03759765625, 11.5400390625, 13.04248046875, 14.544921875, 16.04736328125, 17.5498046875, 19.05224609375, 20.5546875, 22.05712890625, 23.5595703125, 25.06201171875, 26.564453125, 28.06689453125, 29.5693359375, 31.07177734375, 32.57421875, 34.07666015625, 35.5791015625, 37.08154296875, 38.583984375, 40.08642578125, 41.5888671875, 43.09130859375, 44.59375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 22.0, 24.0, 35.0, 63.0, 124.0, 302.0, 170.0, 87.0, 66.0, 35.0, 24.0, 10.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.9962158203125, -353.1197204589844, -341.2432556152344, -329.36676025390625, -317.49029541015625, -305.6138000488281, -293.7373046875, -281.86083984375, -269.984375, -258.1078796386719, -246.23141479492188, -234.35491943359375, -222.47845458984375, -210.60195922851562, -198.72547912597656, -186.8489990234375, -174.97250366210938, -163.0960235595703, -151.21954345703125, -139.34304809570312, -127.4665756225586, -115.59009552001953, -103.71360778808594, -91.83712768554688, -79.96064758300781, -68.08416748046875, -56.20768356323242, -44.331199645996094, -32.45471954345703, -20.57823944091797, -8.701751708984375, 3.1747283935546875, 15.05120849609375, 26.927690505981445, 38.80417251586914, 50.68065643310547, 62.55713653564453, 74.4336166381836, 86.31010437011719, 98.18658447265625, 110.06306457519531, 121.93954467773438, 133.81602478027344, 145.6925048828125, 157.56900024414062, 169.44546508789062, 181.32196044921875, 193.1984405517578, 205.07492065429688, 216.95140075683594, 228.827880859375, 240.70437622070312, 252.58084106445312, 264.45733642578125, 276.33380126953125, 288.2102966308594, 300.0867919921875, 311.9632873535156, 323.8397521972656, 335.71624755859375, 347.59271240234375, 359.4692077636719, 371.345703125, 383.22216796875, 395.0986328125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 10.0, 11.0, 14.0, 15.0, 14.0, 11.0, 37.0, 30.0, 32.0, 52.0, 77.0, 105.0, 94.0, 104.0, 83.0, 47.0, 54.0, 31.0, 36.0, 33.0, 18.0, 20.0, 9.0, 8.0, 6.0, 7.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-586.9769897460938, -567.143310546875, -547.3095703125, -527.4758911132812, -507.64215087890625, -487.8084411621094, -467.9747314453125, -448.14105224609375, -428.30731201171875, -408.4736022949219, -388.639892578125, -368.8061828613281, -348.97247314453125, -329.1387634277344, -309.3050537109375, -289.47137451171875, -269.6376647949219, -249.803955078125, -229.97024536132812, -210.13653564453125, -190.30282592773438, -170.4691162109375, -150.6354217529297, -130.8017120361328, -110.96800231933594, -91.13429260253906, -71.30058288574219, -51.466880798339844, -31.63317108154297, -11.799461364746094, 8.03424072265625, 27.867950439453125, 47.70166015625, 67.53536987304688, 87.36907958984375, 107.2027816772461, 127.03649139404297, 146.87020874023438, 166.7039031982422, 186.53761291503906, 206.37132263183594, 226.2050323486328, 246.0387420654297, 265.8724365234375, 285.7061462402344, 305.53985595703125, 325.3735656738281, 345.207275390625, 365.0409851074219, 384.87469482421875, 404.7084045410156, 424.5421142578125, 444.3758239746094, 464.20953369140625, 484.043212890625, 503.876953125, 523.7106323242188, 543.5443115234375, 563.3780517578125, 583.2117309570312, 603.0454711914062, 622.879150390625, 642.712890625, 662.5465698242188, 682.3803100585938]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 12.0, 7.0, 9.0, 25.0, 34.0, 41.0, 58.0, 61.0, 79.0, 109.0, 189.0, 237.0, 313.0, 512.0, 750.0, 1183.0, 2112.0, 3869.0, 8565.0, 23725.0, 127151.0, 3860902.0, 121834.0, 24452.0, 8601.0, 4018.0, 2063.0, 1239.0, 687.0, 460.0, 291.0, 195.0, 132.0, 99.0, 76.0, 52.0, 31.0, 26.0, 15.0, 16.0, 5.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3671875, -1.3286590576171875, -1.290130615234375, -1.2516021728515625, -1.21307373046875, -1.1745452880859375, -1.136016845703125, -1.0974884033203125, -1.0589599609375, -1.0204315185546875, -0.981903076171875, -0.9433746337890625, -0.90484619140625, -0.8663177490234375, -0.827789306640625, -0.7892608642578125, -0.750732421875, -0.7122039794921875, -0.673675537109375, -0.6351470947265625, -0.59661865234375, -0.5580902099609375, -0.519561767578125, -0.4810333251953125, -0.4425048828125, -0.4039764404296875, -0.365447998046875, -0.3269195556640625, -0.28839111328125, -0.2498626708984375, -0.211334228515625, -0.1728057861328125, -0.13427734375, -0.0957489013671875, -0.057220458984375, -0.0186920166015625, 0.01983642578125, 0.0583648681640625, 0.096893310546875, 0.1354217529296875, 0.1739501953125, 0.2124786376953125, 0.251007080078125, 0.2895355224609375, 0.32806396484375, 0.3665924072265625, 0.405120849609375, 0.4436492919921875, 0.482177734375, 0.5207061767578125, 0.559234619140625, 0.5977630615234375, 0.63629150390625, 0.6748199462890625, 0.713348388671875, 0.7518768310546875, 0.7904052734375, 0.8289337158203125, 0.867462158203125, 0.9059906005859375, 0.94451904296875, 0.9830474853515625, 1.021575927734375, 1.0601043701171875, 1.0986328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 8.0, 4.0, 14.0, 21.0, 22.0, 58.0, 70.0, 433.0, 157.0, 58.0, 31.0, 26.0, 26.0, 10.0, 11.0, 4.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8369140625, -0.814178466796875, -0.79144287109375, -0.768707275390625, -0.7459716796875, -0.723236083984375, -0.70050048828125, -0.677764892578125, -0.655029296875, -0.632293701171875, -0.60955810546875, -0.586822509765625, -0.5640869140625, -0.541351318359375, -0.51861572265625, -0.495880126953125, -0.47314453125, -0.450408935546875, -0.42767333984375, -0.404937744140625, -0.3822021484375, -0.359466552734375, -0.33673095703125, -0.313995361328125, -0.291259765625, -0.268524169921875, -0.24578857421875, -0.223052978515625, -0.2003173828125, -0.177581787109375, -0.15484619140625, -0.132110595703125, -0.109375, -0.086639404296875, -0.06390380859375, -0.041168212890625, -0.0184326171875, 0.004302978515625, 0.02703857421875, 0.049774169921875, 0.072509765625, 0.095245361328125, 0.11798095703125, 0.140716552734375, 0.1634521484375, 0.186187744140625, 0.20892333984375, 0.231658935546875, 0.25439453125, 0.277130126953125, 0.29986572265625, 0.322601318359375, 0.3453369140625, 0.368072509765625, 0.39080810546875, 0.413543701171875, 0.436279296875, 0.459014892578125, 0.48175048828125, 0.504486083984375, 0.5272216796875, 0.549957275390625, 0.57269287109375, 0.595428466796875, 0.6181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 3.0, 11.0, 13.0, 25.0, 33.0, 51.0, 75.0, 110.0, 182.0, 291.0, 560.0, 1149.0, 2597.0, 6638.0, 20968.0, 100841.0, 1276770.0, 2571132.0, 169725.0, 29398.0, 8295.0, 2982.0, 1168.0, 550.0, 273.0, 159.0, 104.0, 55.0, 39.0, 30.0, 18.0, 6.0, 6.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81005859375, -0.7822494506835938, -0.7544403076171875, -0.7266311645507812, -0.698822021484375, -0.6710128784179688, -0.6432037353515625, -0.6153945922851562, -0.58758544921875, -0.5597763061523438, -0.5319671630859375, -0.5041580200195312, -0.476348876953125, -0.44853973388671875, -0.4207305908203125, -0.39292144775390625, -0.3651123046875, -0.33730316162109375, -0.3094940185546875, -0.28168487548828125, -0.253875732421875, -0.22606658935546875, -0.1982574462890625, -0.17044830322265625, -0.14263916015625, -0.11483001708984375, -0.0870208740234375, -0.05921173095703125, -0.031402587890625, -0.00359344482421875, 0.0242156982421875, 0.05202484130859375, 0.079833984375, 0.10764312744140625, 0.1354522705078125, 0.16326141357421875, 0.191070556640625, 0.21887969970703125, 0.2466888427734375, 0.27449798583984375, 0.30230712890625, 0.33011627197265625, 0.3579254150390625, 0.38573455810546875, 0.413543701171875, 0.44135284423828125, 0.4691619873046875, 0.49697113037109375, 0.5247802734375, 0.5525894165039062, 0.5803985595703125, 0.6082077026367188, 0.636016845703125, 0.6638259887695312, 0.6916351318359375, 0.7194442749023438, 0.74725341796875, 0.7750625610351562, 0.8028717041015625, 0.8306808471679688, 0.858489990234375, 0.8862991333007812, 0.9141082763671875, 0.9419174194335938, 0.9697265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 10.0, 5.0, 7.0, 16.0, 10.0, 19.0, 34.0, 44.0, 66.0, 132.0, 288.0, 586.0, 1343.0, 773.0, 320.0, 154.0, 90.0, 49.0, 34.0, 29.0, 17.0, 11.0, 13.0, 7.0, 9.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.75830078125, -0.739654541015625, -0.72100830078125, -0.702362060546875, -0.6837158203125, -0.665069580078125, -0.64642333984375, -0.627777099609375, -0.609130859375, -0.590484619140625, -0.57183837890625, -0.553192138671875, -0.5345458984375, -0.515899658203125, -0.49725341796875, -0.478607177734375, -0.4599609375, -0.441314697265625, -0.42266845703125, -0.404022216796875, -0.3853759765625, -0.366729736328125, -0.34808349609375, -0.329437255859375, -0.310791015625, -0.292144775390625, -0.27349853515625, -0.254852294921875, -0.2362060546875, -0.217559814453125, -0.19891357421875, -0.180267333984375, -0.16162109375, -0.142974853515625, -0.12432861328125, -0.105682373046875, -0.0870361328125, -0.068389892578125, -0.04974365234375, -0.031097412109375, -0.012451171875, 0.006195068359375, 0.02484130859375, 0.043487548828125, 0.0621337890625, 0.080780029296875, 0.09942626953125, 0.118072509765625, 0.13671875, 0.155364990234375, 0.17401123046875, 0.192657470703125, 0.2113037109375, 0.229949951171875, 0.24859619140625, 0.267242431640625, 0.285888671875, 0.304534912109375, 0.32318115234375, 0.341827392578125, 0.3604736328125, 0.379119873046875, 0.39776611328125, 0.416412353515625, 0.43505859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 36.0, 277.0, 529.0, 133.0, 15.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91096830368042, -2.708282709121704, -2.5055973529815674, -2.3029117584228516, -2.100226402282715, -1.897540807723999, -1.6948552131652832, -1.492169737815857, -1.2894842624664307, -1.0867987871170044, -0.8841132521629333, -0.6814277172088623, -0.47874224185943604, -0.27605676651000977, -0.07337117195129395, 0.12931430339813232, 0.3319997787475586, 0.5346852540969849, 0.7373707890510559, 0.940056324005127, 1.1427417993545532, 1.3454272747039795, 1.5481128692626953, 1.7507983446121216, 1.9534838199615479, 2.1561694145202637, 2.3588547706604004, 2.561540365219116, 2.764225959777832, 2.9669113159179688, 3.1695969104766846, 3.3722825050354004, 3.574967384338379, 3.7776529788970947, 3.9803383350372314, 4.183023929595947, 4.385709285736084, 4.588395118713379, 4.791080474853516, 4.993765830993652, 5.196451187133789, 5.399136543273926, 5.601822376251221, 5.804507732391357, 6.007193088531494, 6.209878921508789, 6.412564277648926, 6.6152496337890625, 6.817935466766357, 7.020620822906494, 7.223306655883789, 7.425992012023926, 7.6286773681640625, 7.831362724304199, 8.034048080444336, 8.236734390258789, 8.439419746398926, 8.642105102539062, 8.8447904586792, 9.047475814819336, 9.250162124633789, 9.452847480773926, 9.655532836914062, 9.8582181930542, 10.060903549194336]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 11.0, 13.0, 22.0, 29.0, 32.0, 44.0, 50.0, 51.0, 79.0, 94.0, 84.0, 79.0, 73.0, 61.0, 59.0, 46.0, 44.0, 26.0, 25.0, 14.0, 11.0, 5.0, 3.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.829029083251953, -2.7540111541748047, -2.6789932250976562, -2.603975296020508, -2.5289573669433594, -2.453939437866211, -2.3789215087890625, -2.303903579711914, -2.2288856506347656, -2.153867721557617, -2.0788497924804688, -2.0038318634033203, -1.9288139343261719, -1.8537960052490234, -1.7787781953811646, -1.7037602663040161, -1.6287424564361572, -1.5537245273590088, -1.4787065982818604, -1.403688669204712, -1.3286707401275635, -1.253652811050415, -1.1786350011825562, -1.1036170721054077, -1.0285991430282593, -0.9535812139511108, -0.8785632848739624, -0.8035454154014587, -0.7285274863243103, -0.6535095572471619, -0.5784916877746582, -0.5034737586975098, -0.42845582962036133, -0.3534379005432129, -0.27842000126838684, -0.2034020870923996, -0.12838417291641235, -0.053366243839263916, 0.021651655435562134, 0.09666955471038818, 0.17168748378753662, 0.24670539796352386, 0.3217233121395111, 0.39674121141433716, 0.4717591404914856, 0.546777069568634, 0.6217949390411377, 0.6968128681182861, 0.7718307971954346, 0.846848726272583, 0.9218666553497314, 0.9968845248222351, 1.0719025135040283, 1.1469204425811768, 1.2219382524490356, 1.296956181526184, 1.3719741106033325, 1.446992039680481, 1.5220099687576294, 1.5970278978347778, 1.6720457077026367, 1.7470636367797852, 1.8220815658569336, 1.897099494934082, 1.9721174240112305]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 8.0, 18.0, 30.0, 31.0, 41.0, 52.0, 95.0, 126.0, 205.0, 290.0, 420.0, 591.0, 931.0, 1418.0, 2262.0, 3606.0, 7182.0, 16282.0, 48977.0, 674185.0, 227655.0, 35893.0, 13140.0, 6043.0, 3248.0, 1953.0, 1259.0, 857.0, 562.0, 373.0, 241.0, 172.0, 123.0, 88.0, 50.0, 41.0, 32.0, 23.0, 14.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.525390625, -2.448577880859375, -2.37176513671875, -2.294952392578125, -2.2181396484375, -2.141326904296875, -2.06451416015625, -1.987701416015625, -1.910888671875, -1.834075927734375, -1.75726318359375, -1.680450439453125, -1.6036376953125, -1.526824951171875, -1.45001220703125, -1.373199462890625, -1.29638671875, -1.219573974609375, -1.14276123046875, -1.065948486328125, -0.9891357421875, -0.912322998046875, -0.83551025390625, -0.758697509765625, -0.681884765625, -0.605072021484375, -0.52825927734375, -0.451446533203125, -0.3746337890625, -0.297821044921875, -0.22100830078125, -0.144195556640625, -0.0673828125, 0.009429931640625, 0.08624267578125, 0.163055419921875, 0.2398681640625, 0.316680908203125, 0.39349365234375, 0.470306396484375, 0.547119140625, 0.623931884765625, 0.70074462890625, 0.777557373046875, 0.8543701171875, 0.931182861328125, 1.00799560546875, 1.084808349609375, 1.16162109375, 1.238433837890625, 1.31524658203125, 1.392059326171875, 1.4688720703125, 1.545684814453125, 1.62249755859375, 1.699310302734375, 1.776123046875, 1.852935791015625, 1.92974853515625, 2.006561279296875, 2.0833740234375, 2.160186767578125, 2.23699951171875, 2.313812255859375, 2.390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 10.0, 6.0, 8.0, 20.0, 22.0, 46.0, 69.0, 197.0, 369.0, 76.0, 40.0, 31.0, 26.0, 16.0, 15.0, 5.0, 3.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7911224365234375, -0.769256591796875, -0.7473907470703125, -0.72552490234375, -0.7036590576171875, -0.681793212890625, -0.6599273681640625, -0.6380615234375, -0.6161956787109375, -0.594329833984375, -0.5724639892578125, -0.55059814453125, -0.5287322998046875, -0.506866455078125, -0.4850006103515625, -0.463134765625, -0.4412689208984375, -0.419403076171875, -0.3975372314453125, -0.37567138671875, -0.3538055419921875, -0.331939697265625, -0.3100738525390625, -0.2882080078125, -0.2663421630859375, -0.244476318359375, -0.2226104736328125, -0.20074462890625, -0.1788787841796875, -0.157012939453125, -0.1351470947265625, -0.11328125, -0.0914154052734375, -0.069549560546875, -0.0476837158203125, -0.02581787109375, -0.0039520263671875, 0.017913818359375, 0.0397796630859375, 0.0616455078125, 0.0835113525390625, 0.105377197265625, 0.1272430419921875, 0.14910888671875, 0.1709747314453125, 0.192840576171875, 0.2147064208984375, 0.236572265625, 0.2584381103515625, 0.280303955078125, 0.3021697998046875, 0.32403564453125, 0.3459014892578125, 0.367767333984375, 0.3896331787109375, 0.4114990234375, 0.4333648681640625, 0.455230712890625, 0.4770965576171875, 0.49896240234375, 0.5208282470703125, 0.542694091796875, 0.5645599365234375, 0.58642578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 4.0, 4.0, 9.0, 14.0, 12.0, 27.0, 21.0, 50.0, 68.0, 116.0, 183.0, 293.0, 533.0, 925.0, 1862.0, 3875.0, 8916.0, 23508.0, 73690.0, 298438.0, 459617.0, 118480.0, 35066.0, 12470.0, 5122.0, 2384.0, 1211.0, 615.0, 382.0, 220.0, 129.0, 87.0, 72.0, 40.0, 29.0, 12.0, 22.0, 12.0, 13.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3662109375, -1.323760986328125, -1.28131103515625, -1.238861083984375, -1.1964111328125, -1.153961181640625, -1.11151123046875, -1.069061279296875, -1.026611328125, -0.984161376953125, -0.94171142578125, -0.899261474609375, -0.8568115234375, -0.814361572265625, -0.77191162109375, -0.729461669921875, -0.68701171875, -0.644561767578125, -0.60211181640625, -0.559661865234375, -0.5172119140625, -0.474761962890625, -0.43231201171875, -0.389862060546875, -0.347412109375, -0.304962158203125, -0.26251220703125, -0.220062255859375, -0.1776123046875, -0.135162353515625, -0.09271240234375, -0.050262451171875, -0.0078125, 0.034637451171875, 0.07708740234375, 0.119537353515625, 0.1619873046875, 0.204437255859375, 0.24688720703125, 0.289337158203125, 0.331787109375, 0.374237060546875, 0.41668701171875, 0.459136962890625, 0.5015869140625, 0.544036865234375, 0.58648681640625, 0.628936767578125, 0.67138671875, 0.713836669921875, 0.75628662109375, 0.798736572265625, 0.8411865234375, 0.883636474609375, 0.92608642578125, 0.968536376953125, 1.010986328125, 1.053436279296875, 1.09588623046875, 1.138336181640625, 1.1807861328125, 1.223236083984375, 1.26568603515625, 1.308135986328125, 1.3505859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 6.0, 12.0, 5.0, 5.0, 10.0, 17.0, 21.0, 21.0, 21.0, 24.0, 27.0, 24.0, 36.0, 42.0, 45.0, 38.0, 54.0, 49.0, 41.0, 43.0, 40.0, 43.0, 46.0, 39.0, 43.0, 25.0, 35.0, 23.0, 29.0, 17.0, 13.0, 24.0, 17.0, 14.0, 8.0, 5.0, 8.0, 4.0, 4.0, 4.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.283203125, -2.2099609375, -2.13671875, -2.0634765625, -1.990234375, -1.9169921875, -1.84375, -1.7705078125, -1.697265625, -1.6240234375, -1.55078125, -1.4775390625, -1.404296875, -1.3310546875, -1.2578125, -1.1845703125, -1.111328125, -1.0380859375, -0.96484375, -0.8916015625, -0.818359375, -0.7451171875, -0.671875, -0.5986328125, -0.525390625, -0.4521484375, -0.37890625, -0.3056640625, -0.232421875, -0.1591796875, -0.0859375, -0.0126953125, 0.060546875, 0.1337890625, 0.20703125, 0.2802734375, 0.353515625, 0.4267578125, 0.5, 0.5732421875, 0.646484375, 0.7197265625, 0.79296875, 0.8662109375, 0.939453125, 1.0126953125, 1.0859375, 1.1591796875, 1.232421875, 1.3056640625, 1.37890625, 1.4521484375, 1.525390625, 1.5986328125, 1.671875, 1.7451171875, 1.818359375, 1.8916015625, 1.96484375, 2.0380859375, 2.111328125, 2.1845703125, 2.2578125, 2.3310546875, 2.404296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 8.0, 7.0, 19.0, 27.0, 40.0, 59.0, 113.0, 214.0, 456.0, 1074.0, 3119.0, 12808.0, 154000.0, 829640.0, 37241.0, 6367.0, 1866.0, 736.0, 333.0, 161.0, 88.0, 57.0, 31.0, 28.0, 13.0, 12.0, 6.0, 7.0, 5.0, 4.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.695220947265625, -2.62091064453125, -2.546600341796875, -2.4722900390625, -2.397979736328125, -2.32366943359375, -2.249359130859375, -2.175048828125, -2.100738525390625, -2.02642822265625, -1.952117919921875, -1.8778076171875, -1.803497314453125, -1.72918701171875, -1.654876708984375, -1.58056640625, -1.506256103515625, -1.43194580078125, -1.357635498046875, -1.2833251953125, -1.209014892578125, -1.13470458984375, -1.060394287109375, -0.986083984375, -0.911773681640625, -0.83746337890625, -0.763153076171875, -0.6888427734375, -0.614532470703125, -0.54022216796875, -0.465911865234375, -0.3916015625, -0.317291259765625, -0.24298095703125, -0.168670654296875, -0.0943603515625, -0.020050048828125, 0.05426025390625, 0.128570556640625, 0.202880859375, 0.277191162109375, 0.35150146484375, 0.425811767578125, 0.5001220703125, 0.574432373046875, 0.64874267578125, 0.723052978515625, 0.79736328125, 0.871673583984375, 0.94598388671875, 1.020294189453125, 1.0946044921875, 1.168914794921875, 1.24322509765625, 1.317535400390625, 1.391845703125, 1.466156005859375, 1.54046630859375, 1.614776611328125, 1.6890869140625, 1.763397216796875, 1.83770751953125, 1.912017822265625, 1.986328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 15.0, 5.0, 21.0, 27.0, 28.0, 25.0, 44.0, 49.0, 41.0, 71.0, 76.0, 82.0, 92.0, 67.0, 78.0, 62.0, 48.0, 41.0, 29.0, 26.0, 10.0, 12.0, 18.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.514787673950195e-05, -6.282050162553787e-05, -6.049312651157379e-05, -5.816575139760971e-05, -5.583837628364563e-05, -5.351100116968155e-05, -5.118362605571747e-05, -4.885625094175339e-05, -4.652887582778931e-05, -4.4201500713825226e-05, -4.1874125599861145e-05, -3.9546750485897064e-05, -3.7219375371932983e-05, -3.48920002579689e-05, -3.256462514400482e-05, -3.023725003004074e-05, -2.790987491607666e-05, -2.558249980211258e-05, -2.32551246881485e-05, -2.0927749574184418e-05, -1.8600374460220337e-05, -1.6272999346256256e-05, -1.3945624232292175e-05, -1.1618249118328094e-05, -9.290874004364014e-06, -6.963498890399933e-06, -4.636123776435852e-06, -2.3087486624717712e-06, 1.862645149230957e-08, 2.3460015654563904e-06, 4.673376679420471e-06, 7.000751793384552e-06, 9.328126907348633e-06, 1.1655502021312714e-05, 1.3982877135276794e-05, 1.6310252249240875e-05, 1.8637627363204956e-05, 2.0965002477169037e-05, 2.3292377591133118e-05, 2.56197527050972e-05, 2.794712781906128e-05, 3.027450293302536e-05, 3.260187804698944e-05, 3.492925316095352e-05, 3.72566282749176e-05, 3.958400338888168e-05, 4.1911378502845764e-05, 4.4238753616809845e-05, 4.6566128730773926e-05, 4.8893503844738007e-05, 5.122087895870209e-05, 5.354825407266617e-05, 5.587562918663025e-05, 5.820300430059433e-05, 6.053037941455841e-05, 6.285775452852249e-05, 6.518512964248657e-05, 6.751250475645065e-05, 6.983987987041473e-05, 7.216725498437881e-05, 7.44946300983429e-05, 7.682200521230698e-05, 7.914938032627106e-05, 8.147675544023514e-05, 8.380413055419922e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 10.0, 14.0, 10.0, 17.0, 25.0, 56.0, 64.0, 152.0, 279.0, 535.0, 1157.0, 2961.0, 9262.0, 40738.0, 345895.0, 563456.0, 64250.0, 13084.0, 3813.0, 1452.0, 623.0, 304.0, 154.0, 108.0, 54.0, 36.0, 15.0, 9.0, 9.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4423828125, -1.3960418701171875, -1.349700927734375, -1.3033599853515625, -1.25701904296875, -1.2106781005859375, -1.164337158203125, -1.1179962158203125, -1.0716552734375, -1.0253143310546875, -0.978973388671875, -0.9326324462890625, -0.88629150390625, -0.8399505615234375, -0.793609619140625, -0.7472686767578125, -0.700927734375, -0.6545867919921875, -0.608245849609375, -0.5619049072265625, -0.51556396484375, -0.4692230224609375, -0.422882080078125, -0.3765411376953125, -0.3302001953125, -0.2838592529296875, -0.237518310546875, -0.1911773681640625, -0.14483642578125, -0.0984954833984375, -0.052154541015625, -0.0058135986328125, 0.04052734375, 0.0868682861328125, 0.133209228515625, 0.1795501708984375, 0.22589111328125, 0.2722320556640625, 0.318572998046875, 0.3649139404296875, 0.4112548828125, 0.4575958251953125, 0.503936767578125, 0.5502777099609375, 0.59661865234375, 0.6429595947265625, 0.689300537109375, 0.7356414794921875, 0.781982421875, 0.8283233642578125, 0.874664306640625, 0.9210052490234375, 0.96734619140625, 1.0136871337890625, 1.060028076171875, 1.1063690185546875, 1.1527099609375, 1.1990509033203125, 1.245391845703125, 1.2917327880859375, 1.33807373046875, 1.3844146728515625, 1.430755615234375, 1.4770965576171875, 1.5234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 6.0, 6.0, 11.0, 18.0, 24.0, 41.0, 46.0, 64.0, 81.0, 101.0, 137.0, 118.0, 94.0, 75.0, 51.0, 37.0, 27.0, 15.0, 15.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.57421875, -2.510711669921875, -2.44720458984375, -2.383697509765625, -2.3201904296875, -2.256683349609375, -2.19317626953125, -2.129669189453125, -2.066162109375, -2.002655029296875, -1.93914794921875, -1.875640869140625, -1.8121337890625, -1.748626708984375, -1.68511962890625, -1.621612548828125, -1.55810546875, -1.494598388671875, -1.43109130859375, -1.367584228515625, -1.3040771484375, -1.240570068359375, -1.17706298828125, -1.113555908203125, -1.050048828125, -0.986541748046875, -0.92303466796875, -0.859527587890625, -0.7960205078125, -0.732513427734375, -0.66900634765625, -0.605499267578125, -0.5419921875, -0.478485107421875, -0.41497802734375, -0.351470947265625, -0.2879638671875, -0.224456787109375, -0.16094970703125, -0.097442626953125, -0.033935546875, 0.029571533203125, 0.09307861328125, 0.156585693359375, 0.2200927734375, 0.283599853515625, 0.34710693359375, 0.410614013671875, 0.47412109375, 0.537628173828125, 0.60113525390625, 0.664642333984375, 0.7281494140625, 0.791656494140625, 0.85516357421875, 0.918670654296875, 0.982177734375, 1.045684814453125, 1.10919189453125, 1.172698974609375, 1.2362060546875, 1.299713134765625, 1.36322021484375, 1.426727294921875, 1.490234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 24.0, 81.0, 417.0, 334.0, 82.0, 27.0, 10.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.089799880981445, -27.003108978271484, -25.916419982910156, -24.829729080200195, -23.743038177490234, -22.656349182128906, -21.569658279418945, -20.482967376708984, -19.396278381347656, -18.309587478637695, -17.222898483276367, -16.136207580566406, -15.049517631530762, -13.962827682495117, -12.876136779785156, -11.789446830749512, -10.702756881713867, -9.616066932678223, -8.529376983642578, -7.442686080932617, -6.355996131896973, -5.269306182861328, -4.182615756988525, -3.0959253311157227, -2.009235382080078, -0.9225451946258545, 0.16414499282836914, 1.2508351802825928, 2.3375253677368164, 3.424215316772461, 4.510905742645264, 5.597596168518066, 6.684288024902344, 7.770977973937988, 8.857667922973633, 9.944358825683594, 11.031048774719238, 12.117738723754883, 13.204429626464844, 14.291119575500488, 15.377809524536133, 16.464500427246094, 17.551189422607422, 18.637880325317383, 19.724571228027344, 20.811260223388672, 21.897951126098633, 22.984642028808594, 24.071331024169922, 25.158021926879883, 26.24471092224121, 27.331401824951172, 28.4180908203125, 29.50478172302246, 30.591472625732422, 31.67816162109375, 32.764854431152344, 33.85154342651367, 34.938236236572266, 36.024925231933594, 37.11161422729492, 38.19830322265625, 39.284996032714844, 40.37168502807617, 41.4583740234375]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 19.0, 12.0, 8.0, 16.0, 23.0, 41.0, 93.0, 171.0, 195.0, 174.0, 107.0, 54.0, 27.0, 16.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.53739166259766, -62.71542739868164, -60.89345932006836, -59.071495056152344, -57.24952697753906, -55.42756271362305, -53.60559844970703, -51.78363037109375, -49.96166229248047, -48.13969802856445, -46.31772994995117, -44.495765686035156, -42.673797607421875, -40.85183334350586, -39.029869079589844, -37.20790100097656, -35.38593673706055, -33.56397247314453, -31.74200439453125, -29.920040130615234, -28.098072052001953, -26.276107788085938, -24.45414161682129, -22.63217544555664, -20.810209274291992, -18.988243103027344, -17.166276931762695, -15.344311714172363, -13.522345542907715, -11.700379371643066, -9.878414154052734, -8.056447982788086, -6.2344818115234375, -4.412515640258789, -2.590549945831299, -0.7685842514038086, 1.0533819198608398, 2.8753480911254883, 4.69731330871582, 6.519279479980469, 8.341245651245117, 10.163211822509766, 11.985177993774414, 13.807143211364746, 15.629109382629395, 17.45107650756836, 19.273040771484375, 21.095006942749023, 22.916973114013672, 24.73893928527832, 26.56090545654297, 28.382869720458984, 30.204837799072266, 32.02680206298828, 33.84877014160156, 35.67073440551758, 37.492698669433594, 39.31466293334961, 41.13663101196289, 42.958595275878906, 44.78056335449219, 46.6025276184082, 48.42449188232422, 50.2464599609375, 52.06842803955078]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 11.0, 4.0, 20.0, 24.0, 20.0, 41.0, 40.0, 62.0, 130.0, 210.0, 278.0, 400.0, 664.0, 1275.0, 2497.0, 5657.0, 15710.0, 72005.0, 3618475.0, 423078.0, 36455.0, 9780.0, 3678.0, 1695.0, 900.0, 422.0, 276.0, 175.0, 84.0, 61.0, 48.0, 39.0, 22.0, 19.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3046875, -6.137939453125, -5.97119140625, -5.804443359375, -5.6376953125, -5.470947265625, -5.30419921875, -5.137451171875, -4.970703125, -4.803955078125, -4.63720703125, -4.470458984375, -4.3037109375, -4.136962890625, -3.97021484375, -3.803466796875, -3.63671875, -3.469970703125, -3.30322265625, -3.136474609375, -2.9697265625, -2.802978515625, -2.63623046875, -2.469482421875, -2.302734375, -2.135986328125, -1.96923828125, -1.802490234375, -1.6357421875, -1.468994140625, -1.30224609375, -1.135498046875, -0.96875, -0.802001953125, -0.63525390625, -0.468505859375, -0.3017578125, -0.135009765625, 0.03173828125, 0.198486328125, 0.365234375, 0.531982421875, 0.69873046875, 0.865478515625, 1.0322265625, 1.198974609375, 1.36572265625, 1.532470703125, 1.69921875, 1.865966796875, 2.03271484375, 2.199462890625, 2.3662109375, 2.532958984375, 2.69970703125, 2.866455078125, 3.033203125, 3.199951171875, 3.36669921875, 3.533447265625, 3.7001953125, 3.866943359375, 4.03369140625, 4.200439453125, 4.3671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 1.0, 5.0, 0.0, 6.0, 3.0, 1.0, 8.0, 10.0, 10.0, 12.0, 19.0, 31.0, 49.0, 60.0, 117.0, 208.0, 160.0, 102.0, 58.0, 28.0, 21.0, 20.0, 12.0, 12.0, 8.0, 6.0, 4.0, 6.0, 4.0, 1.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.6103515625, -0.5941734313964844, -0.5779953002929688, -0.5618171691894531, -0.5456390380859375, -0.5294609069824219, -0.5132827758789062, -0.4971046447753906, -0.480926513671875, -0.4647483825683594, -0.44857025146484375, -0.4323921203613281, -0.4162139892578125, -0.4000358581542969, -0.38385772705078125, -0.3676795959472656, -0.35150146484375, -0.3353233337402344, -0.31914520263671875, -0.3029670715332031, -0.2867889404296875, -0.2706108093261719, -0.25443267822265625, -0.23825454711914062, -0.222076416015625, -0.20589828491210938, -0.18972015380859375, -0.17354202270507812, -0.1573638916015625, -0.14118576049804688, -0.12500762939453125, -0.10882949829101562, -0.0926513671875, -0.07647323608398438, -0.06029510498046875, -0.044116973876953125, -0.0279388427734375, -0.011760711669921875, 0.00441741943359375, 0.020595550537109375, 0.036773681640625, 0.052951812744140625, 0.06912994384765625, 0.08530807495117188, 0.1014862060546875, 0.11766433715820312, 0.13384246826171875, 0.15002059936523438, 0.16619873046875, 0.18237686157226562, 0.19855499267578125, 0.21473312377929688, 0.2309112548828125, 0.24708938598632812, 0.26326751708984375, 0.2794456481933594, 0.295623779296875, 0.3118019104003906, 0.32798004150390625, 0.3441581726074219, 0.3603363037109375, 0.3765144348144531, 0.39269256591796875, 0.4088706970214844, 0.425048828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 7.0, 8.0, 15.0, 16.0, 28.0, 64.0, 60.0, 110.0, 158.0, 289.0, 505.0, 1083.0, 2301.0, 5735.0, 17474.0, 87929.0, 1916437.0, 2040931.0, 91572.0, 18318.0, 6083.0, 2490.0, 1201.0, 606.0, 283.0, 186.0, 115.0, 74.0, 61.0, 45.0, 33.0, 15.0, 6.0, 11.0, 5.0, 10.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.1527099609375, -2.072998046875, -1.9932861328125, -1.91357421875, -1.8338623046875, -1.754150390625, -1.6744384765625, -1.5947265625, -1.5150146484375, -1.435302734375, -1.3555908203125, -1.27587890625, -1.1961669921875, -1.116455078125, -1.0367431640625, -0.95703125, -0.8773193359375, -0.797607421875, -0.7178955078125, -0.63818359375, -0.5584716796875, -0.478759765625, -0.3990478515625, -0.3193359375, -0.2396240234375, -0.159912109375, -0.0802001953125, -0.00048828125, 0.0792236328125, 0.158935546875, 0.2386474609375, 0.318359375, 0.3980712890625, 0.477783203125, 0.5574951171875, 0.63720703125, 0.7169189453125, 0.796630859375, 0.8763427734375, 0.9560546875, 1.0357666015625, 1.115478515625, 1.1951904296875, 1.27490234375, 1.3546142578125, 1.434326171875, 1.5140380859375, 1.59375, 1.6734619140625, 1.753173828125, 1.8328857421875, 1.91259765625, 1.9923095703125, 2.072021484375, 2.1517333984375, 2.2314453125, 2.3111572265625, 2.390869140625, 2.4705810546875, 2.55029296875, 2.6300048828125, 2.709716796875, 2.7894287109375, 2.869140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 11.0, 16.0, 11.0, 29.0, 47.0, 45.0, 90.0, 149.0, 306.0, 576.0, 1175.0, 737.0, 345.0, 176.0, 92.0, 71.0, 46.0, 32.0, 21.0, 12.0, 12.0, 9.0, 13.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.5625534057617188, -0.5435638427734375, -0.5245742797851562, -0.505584716796875, -0.48659515380859375, -0.4676055908203125, -0.44861602783203125, -0.42962646484375, -0.41063690185546875, -0.3916473388671875, -0.37265777587890625, -0.353668212890625, -0.33467864990234375, -0.3156890869140625, -0.29669952392578125, -0.2777099609375, -0.25872039794921875, -0.2397308349609375, -0.22074127197265625, -0.201751708984375, -0.18276214599609375, -0.1637725830078125, -0.14478302001953125, -0.12579345703125, -0.10680389404296875, -0.0878143310546875, -0.06882476806640625, -0.049835205078125, -0.03084564208984375, -0.0118560791015625, 0.00713348388671875, 0.026123046875, 0.04511260986328125, 0.0641021728515625, 0.08309173583984375, 0.102081298828125, 0.12107086181640625, 0.1400604248046875, 0.15904998779296875, 0.17803955078125, 0.19702911376953125, 0.2160186767578125, 0.23500823974609375, 0.253997802734375, 0.27298736572265625, 0.2919769287109375, 0.31096649169921875, 0.3299560546875, 0.34894561767578125, 0.3679351806640625, 0.38692474365234375, 0.405914306640625, 0.42490386962890625, 0.4438934326171875, 0.46288299560546875, 0.48187255859375, 0.5008621215820312, 0.5198516845703125, 0.5388412475585938, 0.557830810546875, 0.5768203735351562, 0.5958099365234375, 0.6147994995117188, 0.6337890625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 36.0, 116.0, 283.0, 299.0, 169.0, 45.0, 17.0, 6.0, 3.0, 2.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1349658966064453, -1.9947179555892944, -1.854469895362854, -1.7142219543457031, -1.5739738941192627, -1.4337259531021118, -1.293478012084961, -1.1532299518585205, -1.0129820108413696, -0.872734010219574, -0.7324860095977783, -0.5922380685806274, -0.4519900679588318, -0.31174206733703613, -0.17149412631988525, -0.0312461256980896, 0.10900187492370605, 0.24924986064434052, 0.389497846364975, 0.5297458171844482, 0.6699938178062439, 0.8102418184280396, 0.9504897594451904, 1.0907378196716309, 1.2309857606887817, 1.3712337017059326, 1.511481761932373, 1.651729702949524, 1.7919776439666748, 1.9322257041931152, 2.0724735260009766, 2.212721586227417, 2.3529696464538574, 2.493217706680298, 2.633465528488159, 2.7737135887145996, 2.91396164894104, 3.0542097091674805, 3.194457530975342, 3.3347055912017822, 3.4749536514282227, 3.615201711654663, 3.7554495334625244, 3.895697593688965, 4.035945415496826, 4.176193714141846, 4.316441535949707, 4.456689357757568, 4.59693717956543, 4.737185001373291, 4.8774333000183105, 5.017681121826172, 5.157928943634033, 5.298177242279053, 5.438425064086914, 5.578672885894775, 5.718921184539795, 5.859169006347656, 5.999417304992676, 6.139665126800537, 6.279912948608398, 6.420161247253418, 6.560409069061279, 6.700656890869141, 6.84090518951416]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 6.0, 11.0, 6.0, 16.0, 38.0, 44.0, 66.0, 81.0, 94.0, 130.0, 130.0, 94.0, 91.0, 58.0, 31.0, 32.0, 23.0, 14.0, 3.0, 5.0, 7.0, 8.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7223267555236816, -3.589586019515991, -3.456845283508301, -3.3241047859191895, -3.191364049911499, -3.0586233139038086, -2.925882577896118, -2.7931418418884277, -2.6604013442993164, -2.527660608291626, -2.3949198722839355, -2.262179374694824, -2.129438638687134, -1.9966979026794434, -1.863957166671753, -1.7312164306640625, -1.598475694656372, -1.4657349586486816, -1.3329943418502808, -1.2002536058425903, -1.0675129890441895, -0.934772253036499, -0.8020315170288086, -0.6692908406257629, -0.5365501642227173, -0.40380948781967163, -0.2710687816143036, -0.13832807540893555, -0.005587399005889893, 0.12715327739715576, 0.2598940134048462, 0.39263468980789185, 0.5253753662109375, 0.6581160426139832, 0.7908567190170288, 0.9235974550247192, 1.0563380718231201, 1.1890788078308105, 1.321819543838501, 1.4545602798461914, 1.5873008966445923, 1.7200416326522827, 1.8527822494506836, 1.985522985458374, 2.1182637214660645, 2.251004219055176, 2.3837451934814453, 2.5164856910705566, 2.649226427078247, 2.7819671630859375, 2.914707899093628, 3.0474486351013184, 3.1801891326904297, 3.31292986869812, 3.4456706047058105, 3.578411340713501, 3.7111520767211914, 3.843892812728882, 3.9766335487365723, 4.109374046325684, 4.242115020751953, 4.3748555183410645, 4.507596015930176, 4.640336990356445, 4.773077487945557]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 3.0, 2.0, 3.0, 13.0, 16.0, 13.0, 22.0, 17.0, 48.0, 61.0, 76.0, 130.0, 162.0, 258.0, 368.0, 579.0, 820.0, 1355.0, 2173.0, 3697.0, 6981.0, 13858.0, 34075.0, 129454.0, 630953.0, 153328.0, 37518.0, 15031.0, 7370.0, 3888.0, 2207.0, 1392.0, 854.0, 562.0, 429.0, 245.0, 181.0, 125.0, 80.0, 61.0, 43.0, 31.0, 23.0, 13.0, 16.0, 6.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9287109375, -1.8675689697265625, -1.806427001953125, -1.7452850341796875, -1.68414306640625, -1.6230010986328125, -1.561859130859375, -1.5007171630859375, -1.4395751953125, -1.3784332275390625, -1.317291259765625, -1.2561492919921875, -1.19500732421875, -1.1338653564453125, -1.072723388671875, -1.0115814208984375, -0.950439453125, -0.8892974853515625, -0.828155517578125, -0.7670135498046875, -0.70587158203125, -0.6447296142578125, -0.583587646484375, -0.5224456787109375, -0.4613037109375, -0.4001617431640625, -0.339019775390625, -0.2778778076171875, -0.21673583984375, -0.1555938720703125, -0.094451904296875, -0.0333099365234375, 0.02783203125, 0.0889739990234375, 0.150115966796875, 0.2112579345703125, 0.27239990234375, 0.3335418701171875, 0.394683837890625, 0.4558258056640625, 0.5169677734375, 0.5781097412109375, 0.639251708984375, 0.7003936767578125, 0.76153564453125, 0.8226776123046875, 0.883819580078125, 0.9449615478515625, 1.006103515625, 1.0672454833984375, 1.128387451171875, 1.1895294189453125, 1.25067138671875, 1.3118133544921875, 1.372955322265625, 1.4340972900390625, 1.4952392578125, 1.5563812255859375, 1.617523193359375, 1.6786651611328125, 1.73980712890625, 1.8009490966796875, 1.862091064453125, 1.9232330322265625, 1.984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 8.0, 8.0, 7.0, 8.0, 12.0, 20.0, 27.0, 27.0, 46.0, 68.0, 117.0, 180.0, 153.0, 104.0, 60.0, 35.0, 21.0, 17.0, 16.0, 16.0, 6.0, 8.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.499267578125, -0.4853019714355469, -0.47133636474609375, -0.4573707580566406, -0.4434051513671875, -0.4294395446777344, -0.41547393798828125, -0.4015083312988281, -0.387542724609375, -0.3735771179199219, -0.35961151123046875, -0.3456459045410156, -0.3316802978515625, -0.3177146911621094, -0.30374908447265625, -0.2897834777832031, -0.27581787109375, -0.2618522644042969, -0.24788665771484375, -0.23392105102539062, -0.2199554443359375, -0.20598983764648438, -0.19202423095703125, -0.17805862426757812, -0.164093017578125, -0.15012741088867188, -0.13616180419921875, -0.12219619750976562, -0.1082305908203125, -0.09426498413085938, -0.08029937744140625, -0.06633377075195312, -0.0523681640625, -0.038402557373046875, -0.02443695068359375, -0.010471343994140625, 0.0034942626953125, 0.017459869384765625, 0.03142547607421875, 0.045391082763671875, 0.059356689453125, 0.07332229614257812, 0.08728790283203125, 0.10125350952148438, 0.1152191162109375, 0.12918472290039062, 0.14315032958984375, 0.15711593627929688, 0.17108154296875, 0.18504714965820312, 0.19901275634765625, 0.21297836303710938, 0.2269439697265625, 0.24090957641601562, 0.25487518310546875, 0.2688407897949219, 0.282806396484375, 0.2967720031738281, 0.31073760986328125, 0.3247032165527344, 0.3386688232421875, 0.3526344299316406, 0.36660003662109375, 0.3805656433105469, 0.39453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 32.0, 69.0, 165.0, 558.0, 2263.0, 14435.0, 171626.0, 777534.0, 71519.0, 8127.0, 1534.0, 396.0, 150.0, 58.0, 31.0, 7.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.396484375, -3.310150146484375, -3.22381591796875, -3.137481689453125, -3.0511474609375, -2.964813232421875, -2.87847900390625, -2.792144775390625, -2.705810546875, -2.619476318359375, -2.53314208984375, -2.446807861328125, -2.3604736328125, -2.274139404296875, -2.18780517578125, -2.101470947265625, -2.01513671875, -1.928802490234375, -1.84246826171875, -1.756134033203125, -1.6697998046875, -1.583465576171875, -1.49713134765625, -1.410797119140625, -1.324462890625, -1.238128662109375, -1.15179443359375, -1.065460205078125, -0.9791259765625, -0.892791748046875, -0.80645751953125, -0.720123291015625, -0.6337890625, -0.547454833984375, -0.46112060546875, -0.374786376953125, -0.2884521484375, -0.202117919921875, -0.11578369140625, -0.029449462890625, 0.056884765625, 0.143218994140625, 0.22955322265625, 0.315887451171875, 0.4022216796875, 0.488555908203125, 0.57489013671875, 0.661224365234375, 0.74755859375, 0.833892822265625, 0.92022705078125, 1.006561279296875, 1.0928955078125, 1.179229736328125, 1.26556396484375, 1.351898193359375, 1.438232421875, 1.524566650390625, 1.61090087890625, 1.697235107421875, 1.7835693359375, 1.869903564453125, 1.95623779296875, 2.042572021484375, 2.12890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 4.0, 3.0, 7.0, 7.0, 5.0, 8.0, 12.0, 12.0, 23.0, 16.0, 22.0, 20.0, 31.0, 29.0, 50.0, 32.0, 40.0, 45.0, 46.0, 40.0, 46.0, 53.0, 52.0, 34.0, 33.0, 37.0, 37.0, 34.0, 26.0, 30.0, 31.0, 21.0, 19.0, 16.0, 14.0, 9.0, 11.0, 15.0, 9.0, 7.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.228515625, -1.186553955078125, -1.14459228515625, -1.102630615234375, -1.0606689453125, -1.018707275390625, -0.97674560546875, -0.934783935546875, -0.892822265625, -0.850860595703125, -0.80889892578125, -0.766937255859375, -0.7249755859375, -0.683013916015625, -0.64105224609375, -0.599090576171875, -0.55712890625, -0.515167236328125, -0.47320556640625, -0.431243896484375, -0.3892822265625, -0.347320556640625, -0.30535888671875, -0.263397216796875, -0.221435546875, -0.179473876953125, -0.13751220703125, -0.095550537109375, -0.0535888671875, -0.011627197265625, 0.03033447265625, 0.072296142578125, 0.1142578125, 0.156219482421875, 0.19818115234375, 0.240142822265625, 0.2821044921875, 0.324066162109375, 0.36602783203125, 0.407989501953125, 0.449951171875, 0.491912841796875, 0.53387451171875, 0.575836181640625, 0.6177978515625, 0.659759521484375, 0.70172119140625, 0.743682861328125, 0.78564453125, 0.827606201171875, 0.86956787109375, 0.911529541015625, 0.9534912109375, 0.995452880859375, 1.03741455078125, 1.079376220703125, 1.121337890625, 1.163299560546875, 1.20526123046875, 1.247222900390625, 1.2891845703125, 1.331146240234375, 1.37310791015625, 1.415069580078125, 1.45703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 8.0, 4.0, 17.0, 18.0, 35.0, 46.0, 78.0, 168.0, 351.0, 1036.0, 4817.0, 133220.0, 893948.0, 12013.0, 1765.0, 503.0, 212.0, 109.0, 66.0, 46.0, 25.0, 19.0, 11.0, 9.0, 6.0, 4.0, 3.0, 1.0, 7.0, 1.0, 0.0, 3.0], "bins": [-7.7265625, -7.5517578125, -7.376953125, -7.2021484375, -7.02734375, -6.8525390625, -6.677734375, -6.5029296875, -6.328125, -6.1533203125, -5.978515625, -5.8037109375, -5.62890625, -5.4541015625, -5.279296875, -5.1044921875, -4.9296875, -4.7548828125, -4.580078125, -4.4052734375, -4.23046875, -4.0556640625, -3.880859375, -3.7060546875, -3.53125, -3.3564453125, -3.181640625, -3.0068359375, -2.83203125, -2.6572265625, -2.482421875, -2.3076171875, -2.1328125, -1.9580078125, -1.783203125, -1.6083984375, -1.43359375, -1.2587890625, -1.083984375, -0.9091796875, -0.734375, -0.5595703125, -0.384765625, -0.2099609375, -0.03515625, 0.1396484375, 0.314453125, 0.4892578125, 0.6640625, 0.8388671875, 1.013671875, 1.1884765625, 1.36328125, 1.5380859375, 1.712890625, 1.8876953125, 2.0625, 2.2373046875, 2.412109375, 2.5869140625, 2.76171875, 2.9365234375, 3.111328125, 3.2861328125, 3.4609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 8.0, 24.0, 38.0, 76.0, 144.0, 224.0, 185.0, 125.0, 59.0, 38.0, 18.0, 14.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019049644470214844, -0.00018431991338729858, -0.00017814338207244873, -0.00017196685075759888, -0.00016579031944274902, -0.00015961378812789917, -0.00015343725681304932, -0.00014726072549819946, -0.0001410841941833496, -0.00013490766286849976, -0.0001287311315536499, -0.00012255460023880005, -0.0001163780689239502, -0.00011020153760910034, -0.00010402500629425049, -9.784847497940063e-05, -9.167194366455078e-05, -8.549541234970093e-05, -7.931888103485107e-05, -7.314234972000122e-05, -6.696581840515137e-05, -6.0789287090301514e-05, -5.461275577545166e-05, -4.843622446060181e-05, -4.225969314575195e-05, -3.60831618309021e-05, -2.9906630516052246e-05, -2.3730099201202393e-05, -1.755356788635254e-05, -1.1377036571502686e-05, -5.200505256652832e-06, 9.760260581970215e-07, 7.152557373046875e-06, 1.3329088687896729e-05, 1.9505620002746582e-05, 2.5682151317596436e-05, 3.185868263244629e-05, 3.803521394729614e-05, 4.4211745262145996e-05, 5.038827657699585e-05, 5.65648078918457e-05, 6.274133920669556e-05, 6.891787052154541e-05, 7.509440183639526e-05, 8.127093315124512e-05, 8.744746446609497e-05, 9.362399578094482e-05, 9.980052709579468e-05, 0.00010597705841064453, 0.00011215358972549438, 0.00011833012104034424, 0.0001245066523551941, 0.00013068318367004395, 0.0001368597149848938, 0.00014303624629974365, 0.0001492127776145935, 0.00015538930892944336, 0.0001615658402442932, 0.00016774237155914307, 0.00017391890287399292, 0.00018009543418884277, 0.00018627196550369263, 0.00019244849681854248, 0.00019862502813339233, 0.0002048015594482422]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 10.0, 19.0, 20.0, 36.0, 56.0, 100.0, 175.0, 297.0, 576.0, 1327.0, 3014.0, 10339.0, 57419.0, 555265.0, 370172.0, 38149.0, 7525.0, 2187.0, 892.0, 409.0, 215.0, 126.0, 85.0, 37.0, 23.0, 18.0, 11.0, 12.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.73248291015625, -1.6680908203125, -1.60369873046875, -1.539306640625, -1.47491455078125, -1.4105224609375, -1.34613037109375, -1.28173828125, -1.21734619140625, -1.1529541015625, -1.08856201171875, -1.024169921875, -0.95977783203125, -0.8953857421875, -0.83099365234375, -0.7666015625, -0.70220947265625, -0.6378173828125, -0.57342529296875, -0.509033203125, -0.44464111328125, -0.3802490234375, -0.31585693359375, -0.25146484375, -0.18707275390625, -0.1226806640625, -0.05828857421875, 0.006103515625, 0.07049560546875, 0.1348876953125, 0.19927978515625, 0.263671875, 0.32806396484375, 0.3924560546875, 0.45684814453125, 0.521240234375, 0.58563232421875, 0.6500244140625, 0.71441650390625, 0.77880859375, 0.84320068359375, 0.9075927734375, 0.97198486328125, 1.036376953125, 1.10076904296875, 1.1651611328125, 1.22955322265625, 1.2939453125, 1.35833740234375, 1.4227294921875, 1.48712158203125, 1.551513671875, 1.61590576171875, 1.6802978515625, 1.74468994140625, 1.80908203125, 1.87347412109375, 1.9378662109375, 2.00225830078125, 2.066650390625, 2.13104248046875, 2.1954345703125, 2.25982666015625, 2.32421875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 11.0, 20.0, 14.0, 49.0, 54.0, 67.0, 102.0, 161.0, 189.0, 100.0, 63.0, 46.0, 34.0, 31.0, 18.0, 11.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.042083740234375, -1.96697998046875, -1.891876220703125, -1.8167724609375, -1.741668701171875, -1.66656494140625, -1.591461181640625, -1.516357421875, -1.441253662109375, -1.36614990234375, -1.291046142578125, -1.2159423828125, -1.140838623046875, -1.06573486328125, -0.990631103515625, -0.91552734375, -0.840423583984375, -0.76531982421875, -0.690216064453125, -0.6151123046875, -0.540008544921875, -0.46490478515625, -0.389801025390625, -0.314697265625, -0.239593505859375, -0.16448974609375, -0.089385986328125, -0.0142822265625, 0.060821533203125, 0.13592529296875, 0.211029052734375, 0.2861328125, 0.361236572265625, 0.43634033203125, 0.511444091796875, 0.5865478515625, 0.661651611328125, 0.73675537109375, 0.811859130859375, 0.886962890625, 0.962066650390625, 1.03717041015625, 1.112274169921875, 1.1873779296875, 1.262481689453125, 1.33758544921875, 1.412689208984375, 1.48779296875, 1.562896728515625, 1.63800048828125, 1.713104248046875, 1.7882080078125, 1.863311767578125, 1.93841552734375, 2.013519287109375, 2.088623046875, 2.163726806640625, 2.23883056640625, 2.313934326171875, 2.3890380859375, 2.464141845703125, 2.53924560546875, 2.614349365234375, 2.689453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 15.0, 63.0, 465.0, 391.0, 44.0, 14.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.818442344665527, -10.637960433959961, -9.457478523254395, -8.276996612548828, -7.09651517868042, -5.9160332679748535, -4.735551834106445, -3.555069923400879, -2.3745880126953125, -1.1941062211990356, -0.013624429702758789, 1.1668572425842285, 2.347339153289795, 3.5278210639953613, 4.7083024978637695, 5.888784408569336, 7.069266319274902, 8.249748229980469, 9.430230140686035, 10.610712051391602, 11.791193008422852, 12.971675872802734, 14.152156829833984, 15.33263874053955, 16.513120651245117, 17.693601608276367, 18.87408447265625, 20.0545654296875, 21.235048294067383, 22.415529251098633, 23.596012115478516, 24.776493072509766, 25.956974029541016, 27.137454986572266, 28.31793785095215, 29.4984188079834, 30.67890167236328, 31.85938262939453, 33.03986358642578, 34.22034454345703, 35.40082931518555, 36.5813102722168, 37.76179122924805, 38.94227600097656, 40.12275695800781, 41.30323791503906, 42.48371887207031, 43.66419982910156, 44.84468078613281, 46.02516174316406, 47.20564270019531, 48.38612747192383, 49.56660842895508, 50.74708938598633, 51.92757034301758, 53.108055114746094, 54.288536071777344, 55.469017028808594, 56.649497985839844, 57.82998275756836, 59.01046371459961, 60.19094467163086, 61.37142562866211, 62.551910400390625, 63.732391357421875]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 5.0, 3.0, 7.0, 9.0, 13.0, 14.0, 12.0, 20.0, 24.0, 42.0, 47.0, 63.0, 81.0, 75.0, 87.0, 73.0, 73.0, 62.0, 67.0, 46.0, 43.0, 30.0, 19.0, 17.0, 13.0, 11.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.340595245361328, -14.84911823272705, -14.357641220092773, -13.866165161132812, -13.374688148498535, -12.883211135864258, -12.391735076904297, -11.90025806427002, -11.408781051635742, -10.917304039001465, -10.425827026367188, -9.934350967407227, -9.44287395477295, -8.951396942138672, -8.459920883178711, -7.968443870544434, -7.476966857910156, -6.985489845275879, -6.49401330947876, -6.002536773681641, -5.511059761047363, -5.019582748413086, -4.528106212615967, -4.036629676818848, -3.5451526641845703, -3.053675889968872, -2.562199115753174, -2.0707223415374756, -1.5792455673217773, -1.087768793106079, -0.5962920188903809, -0.10481524467468262, 0.3866615295410156, 0.8781383037567139, 1.369615077972412, 1.8610918521881104, 2.3525686264038086, 2.844045400619507, 3.335522174835205, 3.8269989490509033, 4.318475723266602, 4.809952735900879, 5.301429271697998, 5.792905807495117, 6.2843828201293945, 6.775859832763672, 7.267336368560791, 7.75881290435791, 8.250289916992188, 8.741766929626465, 9.233243942260742, 9.724720001220703, 10.21619701385498, 10.707674026489258, 11.199150085449219, 11.690627098083496, 12.182104110717773, 12.67358112335205, 13.165058135986328, 13.656534194946289, 14.148011207580566, 14.639488220214844, 15.130964279174805, 15.622441291809082, 16.11391830444336]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 1.0, 8.0, 11.0, 22.0, 11.0, 13.0, 29.0, 48.0, 58.0, 64.0, 93.0, 93.0, 140.0, 151.0, 231.0, 374.0, 586.0, 844.0, 1299.0, 2193.0, 3881.0, 8290.0, 24002.0, 174148.0, 3826781.0, 114164.0, 20077.0, 7513.0, 3502.0, 1965.0, 1206.0, 712.0, 516.0, 375.0, 227.0, 155.0, 119.0, 76.0, 67.0, 42.0, 57.0, 29.0, 25.0, 26.0, 16.0, 11.0, 5.0, 9.0, 7.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.359375, -5.19903564453125, -5.0386962890625, -4.87835693359375, -4.718017578125, -4.55767822265625, -4.3973388671875, -4.23699951171875, -4.07666015625, -3.91632080078125, -3.7559814453125, -3.59564208984375, -3.435302734375, -3.27496337890625, -3.1146240234375, -2.95428466796875, -2.7939453125, -2.63360595703125, -2.4732666015625, -2.31292724609375, -2.152587890625, -1.99224853515625, -1.8319091796875, -1.67156982421875, -1.51123046875, -1.35089111328125, -1.1905517578125, -1.03021240234375, -0.869873046875, -0.70953369140625, -0.5491943359375, -0.38885498046875, -0.228515625, -0.06817626953125, 0.0921630859375, 0.25250244140625, 0.412841796875, 0.57318115234375, 0.7335205078125, 0.89385986328125, 1.05419921875, 1.21453857421875, 1.3748779296875, 1.53521728515625, 1.695556640625, 1.85589599609375, 2.0162353515625, 2.17657470703125, 2.3369140625, 2.49725341796875, 2.6575927734375, 2.81793212890625, 2.978271484375, 3.13861083984375, 3.2989501953125, 3.45928955078125, 3.61962890625, 3.77996826171875, 3.9403076171875, 4.10064697265625, 4.260986328125, 4.42132568359375, 4.5816650390625, 4.74200439453125, 4.90234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 11.0, 9.0, 9.0, 16.0, 14.0, 25.0, 26.0, 38.0, 57.0, 104.0, 137.0, 158.0, 111.0, 83.0, 53.0, 36.0, 28.0, 17.0, 15.0, 14.0, 6.0, 6.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765625, -0.46221160888671875, -0.4478607177734375, -0.43350982666015625, -0.419158935546875, -0.40480804443359375, -0.3904571533203125, -0.37610626220703125, -0.36175537109375, -0.34740447998046875, -0.3330535888671875, -0.31870269775390625, -0.304351806640625, -0.29000091552734375, -0.2756500244140625, -0.26129913330078125, -0.2469482421875, -0.23259735107421875, -0.2182464599609375, -0.20389556884765625, -0.189544677734375, -0.17519378662109375, -0.1608428955078125, -0.14649200439453125, -0.13214111328125, -0.11779022216796875, -0.1034393310546875, -0.08908843994140625, -0.074737548828125, -0.06038665771484375, -0.0460357666015625, -0.03168487548828125, -0.017333984375, -0.00298309326171875, 0.0113677978515625, 0.02571868896484375, 0.040069580078125, 0.05442047119140625, 0.0687713623046875, 0.08312225341796875, 0.09747314453125, 0.11182403564453125, 0.1261749267578125, 0.14052581787109375, 0.154876708984375, 0.16922760009765625, 0.1835784912109375, 0.19792938232421875, 0.2122802734375, 0.22663116455078125, 0.2409820556640625, 0.25533294677734375, 0.269683837890625, 0.28403472900390625, 0.2983856201171875, 0.31273651123046875, 0.32708740234375, 0.34143829345703125, 0.3557891845703125, 0.37014007568359375, 0.384490966796875, 0.39884185791015625, 0.4131927490234375, 0.42754364013671875, 0.44189453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 7.0, 3.0, 5.0, 4.0, 8.0, 8.0, 13.0, 25.0, 41.0, 70.0, 133.0, 347.0, 1537.0, 12967.0, 3714787.0, 455409.0, 7208.0, 1110.0, 326.0, 113.0, 59.0, 31.0, 9.0, 11.0, 13.0, 8.0, 4.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-10.6171875, -10.3636474609375, -10.110107421875, -9.8565673828125, -9.60302734375, -9.3494873046875, -9.095947265625, -8.8424072265625, -8.5888671875, -8.3353271484375, -8.081787109375, -7.8282470703125, -7.57470703125, -7.3211669921875, -7.067626953125, -6.8140869140625, -6.560546875, -6.3070068359375, -6.053466796875, -5.7999267578125, -5.54638671875, -5.2928466796875, -5.039306640625, -4.7857666015625, -4.5322265625, -4.2786865234375, -4.025146484375, -3.7716064453125, -3.51806640625, -3.2645263671875, -3.010986328125, -2.7574462890625, -2.50390625, -2.2503662109375, -1.996826171875, -1.7432861328125, -1.48974609375, -1.2362060546875, -0.982666015625, -0.7291259765625, -0.4755859375, -0.2220458984375, 0.031494140625, 0.2850341796875, 0.53857421875, 0.7921142578125, 1.045654296875, 1.2991943359375, 1.552734375, 1.8062744140625, 2.059814453125, 2.3133544921875, 2.56689453125, 2.8204345703125, 3.073974609375, 3.3275146484375, 3.5810546875, 3.8345947265625, 4.088134765625, 4.3416748046875, 4.59521484375, 4.8487548828125, 5.102294921875, 5.3558349609375, 5.609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 5.0, 11.0, 7.0, 13.0, 25.0, 39.0, 63.0, 117.0, 259.0, 491.0, 1451.0, 802.0, 312.0, 168.0, 109.0, 55.0, 33.0, 24.0, 17.0, 14.0, 5.0, 3.0, 9.0, 1.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49609375, -0.47521209716796875, -0.4543304443359375, -0.43344879150390625, -0.412567138671875, -0.39168548583984375, -0.3708038330078125, -0.34992218017578125, -0.32904052734375, -0.30815887451171875, -0.2872772216796875, -0.26639556884765625, -0.245513916015625, -0.22463226318359375, -0.2037506103515625, -0.18286895751953125, -0.1619873046875, -0.14110565185546875, -0.1202239990234375, -0.09934234619140625, -0.078460693359375, -0.05757904052734375, -0.0366973876953125, -0.01581573486328125, 0.00506591796875, 0.02594757080078125, 0.0468292236328125, 0.06771087646484375, 0.088592529296875, 0.10947418212890625, 0.1303558349609375, 0.15123748779296875, 0.172119140625, 0.19300079345703125, 0.2138824462890625, 0.23476409912109375, 0.255645751953125, 0.27652740478515625, 0.2974090576171875, 0.31829071044921875, 0.33917236328125, 0.36005401611328125, 0.3809356689453125, 0.40181732177734375, 0.422698974609375, 0.44358062744140625, 0.4644622802734375, 0.48534393310546875, 0.5062255859375, 0.5271072387695312, 0.5479888916015625, 0.5688705444335938, 0.589752197265625, 0.6106338500976562, 0.6315155029296875, 0.6523971557617188, 0.67327880859375, 0.6941604614257812, 0.7150421142578125, 0.7359237670898438, 0.756805419921875, 0.7776870727539062, 0.7985687255859375, 0.8194503784179688, 0.84033203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 16.0, 50.0, 166.0, 319.0, 272.0, 105.0, 43.0, 19.0, 7.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.305271148681641, -5.1436662673950195, -4.98206090927124, -4.820456027984619, -4.658851146697998, -4.497245788574219, -4.335640907287598, -4.174036026000977, -4.0124311447143555, -3.8508260250091553, -3.689221143722534, -3.527616024017334, -3.366011142730713, -3.2044060230255127, -3.0428009033203125, -2.8811960220336914, -2.719590663909912, -2.557985544204712, -2.396380662918091, -2.2347755432128906, -2.0731706619262695, -1.9115655422210693, -1.7499604225158691, -1.5883554220199585, -1.4267504215240479, -1.2651454210281372, -1.1035404205322266, -0.9419353008270264, -0.7803303003311157, -0.6187252998352051, -0.45712023973464966, -0.29551517963409424, -0.1339106559753418, 0.027694374322891235, 0.18929940462112427, 0.3509044349193573, 0.5125094652175903, 0.674114465713501, 0.8357195258140564, 0.9973245859146118, 1.1589295864105225, 1.320534586906433, 1.4821395874023438, 1.643744707107544, 1.8053497076034546, 1.9669547080993652, 2.1285598278045654, 2.2901649475097656, 2.4517698287963867, 2.613374948501587, 2.774979829788208, 2.936584949493408, 3.0981898307800293, 3.2597949504852295, 3.4214000701904297, 3.583004951477051, 3.744610071182251, 3.906215190887451, 4.067820072174072, 4.229424953460693, 4.391030311584473, 4.552635192871094, 4.714240074157715, 4.875845432281494, 5.037450313568115]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 9.0, 14.0, 22.0, 36.0, 36.0, 51.0, 61.0, 67.0, 74.0, 92.0, 80.0, 84.0, 62.0, 53.0, 47.0, 38.0, 35.0, 34.0, 17.0, 13.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.89243745803833, -2.798994779586792, -2.705552339553833, -2.612109661102295, -2.518667221069336, -2.425224542617798, -2.3317818641662598, -2.238339424133301, -2.1448967456817627, -2.0514540672302246, -1.9580116271972656, -1.8645689487457275, -1.771126389503479, -1.6776838302612305, -1.5842411518096924, -1.4907985925674438, -1.3973560333251953, -1.3039134740829468, -1.2104709148406982, -1.1170282363891602, -1.0235856771469116, -0.9301431179046631, -0.8367004990577698, -0.7432578802108765, -0.6498153209686279, -0.5563727617263794, -0.4629301428794861, -0.36948755383491516, -0.27604496479034424, -0.18260237574577332, -0.08915978670120239, 0.004282832145690918, 0.09772539138793945, 0.19116798043251038, 0.2846105694770813, 0.3780531585216522, 0.47149574756622314, 0.5649383068084717, 0.658380925655365, 0.7518235445022583, 0.8452661037445068, 0.9387086629867554, 1.032151222229004, 1.125593900680542, 1.2190364599227905, 1.312479019165039, 1.4059216976165771, 1.4993642568588257, 1.5928068161010742, 1.6862493753433228, 1.7796919345855713, 1.8731346130371094, 1.966577172279358, 2.0600197315216064, 2.1534624099731445, 2.2469048500061035, 2.3403475284576416, 2.4337902069091797, 2.5272326469421387, 2.6206753253936768, 2.714118003845215, 2.807560443878174, 2.901003122329712, 2.99444580078125, 3.087888240814209]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 2.0, 7.0, 7.0, 8.0, 8.0, 8.0, 13.0, 8.0, 21.0, 29.0, 56.0, 85.0, 157.0, 437.0, 1819.0, 16944.0, 927069.0, 96408.0, 4089.0, 796.0, 255.0, 98.0, 58.0, 42.0, 33.0, 19.0, 11.0, 12.0, 11.0, 6.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8515625, -8.58905029296875, -8.3265380859375, -8.06402587890625, -7.801513671875, -7.53900146484375, -7.2764892578125, -7.01397705078125, -6.75146484375, -6.48895263671875, -6.2264404296875, -5.96392822265625, -5.701416015625, -5.43890380859375, -5.1763916015625, -4.91387939453125, -4.6513671875, -4.38885498046875, -4.1263427734375, -3.86383056640625, -3.601318359375, -3.33880615234375, -3.0762939453125, -2.81378173828125, -2.55126953125, -2.28875732421875, -2.0262451171875, -1.76373291015625, -1.501220703125, -1.23870849609375, -0.9761962890625, -0.71368408203125, -0.451171875, -0.18865966796875, 0.0738525390625, 0.33636474609375, 0.598876953125, 0.86138916015625, 1.1239013671875, 1.38641357421875, 1.64892578125, 1.91143798828125, 2.1739501953125, 2.43646240234375, 2.698974609375, 2.96148681640625, 3.2239990234375, 3.48651123046875, 3.7490234375, 4.01153564453125, 4.2740478515625, 4.53656005859375, 4.799072265625, 5.06158447265625, 5.3240966796875, 5.58660888671875, 5.84912109375, 6.11163330078125, 6.3741455078125, 6.63665771484375, 6.899169921875, 7.16168212890625, 7.4241943359375, 7.68670654296875, 7.94921875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 7.0, 10.0, 33.0, 35.0, 48.0, 101.0, 129.0, 173.0, 153.0, 118.0, 79.0, 34.0, 27.0, 18.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48388671875, -0.46578216552734375, -0.4476776123046875, -0.42957305908203125, -0.411468505859375, -0.39336395263671875, -0.3752593994140625, -0.35715484619140625, -0.33905029296875, -0.32094573974609375, -0.3028411865234375, -0.28473663330078125, -0.266632080078125, -0.24852752685546875, -0.2304229736328125, -0.21231842041015625, -0.1942138671875, -0.17610931396484375, -0.1580047607421875, -0.13990020751953125, -0.121795654296875, -0.10369110107421875, -0.0855865478515625, -0.06748199462890625, -0.04937744140625, -0.03127288818359375, -0.0131683349609375, 0.00493621826171875, 0.023040771484375, 0.04114532470703125, 0.0592498779296875, 0.07735443115234375, 0.095458984375, 0.11356353759765625, 0.1316680908203125, 0.14977264404296875, 0.167877197265625, 0.18598175048828125, 0.2040863037109375, 0.22219085693359375, 0.24029541015625, 0.25839996337890625, 0.2765045166015625, 0.29460906982421875, 0.312713623046875, 0.33081817626953125, 0.3489227294921875, 0.36702728271484375, 0.3851318359375, 0.40323638916015625, 0.4213409423828125, 0.43944549560546875, 0.457550048828125, 0.47565460205078125, 0.4937591552734375, 0.5118637084960938, 0.52996826171875, 0.5480728149414062, 0.5661773681640625, 0.5842819213867188, 0.602386474609375, 0.6204910278320312, 0.6385955810546875, 0.6567001342773438, 0.6748046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 6.0, 12.0, 8.0, 17.0, 17.0, 27.0, 45.0, 41.0, 66.0, 119.0, 181.0, 327.0, 712.0, 1762.0, 5661.0, 25700.0, 155863.0, 613841.0, 202490.0, 31243.0, 6680.0, 1926.0, 788.0, 388.0, 190.0, 131.0, 88.0, 43.0, 32.0, 31.0, 25.0, 13.0, 21.0, 9.0, 7.0, 5.0, 7.0, 1.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.536163330078125, -2.45318603515625, -2.370208740234375, -2.2872314453125, -2.204254150390625, -2.12127685546875, -2.038299560546875, -1.955322265625, -1.872344970703125, -1.78936767578125, -1.706390380859375, -1.6234130859375, -1.540435791015625, -1.45745849609375, -1.374481201171875, -1.29150390625, -1.208526611328125, -1.12554931640625, -1.042572021484375, -0.9595947265625, -0.876617431640625, -0.79364013671875, -0.710662841796875, -0.627685546875, -0.544708251953125, -0.46173095703125, -0.378753662109375, -0.2957763671875, -0.212799072265625, -0.12982177734375, -0.046844482421875, 0.0361328125, 0.119110107421875, 0.20208740234375, 0.285064697265625, 0.3680419921875, 0.451019287109375, 0.53399658203125, 0.616973876953125, 0.699951171875, 0.782928466796875, 0.86590576171875, 0.948883056640625, 1.0318603515625, 1.114837646484375, 1.19781494140625, 1.280792236328125, 1.36376953125, 1.446746826171875, 1.52972412109375, 1.612701416015625, 1.6956787109375, 1.778656005859375, 1.86163330078125, 1.944610595703125, 2.027587890625, 2.110565185546875, 2.19354248046875, 2.276519775390625, 2.3594970703125, 2.442474365234375, 2.52545166015625, 2.608428955078125, 2.69140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 7.0, 9.0, 7.0, 6.0, 5.0, 13.0, 26.0, 17.0, 23.0, 22.0, 20.0, 24.0, 37.0, 36.0, 44.0, 40.0, 51.0, 53.0, 46.0, 61.0, 45.0, 40.0, 34.0, 39.0, 43.0, 38.0, 44.0, 34.0, 25.0, 18.0, 18.0, 16.0, 14.0, 11.0, 6.0, 3.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.5227508544921875, -1.475189208984375, -1.4276275634765625, -1.38006591796875, -1.3325042724609375, -1.284942626953125, -1.2373809814453125, -1.1898193359375, -1.1422576904296875, -1.094696044921875, -1.0471343994140625, -0.99957275390625, -0.9520111083984375, -0.904449462890625, -0.8568878173828125, -0.809326171875, -0.7617645263671875, -0.714202880859375, -0.6666412353515625, -0.61907958984375, -0.5715179443359375, -0.523956298828125, -0.4763946533203125, -0.4288330078125, -0.3812713623046875, -0.333709716796875, -0.2861480712890625, -0.23858642578125, -0.1910247802734375, -0.143463134765625, -0.0959014892578125, -0.04833984375, -0.0007781982421875, 0.046783447265625, 0.0943450927734375, 0.14190673828125, 0.1894683837890625, 0.237030029296875, 0.2845916748046875, 0.3321533203125, 0.3797149658203125, 0.427276611328125, 0.4748382568359375, 0.52239990234375, 0.5699615478515625, 0.617523193359375, 0.6650848388671875, 0.712646484375, 0.7602081298828125, 0.807769775390625, 0.8553314208984375, 0.90289306640625, 0.9504547119140625, 0.998016357421875, 1.0455780029296875, 1.0931396484375, 1.1407012939453125, 1.188262939453125, 1.2358245849609375, 1.28338623046875, 1.3309478759765625, 1.378509521484375, 1.4260711669921875, 1.4736328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 7.0, 18.0, 24.0, 35.0, 63.0, 91.0, 178.0, 320.0, 716.0, 2239.0, 7414.0, 37877.0, 323329.0, 579553.0, 78655.0, 12917.0, 3159.0, 1010.0, 455.0, 187.0, 116.0, 63.0, 41.0, 28.0, 18.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4560546875, -1.404388427734375, -1.35272216796875, -1.301055908203125, -1.2493896484375, -1.197723388671875, -1.14605712890625, -1.094390869140625, -1.042724609375, -0.991058349609375, -0.93939208984375, -0.887725830078125, -0.8360595703125, -0.784393310546875, -0.73272705078125, -0.681060791015625, -0.62939453125, -0.577728271484375, -0.52606201171875, -0.474395751953125, -0.4227294921875, -0.371063232421875, -0.31939697265625, -0.267730712890625, -0.216064453125, -0.164398193359375, -0.11273193359375, -0.061065673828125, -0.0093994140625, 0.042266845703125, 0.09393310546875, 0.145599365234375, 0.197265625, 0.248931884765625, 0.30059814453125, 0.352264404296875, 0.4039306640625, 0.455596923828125, 0.50726318359375, 0.558929443359375, 0.610595703125, 0.662261962890625, 0.71392822265625, 0.765594482421875, 0.8172607421875, 0.868927001953125, 0.92059326171875, 0.972259521484375, 1.02392578125, 1.075592041015625, 1.12725830078125, 1.178924560546875, 1.2305908203125, 1.282257080078125, 1.33392333984375, 1.385589599609375, 1.437255859375, 1.488922119140625, 1.54058837890625, 1.592254638671875, 1.6439208984375, 1.695587158203125, 1.74725341796875, 1.798919677734375, 1.8505859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 6.0, 15.0, 9.0, 13.0, 30.0, 23.0, 32.0, 41.0, 52.0, 77.0, 135.0, 138.0, 98.0, 85.0, 58.0, 48.0, 28.0, 24.0, 19.0, 20.0, 4.0, 6.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002435445785522461, -0.0002354886382818222, -0.00022743269801139832, -0.00021937675774097443, -0.00021132081747055054, -0.00020326487720012665, -0.00019520893692970276, -0.00018715299665927887, -0.00017909705638885498, -0.0001710411161184311, -0.0001629851758480072, -0.0001549292355775833, -0.00014687329530715942, -0.00013881735503673553, -0.00013076141476631165, -0.00012270547449588776, -0.00011464953422546387, -0.00010659359395503998, -9.853765368461609e-05, -9.04817134141922e-05, -8.242577314376831e-05, -7.436983287334442e-05, -6.631389260292053e-05, -5.825795233249664e-05, -5.0202012062072754e-05, -4.2146071791648865e-05, -3.4090131521224976e-05, -2.6034191250801086e-05, -1.7978250980377197e-05, -9.922310709953308e-06, -1.866370439529419e-06, 6.18956983089447e-06, 1.424551010131836e-05, 2.230145037174225e-05, 3.0357390642166138e-05, 3.841333091259003e-05, 4.6469271183013916e-05, 5.4525211453437805e-05, 6.25811517238617e-05, 7.063709199428558e-05, 7.869303226470947e-05, 8.674897253513336e-05, 9.480491280555725e-05, 0.00010286085307598114, 0.00011091679334640503, 0.00011897273361682892, 0.0001270286738872528, 0.0001350846141576767, 0.00014314055442810059, 0.00015119649469852448, 0.00015925243496894836, 0.00016730837523937225, 0.00017536431550979614, 0.00018342025578022003, 0.00019147619605064392, 0.0001995321363210678, 0.0002075880765914917, 0.0002156440168619156, 0.00022369995713233948, 0.00023175589740276337, 0.00023981183767318726, 0.00024786777794361115, 0.00025592371821403503, 0.0002639796584844589, 0.0002720355987548828]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 9.0, 10.0, 11.0, 19.0, 32.0, 40.0, 72.0, 98.0, 164.0, 287.0, 695.0, 1528.0, 4204.0, 15577.0, 94229.0, 675419.0, 219505.0, 26629.0, 6237.0, 2029.0, 828.0, 394.0, 190.0, 117.0, 71.0, 45.0, 20.0, 19.0, 22.0, 8.0, 7.0, 7.0, 8.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6796875, -1.6230926513671875, -1.566497802734375, -1.5099029541015625, -1.45330810546875, -1.3967132568359375, -1.340118408203125, -1.2835235595703125, -1.2269287109375, -1.1703338623046875, -1.113739013671875, -1.0571441650390625, -1.00054931640625, -0.9439544677734375, -0.887359619140625, -0.8307647705078125, -0.774169921875, -0.7175750732421875, -0.660980224609375, -0.6043853759765625, -0.54779052734375, -0.4911956787109375, -0.434600830078125, -0.3780059814453125, -0.3214111328125, -0.2648162841796875, -0.208221435546875, -0.1516265869140625, -0.09503173828125, -0.0384368896484375, 0.018157958984375, 0.0747528076171875, 0.13134765625, 0.1879425048828125, 0.244537353515625, 0.3011322021484375, 0.35772705078125, 0.4143218994140625, 0.470916748046875, 0.5275115966796875, 0.5841064453125, 0.6407012939453125, 0.697296142578125, 0.7538909912109375, 0.81048583984375, 0.8670806884765625, 0.923675537109375, 0.9802703857421875, 1.036865234375, 1.0934600830078125, 1.150054931640625, 1.2066497802734375, 1.26324462890625, 1.3198394775390625, 1.376434326171875, 1.4330291748046875, 1.4896240234375, 1.5462188720703125, 1.602813720703125, 1.6594085693359375, 1.71600341796875, 1.7725982666015625, 1.829193115234375, 1.8857879638671875, 1.9423828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 8.0, 8.0, 12.0, 16.0, 23.0, 23.0, 38.0, 51.0, 45.0, 44.0, 77.0, 67.0, 92.0, 89.0, 82.0, 65.0, 54.0, 44.0, 29.0, 23.0, 18.0, 20.0, 14.0, 8.0, 10.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80419921875, -0.7823562622070312, -0.7605133056640625, -0.7386703491210938, -0.716827392578125, -0.6949844360351562, -0.6731414794921875, -0.6512985229492188, -0.62945556640625, -0.6076126098632812, -0.5857696533203125, -0.5639266967773438, -0.542083740234375, -0.5202407836914062, -0.4983978271484375, -0.47655487060546875, -0.4547119140625, -0.43286895751953125, -0.4110260009765625, -0.38918304443359375, -0.367340087890625, -0.34549713134765625, -0.3236541748046875, -0.30181121826171875, -0.27996826171875, -0.25812530517578125, -0.2362823486328125, -0.21443939208984375, -0.192596435546875, -0.17075347900390625, -0.1489105224609375, -0.12706756591796875, -0.105224609375, -0.08338165283203125, -0.0615386962890625, -0.03969573974609375, -0.017852783203125, 0.00399017333984375, 0.0258331298828125, 0.04767608642578125, 0.06951904296875, 0.09136199951171875, 0.1132049560546875, 0.13504791259765625, 0.156890869140625, 0.17873382568359375, 0.2005767822265625, 0.22241973876953125, 0.2442626953125, 0.26610565185546875, 0.2879486083984375, 0.30979156494140625, 0.331634521484375, 0.35347747802734375, 0.3753204345703125, 0.39716339111328125, 0.41900634765625, 0.44084930419921875, 0.4626922607421875, 0.48453521728515625, 0.506378173828125, 0.5282211303710938, 0.5500640869140625, 0.5719070434570312, 0.59375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 11.0, 16.0, 36.0, 81.0, 146.0, 245.0, 221.0, 122.0, 59.0, 29.0, 14.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.150394439697266, -21.583927154541016, -21.017459869384766, -20.450990676879883, -19.884523391723633, -19.318056106567383, -18.751588821411133, -18.18511962890625, -17.61865234375, -17.05218505859375, -16.4857177734375, -15.919249534606934, -15.352781295776367, -14.786314010620117, -14.219846725463867, -13.6533784866333, -13.08691120147705, -12.5204439163208, -11.953975677490234, -11.387508392333984, -10.821040153503418, -10.254572868347168, -9.688104629516602, -9.121637344360352, -8.555170059204102, -7.988702297210693, -7.422234535217285, -6.855767250061035, -6.289299011230469, -5.722831726074219, -5.1563639640808105, -4.589896202087402, -4.023428916931152, -3.456961154937744, -2.890493392944336, -2.324025869369507, -1.7575581073760986, -1.1910903453826904, -0.6246228218078613, -0.058155059814453125, 0.5083127021789551, 1.0747804641723633, 1.641248106956482, 2.2077157497406006, 2.774183511734009, 3.340651273727417, 3.907118797302246, 4.473586559295654, 5.0400543212890625, 5.606522083282471, 6.172989845275879, 6.739457130432129, 7.305925369262695, 7.872392654418945, 8.438859939575195, 9.005328178405762, 9.571796417236328, 10.138263702392578, 10.704731941223145, 11.271199226379395, 11.837667465209961, 12.404134750366211, 12.970602035522461, 13.537070274353027, 14.103537559509277]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 3.0, 5.0, 10.0, 11.0, 10.0, 11.0, 17.0, 21.0, 17.0, 28.0, 36.0, 35.0, 44.0, 48.0, 42.0, 59.0, 52.0, 53.0, 59.0, 45.0, 44.0, 56.0, 49.0, 41.0, 37.0, 27.0, 26.0, 23.0, 23.0, 19.0, 15.0, 15.0, 6.0, 8.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.378341674804688, -10.967613220214844, -10.556885719299316, -10.146157264709473, -9.735428810119629, -9.324701309204102, -8.913972854614258, -8.503244400024414, -8.09251594543457, -7.681787967681885, -7.271059513092041, -6.8603315353393555, -6.449603080749512, -6.038875102996826, -5.628147125244141, -5.217418670654297, -4.806690692901611, -4.395962715148926, -3.985234260559082, -3.5745062828063965, -3.1637778282165527, -2.753049850463867, -2.3423216342926025, -1.931593418121338, -1.5208652019500732, -1.1101369857788086, -0.6994088292121887, -0.28868067264556885, 0.1220475435256958, 0.5327756404876709, 0.9435038566589355, 1.3542320728302002, 1.7649602890014648, 2.1756885051727295, 2.586416721343994, 2.9971446990966797, 3.4078731536865234, 3.818601131439209, 4.2293291091918945, 4.640057563781738, 5.050786018371582, 5.461513996124268, 5.872242450714111, 6.282970428466797, 6.693698883056641, 7.104426860809326, 7.515154838562012, 7.9258832931518555, 8.336610794067383, 8.747339248657227, 9.158066749572754, 9.568795204162598, 9.979523658752441, 10.390251159667969, 10.800979614257812, 11.211708068847656, 11.6224365234375, 12.033164978027344, 12.443892478942871, 12.854620933532715, 13.265349388122559, 13.676076889038086, 14.08680534362793, 14.497533798217773, 14.908262252807617]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 13.0, 24.0, 36.0, 60.0, 125.0, 234.0, 646.0, 3029.0, 47450.0, 4120340.0, 18944.0, 2100.0, 558.0, 242.0, 148.0, 88.0, 55.0, 46.0, 29.0, 21.0, 21.0, 13.0, 13.0, 12.0, 3.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.94189453125, -10.4931640625, -10.04443359375, -9.595703125, -9.14697265625, -8.6982421875, -8.24951171875, -7.80078125, -7.35205078125, -6.9033203125, -6.45458984375, -6.005859375, -5.55712890625, -5.1083984375, -4.65966796875, -4.2109375, -3.76220703125, -3.3134765625, -2.86474609375, -2.416015625, -1.96728515625, -1.5185546875, -1.06982421875, -0.62109375, -0.17236328125, 0.2763671875, 0.72509765625, 1.173828125, 1.62255859375, 2.0712890625, 2.52001953125, 2.96875, 3.41748046875, 3.8662109375, 4.31494140625, 4.763671875, 5.21240234375, 5.6611328125, 6.10986328125, 6.55859375, 7.00732421875, 7.4560546875, 7.90478515625, 8.353515625, 8.80224609375, 9.2509765625, 9.69970703125, 10.1484375, 10.59716796875, 11.0458984375, 11.49462890625, 11.943359375, 12.39208984375, 12.8408203125, 13.28955078125, 13.73828125, 14.18701171875, 14.6357421875, 15.08447265625, 15.533203125, 15.98193359375, 16.4306640625, 16.87939453125, 17.328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 8.0, 16.0, 16.0, 31.0, 36.0, 52.0, 81.0, 98.0, 126.0, 111.0, 108.0, 66.0, 80.0, 53.0, 31.0, 31.0, 17.0, 9.0, 10.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49560546875, -0.47747039794921875, -0.4593353271484375, -0.44120025634765625, -0.423065185546875, -0.40493011474609375, -0.3867950439453125, -0.36865997314453125, -0.35052490234375, -0.33238983154296875, -0.3142547607421875, -0.29611968994140625, -0.277984619140625, -0.25984954833984375, -0.2417144775390625, -0.22357940673828125, -0.2054443359375, -0.18730926513671875, -0.1691741943359375, -0.15103912353515625, -0.132904052734375, -0.11476898193359375, -0.0966339111328125, -0.07849884033203125, -0.06036376953125, -0.04222869873046875, -0.0240936279296875, -0.00595855712890625, 0.012176513671875, 0.03031158447265625, 0.0484466552734375, 0.06658172607421875, 0.084716796875, 0.10285186767578125, 0.1209869384765625, 0.13912200927734375, 0.157257080078125, 0.17539215087890625, 0.1935272216796875, 0.21166229248046875, 0.22979736328125, 0.24793243408203125, 0.2660675048828125, 0.28420257568359375, 0.302337646484375, 0.32047271728515625, 0.3386077880859375, 0.35674285888671875, 0.3748779296875, 0.39301300048828125, 0.4111480712890625, 0.42928314208984375, 0.447418212890625, 0.46555328369140625, 0.4836883544921875, 0.5018234252929688, 0.51995849609375, 0.5380935668945312, 0.5562286376953125, 0.5743637084960938, 0.592498779296875, 0.6106338500976562, 0.6287689208984375, 0.6469039916992188, 0.6650390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 8.0, 10.0, 15.0, 25.0, 33.0, 40.0, 48.0, 50.0, 76.0, 192.0, 10302.0, 4181311.0, 1707.0, 94.0, 73.0, 57.0, 61.0, 38.0, 40.0, 24.0, 29.0, 12.0, 15.0, 6.0, 2.0, 5.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.734375, -18.889404296875, -18.04443359375, -17.199462890625, -16.3544921875, -15.509521484375, -14.66455078125, -13.819580078125, -12.974609375, -12.129638671875, -11.28466796875, -10.439697265625, -9.5947265625, -8.749755859375, -7.90478515625, -7.059814453125, -6.21484375, -5.369873046875, -4.52490234375, -3.679931640625, -2.8349609375, -1.989990234375, -1.14501953125, -0.300048828125, 0.544921875, 1.389892578125, 2.23486328125, 3.079833984375, 3.9248046875, 4.769775390625, 5.61474609375, 6.459716796875, 7.3046875, 8.149658203125, 8.99462890625, 9.839599609375, 10.6845703125, 11.529541015625, 12.37451171875, 13.219482421875, 14.064453125, 14.909423828125, 15.75439453125, 16.599365234375, 17.4443359375, 18.289306640625, 19.13427734375, 19.979248046875, 20.82421875, 21.669189453125, 22.51416015625, 23.359130859375, 24.2041015625, 25.049072265625, 25.89404296875, 26.739013671875, 27.583984375, 28.428955078125, 29.27392578125, 30.118896484375, 30.9638671875, 31.808837890625, 32.65380859375, 33.498779296875, 34.34375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 9.0, 14.0, 31.0, 100.0, 389.0, 2824.0, 558.0, 117.0, 27.0, 15.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82421875, -0.746337890625, -0.66845703125, -0.590576171875, -0.5126953125, -0.434814453125, -0.35693359375, -0.279052734375, -0.201171875, -0.123291015625, -0.04541015625, 0.032470703125, 0.1103515625, 0.188232421875, 0.26611328125, 0.343994140625, 0.421875, 0.499755859375, 0.57763671875, 0.655517578125, 0.7333984375, 0.811279296875, 0.88916015625, 0.967041015625, 1.044921875, 1.122802734375, 1.20068359375, 1.278564453125, 1.3564453125, 1.434326171875, 1.51220703125, 1.590087890625, 1.66796875, 1.745849609375, 1.82373046875, 1.901611328125, 1.9794921875, 2.057373046875, 2.13525390625, 2.213134765625, 2.291015625, 2.368896484375, 2.44677734375, 2.524658203125, 2.6025390625, 2.680419921875, 2.75830078125, 2.836181640625, 2.9140625, 2.991943359375, 3.06982421875, 3.147705078125, 3.2255859375, 3.303466796875, 3.38134765625, 3.459228515625, 3.537109375, 3.614990234375, 3.69287109375, 3.770751953125, 3.8486328125, 3.926513671875, 4.00439453125, 4.082275390625, 4.16015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 43.0, 231.0, 536.0, 126.0, 36.0, 12.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.24636459350586, -41.45452117919922, -40.66267776489258, -39.87083053588867, -39.07898712158203, -38.28714370727539, -37.49530029296875, -36.703453063964844, -35.9116096496582, -35.11976623535156, -34.32792282104492, -33.536075592041016, -32.744232177734375, -31.952388763427734, -31.16054344177246, -30.36870002746582, -29.576854705810547, -28.785011291503906, -27.993165969848633, -27.201322555541992, -26.40947723388672, -25.617633819580078, -24.825788497924805, -24.033945083618164, -23.242101669311523, -22.450258255004883, -21.65841293334961, -20.86656951904297, -20.074724197387695, -19.282880783081055, -18.49103546142578, -17.69919204711914, -16.907344818115234, -16.115501403808594, -15.32365608215332, -14.531811714172363, -13.739967346191406, -12.94812297821045, -12.156278610229492, -11.364435195922852, -10.572591781616211, -9.780747413635254, -8.988903045654297, -8.19705867767334, -7.405214309692383, -6.613369941711426, -5.821526050567627, -5.02968168258667, -4.237836837768555, -3.4459924697875977, -2.6541481018066406, -1.8623039722442627, -1.0704596042633057, -0.27861523628234863, 0.5132288932800293, 1.3050732612609863, 2.0969176292419434, 2.8887619972229004, 3.6806063652038574, 4.472450256347656, 5.264294624328613, 6.05613899230957, 6.847983360290527, 7.639827728271484, 8.431672096252441]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 19.0, 20.0, 43.0, 55.0, 86.0, 69.0, 84.0, 87.0, 113.0, 97.0, 82.0, 78.0, 42.0, 49.0, 30.0, 10.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.779561519622803, -7.55860710144043, -7.337652206420898, -7.116697788238525, -6.895743370056152, -6.674788475036621, -6.453834056854248, -6.232879638671875, -6.011924743652344, -5.790970325469971, -5.5700154304504395, -5.349061012268066, -5.128106594085693, -4.90715217590332, -4.686197280883789, -4.465242862701416, -4.244288444519043, -4.02333402633667, -3.8023793697357178, -3.5814247131347656, -3.3604702949523926, -3.1395156383514404, -2.9185609817504883, -2.6976065635681152, -2.476651906967163, -2.255697250366211, -2.034742832183838, -1.8137881755828857, -1.5928336381912231, -1.3718791007995605, -1.1509244441986084, -0.9299699068069458, -0.7090158462524414, -0.4880612790584564, -0.26710671186447144, -0.04615211486816406, 0.17480242252349854, 0.39575695991516113, 0.6167116165161133, 0.8376661539077759, 1.0586206912994385, 1.279575228691101, 1.5005297660827637, 1.7214844226837158, 1.9424389600753784, 2.163393497467041, 2.384348154067993, 2.6053028106689453, 2.8262572288513184, 3.0472118854522705, 3.2681663036346436, 3.4891209602355957, 3.7100753784179688, 3.931030035018921, 4.151984691619873, 4.372939109802246, 4.593894004821777, 4.81484842300415, 5.035803318023682, 5.256757736206055, 5.477712154388428, 5.698666572570801, 5.919621467590332, 6.140575885772705, 6.361530303955078]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 10.0, 9.0, 10.0, 14.0, 21.0, 31.0, 34.0, 72.0, 156.0, 355.0, 1099.0, 4651.0, 44546.0, 840454.0, 145012.0, 9298.0, 1772.0, 519.0, 196.0, 106.0, 49.0, 42.0, 21.0, 24.0, 10.0, 12.0, 11.0, 7.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.49578857421875, -6.2611083984375, -6.02642822265625, -5.791748046875, -5.55706787109375, -5.3223876953125, -5.08770751953125, -4.85302734375, -4.61834716796875, -4.3836669921875, -4.14898681640625, -3.914306640625, -3.67962646484375, -3.4449462890625, -3.21026611328125, -2.9755859375, -2.74090576171875, -2.5062255859375, -2.27154541015625, -2.036865234375, -1.80218505859375, -1.5675048828125, -1.33282470703125, -1.09814453125, -0.86346435546875, -0.6287841796875, -0.39410400390625, -0.159423828125, 0.07525634765625, 0.3099365234375, 0.54461669921875, 0.779296875, 1.01397705078125, 1.2486572265625, 1.48333740234375, 1.718017578125, 1.95269775390625, 2.1873779296875, 2.42205810546875, 2.65673828125, 2.89141845703125, 3.1260986328125, 3.36077880859375, 3.595458984375, 3.83013916015625, 4.0648193359375, 4.29949951171875, 4.5341796875, 4.76885986328125, 5.0035400390625, 5.23822021484375, 5.472900390625, 5.70758056640625, 5.9422607421875, 6.17694091796875, 6.41162109375, 6.64630126953125, 6.8809814453125, 7.11566162109375, 7.350341796875, 7.58502197265625, 7.8197021484375, 8.05438232421875, 8.2890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 15.0, 20.0, 26.0, 40.0, 60.0, 78.0, 101.0, 108.0, 120.0, 98.0, 85.0, 67.0, 49.0, 38.0, 31.0, 21.0, 12.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.450927734375, -0.4308128356933594, -0.41069793701171875, -0.3905830383300781, -0.3704681396484375, -0.3503532409667969, -0.33023834228515625, -0.3101234436035156, -0.290008544921875, -0.2698936462402344, -0.24977874755859375, -0.22966384887695312, -0.2095489501953125, -0.18943405151367188, -0.16931915283203125, -0.14920425415039062, -0.12908935546875, -0.10897445678710938, -0.08885955810546875, -0.06874465942382812, -0.0486297607421875, -0.028514862060546875, -0.00839996337890625, 0.011714935302734375, 0.031829833984375, 0.051944732666015625, 0.07205963134765625, 0.09217453002929688, 0.1122894287109375, 0.13240432739257812, 0.15251922607421875, 0.17263412475585938, 0.1927490234375, 0.21286392211914062, 0.23297882080078125, 0.2530937194824219, 0.2732086181640625, 0.2933235168457031, 0.31343841552734375, 0.3335533142089844, 0.353668212890625, 0.3737831115722656, 0.39389801025390625, 0.4140129089355469, 0.4341278076171875, 0.4542427062988281, 0.47435760498046875, 0.4944725036621094, 0.51458740234375, 0.5347023010253906, 0.5548171997070312, 0.5749320983886719, 0.5950469970703125, 0.6151618957519531, 0.6352767944335938, 0.6553916931152344, 0.675506591796875, 0.6956214904785156, 0.7157363891601562, 0.7358512878417969, 0.7559661865234375, 0.7760810852050781, 0.7961959838867188, 0.8163108825683594, 0.83642578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 14.0, 7.0, 7.0, 14.0, 19.0, 30.0, 43.0, 47.0, 61.0, 130.0, 171.0, 288.0, 449.0, 790.0, 1641.0, 3793.0, 10049.0, 30370.0, 113328.0, 425280.0, 339105.0, 84065.0, 24164.0, 8061.0, 3193.0, 1447.0, 757.0, 406.0, 242.0, 181.0, 102.0, 79.0, 66.0, 47.0, 30.0, 24.0, 16.0, 6.0, 11.0, 5.0, 4.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.05859375, -1.987335205078125, -1.91607666015625, -1.844818115234375, -1.7735595703125, -1.702301025390625, -1.63104248046875, -1.559783935546875, -1.488525390625, -1.417266845703125, -1.34600830078125, -1.274749755859375, -1.2034912109375, -1.132232666015625, -1.06097412109375, -0.989715576171875, -0.91845703125, -0.847198486328125, -0.77593994140625, -0.704681396484375, -0.6334228515625, -0.562164306640625, -0.49090576171875, -0.419647216796875, -0.348388671875, -0.277130126953125, -0.20587158203125, -0.134613037109375, -0.0633544921875, 0.007904052734375, 0.07916259765625, 0.150421142578125, 0.2216796875, 0.292938232421875, 0.36419677734375, 0.435455322265625, 0.5067138671875, 0.577972412109375, 0.64923095703125, 0.720489501953125, 0.791748046875, 0.863006591796875, 0.93426513671875, 1.005523681640625, 1.0767822265625, 1.148040771484375, 1.21929931640625, 1.290557861328125, 1.36181640625, 1.433074951171875, 1.50433349609375, 1.575592041015625, 1.6468505859375, 1.718109130859375, 1.78936767578125, 1.860626220703125, 1.931884765625, 2.003143310546875, 2.07440185546875, 2.145660400390625, 2.2169189453125, 2.288177490234375, 2.35943603515625, 2.430694580078125, 2.501953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 9.0, 2.0, 10.0, 15.0, 11.0, 14.0, 17.0, 18.0, 27.0, 24.0, 33.0, 33.0, 49.0, 48.0, 46.0, 55.0, 55.0, 51.0, 45.0, 49.0, 37.0, 35.0, 40.0, 41.0, 36.0, 32.0, 34.0, 19.0, 23.0, 21.0, 11.0, 16.0, 9.0, 16.0, 2.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7041015625, -1.6442718505859375, -1.584442138671875, -1.5246124267578125, -1.46478271484375, -1.4049530029296875, -1.345123291015625, -1.2852935791015625, -1.2254638671875, -1.1656341552734375, -1.105804443359375, -1.0459747314453125, -0.98614501953125, -0.9263153076171875, -0.866485595703125, -0.8066558837890625, -0.746826171875, -0.6869964599609375, -0.627166748046875, -0.5673370361328125, -0.50750732421875, -0.4476776123046875, -0.387847900390625, -0.3280181884765625, -0.2681884765625, -0.2083587646484375, -0.148529052734375, -0.0886993408203125, -0.02886962890625, 0.0309600830078125, 0.090789794921875, 0.1506195068359375, 0.21044921875, 0.2702789306640625, 0.330108642578125, 0.3899383544921875, 0.44976806640625, 0.5095977783203125, 0.569427490234375, 0.6292572021484375, 0.6890869140625, 0.7489166259765625, 0.808746337890625, 0.8685760498046875, 0.92840576171875, 0.9882354736328125, 1.048065185546875, 1.1078948974609375, 1.167724609375, 1.2275543212890625, 1.287384033203125, 1.3472137451171875, 1.40704345703125, 1.4668731689453125, 1.526702880859375, 1.5865325927734375, 1.6463623046875, 1.7061920166015625, 1.766021728515625, 1.8258514404296875, 1.88568115234375, 1.9455108642578125, 2.005340576171875, 2.0651702880859375, 2.125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 8.0, 10.0, 15.0, 25.0, 19.0, 36.0, 32.0, 99.0, 100.0, 169.0, 311.0, 538.0, 1090.0, 2267.0, 5587.0, 18980.0, 126731.0, 715305.0, 145533.0, 20817.0, 5997.0, 2336.0, 1139.0, 536.0, 315.0, 176.0, 110.0, 80.0, 47.0, 26.0, 34.0, 22.0, 17.0, 9.0, 6.0, 9.0, 8.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.630859375, -2.558837890625, -2.48681640625, -2.414794921875, -2.3427734375, -2.270751953125, -2.19873046875, -2.126708984375, -2.0546875, -1.982666015625, -1.91064453125, -1.838623046875, -1.7666015625, -1.694580078125, -1.62255859375, -1.550537109375, -1.478515625, -1.406494140625, -1.33447265625, -1.262451171875, -1.1904296875, -1.118408203125, -1.04638671875, -0.974365234375, -0.90234375, -0.830322265625, -0.75830078125, -0.686279296875, -0.6142578125, -0.542236328125, -0.47021484375, -0.398193359375, -0.326171875, -0.254150390625, -0.18212890625, -0.110107421875, -0.0380859375, 0.033935546875, 0.10595703125, 0.177978515625, 0.25, 0.322021484375, 0.39404296875, 0.466064453125, 0.5380859375, 0.610107421875, 0.68212890625, 0.754150390625, 0.826171875, 0.898193359375, 0.97021484375, 1.042236328125, 1.1142578125, 1.186279296875, 1.25830078125, 1.330322265625, 1.40234375, 1.474365234375, 1.54638671875, 1.618408203125, 1.6904296875, 1.762451171875, 1.83447265625, 1.906494140625, 1.978515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 2.0, 8.0, 21.0, 27.0, 33.0, 59.0, 72.0, 89.0, 135.0, 186.0, 119.0, 48.0, 56.0, 38.0, 25.0, 24.0, 18.0, 9.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003685951232910156, -0.00035509467124938965, -0.00034159421920776367, -0.0003280937671661377, -0.0003145933151245117, -0.00030109286308288574, -0.00028759241104125977, -0.0002740919589996338, -0.0002605915069580078, -0.00024709105491638184, -0.00023359060287475586, -0.00022009015083312988, -0.0002065896987915039, -0.00019308924674987793, -0.00017958879470825195, -0.00016608834266662598, -0.000152587890625, -0.00013908743858337402, -0.00012558698654174805, -0.00011208653450012207, -9.85860824584961e-05, -8.508563041687012e-05, -7.158517837524414e-05, -5.8084726333618164e-05, -4.458427429199219e-05, -3.108382225036621e-05, -1.7583370208740234e-05, -4.082918167114258e-06, 9.417533874511719e-06, 2.2917985916137695e-05, 3.641843795776367e-05, 4.991888999938965e-05, 6.341934204101562e-05, 7.69197940826416e-05, 9.042024612426758e-05, 0.00010392069816589355, 0.00011742115020751953, 0.0001309216022491455, 0.00014442205429077148, 0.00015792250633239746, 0.00017142295837402344, 0.00018492341041564941, 0.0001984238624572754, 0.00021192431449890137, 0.00022542476654052734, 0.00023892521858215332, 0.0002524256706237793, 0.0002659261226654053, 0.00027942657470703125, 0.0002929270267486572, 0.0003064274787902832, 0.0003199279308319092, 0.00033342838287353516, 0.00034692883491516113, 0.0003604292869567871, 0.0003739297389984131, 0.00038743019104003906, 0.00040093064308166504, 0.000414431095123291, 0.000427931547164917, 0.00044143199920654297, 0.00045493245124816895, 0.0004684329032897949, 0.0004819333553314209, 0.0004954338073730469]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 6.0, 10.0, 14.0, 27.0, 22.0, 25.0, 63.0, 72.0, 139.0, 176.0, 317.0, 667.0, 1235.0, 2863.0, 7671.0, 31183.0, 293872.0, 628588.0, 62292.0, 11765.0, 4074.0, 1616.0, 798.0, 426.0, 225.0, 117.0, 85.0, 54.0, 38.0, 28.0, 15.0, 17.0, 13.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.384765625, -2.30828857421875, -2.2318115234375, -2.15533447265625, -2.078857421875, -2.00238037109375, -1.9259033203125, -1.84942626953125, -1.77294921875, -1.69647216796875, -1.6199951171875, -1.54351806640625, -1.467041015625, -1.39056396484375, -1.3140869140625, -1.23760986328125, -1.1611328125, -1.08465576171875, -1.0081787109375, -0.93170166015625, -0.855224609375, -0.77874755859375, -0.7022705078125, -0.62579345703125, -0.54931640625, -0.47283935546875, -0.3963623046875, -0.31988525390625, -0.243408203125, -0.16693115234375, -0.0904541015625, -0.01397705078125, 0.0625, 0.13897705078125, 0.2154541015625, 0.29193115234375, 0.368408203125, 0.44488525390625, 0.5213623046875, 0.59783935546875, 0.67431640625, 0.75079345703125, 0.8272705078125, 0.90374755859375, 0.980224609375, 1.05670166015625, 1.1331787109375, 1.20965576171875, 1.2861328125, 1.36260986328125, 1.4390869140625, 1.51556396484375, 1.592041015625, 1.66851806640625, 1.7449951171875, 1.82147216796875, 1.89794921875, 1.97442626953125, 2.0509033203125, 2.12738037109375, 2.203857421875, 2.28033447265625, 2.3568115234375, 2.43328857421875, 2.509765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 12.0, 14.0, 20.0, 32.0, 52.0, 53.0, 73.0, 87.0, 95.0, 105.0, 102.0, 87.0, 85.0, 46.0, 36.0, 30.0, 18.0, 11.0, 5.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.2326202392578125, -1.194732666015625, -1.1568450927734375, -1.11895751953125, -1.0810699462890625, -1.043182373046875, -1.0052947998046875, -0.9674072265625, -0.9295196533203125, -0.891632080078125, -0.8537445068359375, -0.81585693359375, -0.7779693603515625, -0.740081787109375, -0.7021942138671875, -0.664306640625, -0.6264190673828125, -0.588531494140625, -0.5506439208984375, -0.51275634765625, -0.4748687744140625, -0.436981201171875, -0.3990936279296875, -0.3612060546875, -0.3233184814453125, -0.285430908203125, -0.2475433349609375, -0.20965576171875, -0.1717681884765625, -0.133880615234375, -0.0959930419921875, -0.05810546875, -0.0202178955078125, 0.017669677734375, 0.0555572509765625, 0.09344482421875, 0.1313323974609375, 0.169219970703125, 0.2071075439453125, 0.2449951171875, 0.2828826904296875, 0.320770263671875, 0.3586578369140625, 0.39654541015625, 0.4344329833984375, 0.472320556640625, 0.5102081298828125, 0.548095703125, 0.5859832763671875, 0.623870849609375, 0.6617584228515625, 0.69964599609375, 0.7375335693359375, 0.775421142578125, 0.8133087158203125, 0.8511962890625, 0.8890838623046875, 0.926971435546875, 0.9648590087890625, 1.00274658203125, 1.0406341552734375, 1.078521728515625, 1.1164093017578125, 1.154296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 28.0, 54.0, 121.0, 281.0, 261.0, 150.0, 52.0, 19.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.458847045898438, -18.61956024169922, -17.780271530151367, -16.94098472595215, -16.101696014404297, -15.262409210205078, -14.423121452331543, -13.583833694458008, -12.744546890258789, -11.905259132385254, -11.065971374511719, -10.2266845703125, -9.387396812438965, -8.54810905456543, -7.7088212966918945, -6.869534015655518, -6.030245780944824, -5.190958023071289, -4.351670742034912, -3.512382984161377, -2.673095464706421, -1.8338079452514648, -0.9945201873779297, -0.15523290634155273, 0.6840548515319824, 1.5233423709869385, 2.3626298904418945, 3.2019176483154297, 4.041205406188965, 4.880492687225342, 5.719780445098877, 6.559067726135254, 7.398355484008789, 8.237643241882324, 9.07693099975586, 9.916217803955078, 10.755505561828613, 11.594793319702148, 12.434081077575684, 13.273368835449219, 14.112655639648438, 14.951943397521973, 15.791231155395508, 16.630517959594727, 17.469806671142578, 18.309093475341797, 19.148380279541016, 19.987668991088867, 20.82695770263672, 21.666244506835938, 22.50553321838379, 23.344820022583008, 24.18410873413086, 25.023395538330078, 25.862682342529297, 26.70197105407715, 27.541257858276367, 28.380544662475586, 29.219833374023438, 30.059120178222656, 30.898408889770508, 31.737695693969727, 32.57698440551758, 33.4162712097168, 34.255558013916016]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 5.0, 6.0, 9.0, 22.0, 19.0, 18.0, 14.0, 24.0, 27.0, 25.0, 20.0, 38.0, 31.0, 42.0, 44.0, 47.0, 47.0, 53.0, 37.0, 55.0, 45.0, 34.0, 31.0, 39.0, 26.0, 29.0, 30.0, 31.0, 26.0, 22.0, 17.0, 17.0, 8.0, 16.0, 8.0, 2.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.912752151489258, -11.559101104736328, -11.205450057983398, -10.851799011230469, -10.498147964477539, -10.14449691772461, -9.79084587097168, -9.43719482421875, -9.08354377746582, -8.72989273071289, -8.376241683959961, -8.022590637207031, -7.668939590454102, -7.315288543701172, -6.9616379737854, -6.607986927032471, -6.254336357116699, -5.9006853103637695, -5.54703426361084, -5.19338321685791, -4.8397321701049805, -4.486081123352051, -4.132430553436279, -3.7787795066833496, -3.42512845993042, -3.0714774131774902, -2.7178263664245605, -2.36417555809021, -2.0105245113372803, -1.6568734645843506, -1.30322265625, -0.9495716094970703, -0.5959196090698242, -0.2422686219215393, 0.1113823652267456, 0.46503329277038574, 0.8186843395233154, 1.1723353862762451, 1.5259861946105957, 1.8796372413635254, 2.233288288116455, 2.5869393348693848, 2.9405903816223145, 3.294241189956665, 3.6478922367095947, 4.001543045043945, 4.355194091796875, 4.708845138549805, 5.062496185302734, 5.416147232055664, 5.769798278808594, 6.123449325561523, 6.477100372314453, 6.830751419067383, 7.184401988983154, 7.538053035736084, 7.891704082489014, 8.245354652404785, 8.599005699157715, 8.952656745910645, 9.306307792663574, 9.659958839416504, 10.013609886169434, 10.367260932922363, 10.720911979675293]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 12.0, 6.0, 12.0, 17.0, 32.0, 60.0, 88.0, 115.0, 242.0, 414.0, 822.0, 1889.0, 5013.0, 16411.0, 98799.0, 3914354.0, 128481.0, 17847.0, 5297.0, 2024.0, 968.0, 499.0, 296.0, 198.0, 125.0, 85.0, 57.0, 32.0, 18.0, 13.0, 9.0, 13.0, 3.0, 2.0, 6.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.67596435546875, -3.5198974609375, -3.36383056640625, -3.207763671875, -3.05169677734375, -2.8956298828125, -2.73956298828125, -2.58349609375, -2.42742919921875, -2.2713623046875, -2.11529541015625, -1.959228515625, -1.80316162109375, -1.6470947265625, -1.49102783203125, -1.3349609375, -1.17889404296875, -1.0228271484375, -0.86676025390625, -0.710693359375, -0.55462646484375, -0.3985595703125, -0.24249267578125, -0.08642578125, 0.06964111328125, 0.2257080078125, 0.38177490234375, 0.537841796875, 0.69390869140625, 0.8499755859375, 1.00604248046875, 1.162109375, 1.31817626953125, 1.4742431640625, 1.63031005859375, 1.786376953125, 1.94244384765625, 2.0985107421875, 2.25457763671875, 2.41064453125, 2.56671142578125, 2.7227783203125, 2.87884521484375, 3.034912109375, 3.19097900390625, 3.3470458984375, 3.50311279296875, 3.6591796875, 3.81524658203125, 3.9713134765625, 4.12738037109375, 4.283447265625, 4.43951416015625, 4.5955810546875, 4.75164794921875, 4.90771484375, 5.06378173828125, 5.2198486328125, 5.37591552734375, 5.531982421875, 5.68804931640625, 5.8441162109375, 6.00018310546875, 6.15625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 11.0, 18.0, 15.0, 23.0, 21.0, 44.0, 52.0, 59.0, 71.0, 92.0, 82.0, 87.0, 73.0, 80.0, 54.0, 47.0, 39.0, 32.0, 32.0, 21.0, 15.0, 7.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48388671875, -0.46538543701171875, -0.4468841552734375, -0.42838287353515625, -0.409881591796875, -0.39138031005859375, -0.3728790283203125, -0.35437774658203125, -0.33587646484375, -0.31737518310546875, -0.2988739013671875, -0.28037261962890625, -0.261871337890625, -0.24337005615234375, -0.2248687744140625, -0.20636749267578125, -0.1878662109375, -0.16936492919921875, -0.1508636474609375, -0.13236236572265625, -0.113861083984375, -0.09535980224609375, -0.0768585205078125, -0.05835723876953125, -0.03985595703125, -0.02135467529296875, -0.0028533935546875, 0.01564788818359375, 0.034149169921875, 0.05265045166015625, 0.0711517333984375, 0.08965301513671875, 0.108154296875, 0.12665557861328125, 0.1451568603515625, 0.16365814208984375, 0.182159423828125, 0.20066070556640625, 0.2191619873046875, 0.23766326904296875, 0.25616455078125, 0.27466583251953125, 0.2931671142578125, 0.31166839599609375, 0.330169677734375, 0.34867095947265625, 0.3671722412109375, 0.38567352294921875, 0.4041748046875, 0.42267608642578125, 0.4411773681640625, 0.45967864990234375, 0.478179931640625, 0.49668121337890625, 0.5151824951171875, 0.5336837768554688, 0.55218505859375, 0.5706863403320312, 0.5891876220703125, 0.6076889038085938, 0.626190185546875, 0.6446914672851562, 0.6631927490234375, 0.6816940307617188, 0.7001953125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 7.0, 3.0, 9.0, 16.0, 14.0, 25.0, 23.0, 57.0, 84.0, 114.0, 183.0, 321.0, 628.0, 1178.0, 2407.0, 6043.0, 19431.0, 111667.0, 3743067.0, 262355.0, 31739.0, 8704.0, 3098.0, 1338.0, 694.0, 362.0, 248.0, 161.0, 109.0, 62.0, 42.0, 36.0, 22.0, 15.0, 6.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.234375, -3.11297607421875, -2.9915771484375, -2.87017822265625, -2.748779296875, -2.62738037109375, -2.5059814453125, -2.38458251953125, -2.26318359375, -2.14178466796875, -2.0203857421875, -1.89898681640625, -1.777587890625, -1.65618896484375, -1.5347900390625, -1.41339111328125, -1.2919921875, -1.17059326171875, -1.0491943359375, -0.92779541015625, -0.806396484375, -0.68499755859375, -0.5635986328125, -0.44219970703125, -0.32080078125, -0.19940185546875, -0.0780029296875, 0.04339599609375, 0.164794921875, 0.28619384765625, 0.4075927734375, 0.52899169921875, 0.650390625, 0.77178955078125, 0.8931884765625, 1.01458740234375, 1.135986328125, 1.25738525390625, 1.3787841796875, 1.50018310546875, 1.62158203125, 1.74298095703125, 1.8643798828125, 1.98577880859375, 2.107177734375, 2.22857666015625, 2.3499755859375, 2.47137451171875, 2.5927734375, 2.71417236328125, 2.8355712890625, 2.95697021484375, 3.078369140625, 3.19976806640625, 3.3211669921875, 3.44256591796875, 3.56396484375, 3.68536376953125, 3.8067626953125, 3.92816162109375, 4.049560546875, 4.17095947265625, 4.2923583984375, 4.41375732421875, 4.53515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 12.0, 16.0, 27.0, 31.0, 52.0, 81.0, 159.0, 421.0, 1938.0, 706.0, 259.0, 105.0, 75.0, 39.0, 40.0, 33.0, 21.0, 15.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.7075729370117188, -0.6763763427734375, -0.6451797485351562, -0.613983154296875, -0.5827865600585938, -0.5515899658203125, -0.5203933715820312, -0.48919677734375, -0.45800018310546875, -0.4268035888671875, -0.39560699462890625, -0.364410400390625, -0.33321380615234375, -0.3020172119140625, -0.27082061767578125, -0.2396240234375, -0.20842742919921875, -0.1772308349609375, -0.14603424072265625, -0.114837646484375, -0.08364105224609375, -0.0524444580078125, -0.02124786376953125, 0.00994873046875, 0.04114532470703125, 0.0723419189453125, 0.10353851318359375, 0.134735107421875, 0.16593170166015625, 0.1971282958984375, 0.22832489013671875, 0.259521484375, 0.29071807861328125, 0.3219146728515625, 0.35311126708984375, 0.384307861328125, 0.41550445556640625, 0.4467010498046875, 0.47789764404296875, 0.50909423828125, 0.5402908325195312, 0.5714874267578125, 0.6026840209960938, 0.633880615234375, 0.6650772094726562, 0.6962738037109375, 0.7274703979492188, 0.7586669921875, 0.7898635864257812, 0.8210601806640625, 0.8522567749023438, 0.883453369140625, 0.9146499633789062, 0.9458465576171875, 0.9770431518554688, 1.00823974609375, 1.0394363403320312, 1.0706329345703125, 1.1018295288085938, 1.133026123046875, 1.1642227172851562, 1.1954193115234375, 1.2266159057617188, 1.2578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 30.0, 104.0, 383.0, 370.0, 92.0, 18.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.541452407836914, -13.0885591506958, -12.635666847229004, -12.18277359008789, -11.729880332946777, -11.276987075805664, -10.824094772338867, -10.371201515197754, -9.91830825805664, -9.465415000915527, -9.01252269744873, -8.559629440307617, -8.106736183166504, -7.653843402862549, -7.200950622558594, -6.7480573654174805, -6.295165061950684, -5.8422722816467285, -5.389379024505615, -4.93648624420166, -4.483592987060547, -4.030700206756592, -3.5778074264526367, -3.1249144077301025, -2.6720213890075684, -2.219128370285034, -1.7662354707717896, -1.313342571258545, -0.8604495525360107, -0.40755653381347656, 0.045336246490478516, 0.4982292652130127, 0.9511222839355469, 1.404015302658081, 1.8569082021713257, 2.3098011016845703, 2.7626941204071045, 3.2155871391296387, 3.6684799194335938, 4.121373176574707, 4.574265956878662, 5.027158737182617, 5.4800519943237305, 5.9329447746276855, 6.385837554931641, 6.838730812072754, 7.291623592376709, 7.744516372680664, 8.197409629821777, 8.65030288696289, 9.103195190429688, 9.5560884475708, 10.008981704711914, 10.461874008178711, 10.914767265319824, 11.367660522460938, 11.820552825927734, 12.273446083068848, 12.726338386535645, 13.179231643676758, 13.632124900817871, 14.085018157958984, 14.537910461425781, 14.990803718566895, 15.443696975708008]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 12.0, 6.0, 7.0, 14.0, 12.0, 19.0, 19.0, 17.0, 22.0, 22.0, 29.0, 24.0, 36.0, 28.0, 31.0, 50.0, 47.0, 47.0, 51.0, 34.0, 42.0, 45.0, 38.0, 44.0, 37.0, 49.0, 25.0, 29.0, 22.0, 26.0, 31.0, 23.0, 9.0, 12.0, 9.0, 4.0, 5.0, 7.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2637805938720703, -2.182279586791992, -2.100778341293335, -2.019277334213257, -1.9377762079238892, -1.8562750816345215, -1.7747740745544434, -1.6932729482650757, -1.611771821975708, -1.5302706956863403, -1.4487695693969727, -1.3672685623168945, -1.2857674360275269, -1.2042663097381592, -1.122765302658081, -1.0412641763687134, -0.9597630500793457, -0.878261923789978, -0.7967608571052551, -0.7152597904205322, -0.6337586641311646, -0.5522575378417969, -0.470756471157074, -0.3892554044723511, -0.3077542781829834, -0.2262531816959381, -0.14475208520889282, -0.06325098872184753, 0.018250107765197754, 0.09975120425224304, 0.18125230073928833, 0.26275336742401123, 0.3442544937133789, 0.4257555902004242, 0.5072566866874695, 0.5887577533721924, 0.6702588796615601, 0.7517600059509277, 0.8332610726356506, 0.9147621393203735, 0.9962632656097412, 1.0777643918991089, 1.1592655181884766, 1.2407665252685547, 1.3222676515579224, 1.40376877784729, 1.4852697849273682, 1.5667709112167358, 1.6482720375061035, 1.7297731637954712, 1.8112742900848389, 1.892775297164917, 1.9742764234542847, 2.0557775497436523, 2.1372785568237305, 2.2187795639038086, 2.300280809402466, 2.381781816482544, 2.463283061981201, 2.5447840690612793, 2.6262850761413574, 2.7077863216400146, 2.7892873287200928, 2.87078857421875, 2.952289581298828]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 14.0, 10.0, 25.0, 34.0, 63.0, 59.0, 130.0, 154.0, 262.0, 418.0, 774.0, 1396.0, 2571.0, 5628.0, 13697.0, 37855.0, 119617.0, 371592.0, 334636.0, 103297.0, 33442.0, 12284.0, 5109.0, 2422.0, 1275.0, 651.0, 382.0, 250.0, 169.0, 123.0, 68.0, 49.0, 27.0, 15.0, 17.0, 8.0, 9.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6796875, -1.61956787109375, -1.5594482421875, -1.49932861328125, -1.439208984375, -1.37908935546875, -1.3189697265625, -1.25885009765625, -1.19873046875, -1.13861083984375, -1.0784912109375, -1.01837158203125, -0.958251953125, -0.89813232421875, -0.8380126953125, -0.77789306640625, -0.7177734375, -0.65765380859375, -0.5975341796875, -0.53741455078125, -0.477294921875, -0.41717529296875, -0.3570556640625, -0.29693603515625, -0.23681640625, -0.17669677734375, -0.1165771484375, -0.05645751953125, 0.003662109375, 0.06378173828125, 0.1239013671875, 0.18402099609375, 0.244140625, 0.30426025390625, 0.3643798828125, 0.42449951171875, 0.484619140625, 0.54473876953125, 0.6048583984375, 0.66497802734375, 0.72509765625, 0.78521728515625, 0.8453369140625, 0.90545654296875, 0.965576171875, 1.02569580078125, 1.0858154296875, 1.14593505859375, 1.2060546875, 1.26617431640625, 1.3262939453125, 1.38641357421875, 1.446533203125, 1.50665283203125, 1.5667724609375, 1.62689208984375, 1.68701171875, 1.74713134765625, 1.8072509765625, 1.86737060546875, 1.927490234375, 1.98760986328125, 2.0477294921875, 2.10784912109375, 2.16796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 3.0, 14.0, 9.0, 15.0, 26.0, 38.0, 47.0, 50.0, 60.0, 81.0, 106.0, 73.0, 82.0, 67.0, 72.0, 53.0, 59.0, 45.0, 37.0, 18.0, 11.0, 8.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51220703125, -0.4937286376953125, -0.475250244140625, -0.4567718505859375, -0.43829345703125, -0.4198150634765625, -0.401336669921875, -0.3828582763671875, -0.3643798828125, -0.3459014892578125, -0.327423095703125, -0.3089447021484375, -0.29046630859375, -0.2719879150390625, -0.253509521484375, -0.2350311279296875, -0.216552734375, -0.1980743408203125, -0.179595947265625, -0.1611175537109375, -0.14263916015625, -0.1241607666015625, -0.105682373046875, -0.0872039794921875, -0.0687255859375, -0.0502471923828125, -0.031768798828125, -0.0132904052734375, 0.00518798828125, 0.0236663818359375, 0.042144775390625, 0.0606231689453125, 0.0791015625, 0.0975799560546875, 0.116058349609375, 0.1345367431640625, 0.15301513671875, 0.1714935302734375, 0.189971923828125, 0.2084503173828125, 0.2269287109375, 0.2454071044921875, 0.263885498046875, 0.2823638916015625, 0.30084228515625, 0.3193206787109375, 0.337799072265625, 0.3562774658203125, 0.374755859375, 0.3932342529296875, 0.411712646484375, 0.4301910400390625, 0.44866943359375, 0.4671478271484375, 0.485626220703125, 0.5041046142578125, 0.5225830078125, 0.5410614013671875, 0.559539794921875, 0.5780181884765625, 0.59649658203125, 0.6149749755859375, 0.633453369140625, 0.6519317626953125, 0.67041015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 7.0, 10.0, 18.0, 30.0, 42.0, 48.0, 84.0, 119.0, 230.0, 328.0, 517.0, 953.0, 1636.0, 3191.0, 6939.0, 17268.0, 46912.0, 149841.0, 391369.0, 285161.0, 91343.0, 30164.0, 11673.0, 4911.0, 2493.0, 1280.0, 766.0, 426.0, 265.0, 187.0, 106.0, 76.0, 49.0, 35.0, 13.0, 12.0, 16.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.759765625, -1.7076873779296875, -1.655609130859375, -1.6035308837890625, -1.55145263671875, -1.4993743896484375, -1.447296142578125, -1.3952178955078125, -1.3431396484375, -1.2910614013671875, -1.238983154296875, -1.1869049072265625, -1.13482666015625, -1.0827484130859375, -1.030670166015625, -0.9785919189453125, -0.926513671875, -0.8744354248046875, -0.822357177734375, -0.7702789306640625, -0.71820068359375, -0.6661224365234375, -0.614044189453125, -0.5619659423828125, -0.5098876953125, -0.4578094482421875, -0.405731201171875, -0.3536529541015625, -0.30157470703125, -0.2494964599609375, -0.197418212890625, -0.1453399658203125, -0.09326171875, -0.0411834716796875, 0.010894775390625, 0.0629730224609375, 0.11505126953125, 0.1671295166015625, 0.219207763671875, 0.2712860107421875, 0.3233642578125, 0.3754425048828125, 0.427520751953125, 0.4795989990234375, 0.53167724609375, 0.5837554931640625, 0.635833740234375, 0.6879119873046875, 0.739990234375, 0.7920684814453125, 0.844146728515625, 0.8962249755859375, 0.94830322265625, 1.0003814697265625, 1.052459716796875, 1.1045379638671875, 1.1566162109375, 1.2086944580078125, 1.260772705078125, 1.3128509521484375, 1.36492919921875, 1.4170074462890625, 1.469085693359375, 1.5211639404296875, 1.5732421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 15.0, 20.0, 23.0, 31.0, 35.0, 38.0, 34.0, 28.0, 50.0, 52.0, 49.0, 44.0, 49.0, 59.0, 59.0, 48.0, 55.0, 56.0, 35.0, 34.0, 25.0, 26.0, 22.0, 19.0, 18.0, 11.0, 8.0, 9.0, 6.0, 4.0, 0.0, 5.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0], "bins": [-2.552734375, -2.48614501953125, -2.4195556640625, -2.35296630859375, -2.286376953125, -2.21978759765625, -2.1531982421875, -2.08660888671875, -2.02001953125, -1.95343017578125, -1.8868408203125, -1.82025146484375, -1.753662109375, -1.68707275390625, -1.6204833984375, -1.55389404296875, -1.4873046875, -1.42071533203125, -1.3541259765625, -1.28753662109375, -1.220947265625, -1.15435791015625, -1.0877685546875, -1.02117919921875, -0.95458984375, -0.88800048828125, -0.8214111328125, -0.75482177734375, -0.688232421875, -0.62164306640625, -0.5550537109375, -0.48846435546875, -0.421875, -0.35528564453125, -0.2886962890625, -0.22210693359375, -0.155517578125, -0.08892822265625, -0.0223388671875, 0.04425048828125, 0.11083984375, 0.17742919921875, 0.2440185546875, 0.31060791015625, 0.377197265625, 0.44378662109375, 0.5103759765625, 0.57696533203125, 0.6435546875, 0.71014404296875, 0.7767333984375, 0.84332275390625, 0.909912109375, 0.97650146484375, 1.0430908203125, 1.10968017578125, 1.17626953125, 1.24285888671875, 1.3094482421875, 1.37603759765625, 1.442626953125, 1.50921630859375, 1.5758056640625, 1.64239501953125, 1.708984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 9.0, 5.0, 8.0, 16.0, 15.0, 14.0, 27.0, 35.0, 51.0, 74.0, 107.0, 160.0, 192.0, 320.0, 496.0, 813.0, 1341.0, 2596.0, 5519.0, 14789.0, 60711.0, 459837.0, 420264.0, 55832.0, 14086.0, 5147.0, 2484.0, 1291.0, 781.0, 538.0, 303.0, 196.0, 149.0, 87.0, 73.0, 51.0, 33.0, 25.0, 25.0, 19.0, 10.0, 9.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.279296875, -1.239288330078125, -1.19927978515625, -1.159271240234375, -1.1192626953125, -1.079254150390625, -1.03924560546875, -0.999237060546875, -0.959228515625, -0.919219970703125, -0.87921142578125, -0.839202880859375, -0.7991943359375, -0.759185791015625, -0.71917724609375, -0.679168701171875, -0.63916015625, -0.599151611328125, -0.55914306640625, -0.519134521484375, -0.4791259765625, -0.439117431640625, -0.39910888671875, -0.359100341796875, -0.319091796875, -0.279083251953125, -0.23907470703125, -0.199066162109375, -0.1590576171875, -0.119049072265625, -0.07904052734375, -0.039031982421875, 0.0009765625, 0.040985107421875, 0.08099365234375, 0.121002197265625, 0.1610107421875, 0.201019287109375, 0.24102783203125, 0.281036376953125, 0.321044921875, 0.361053466796875, 0.40106201171875, 0.441070556640625, 0.4810791015625, 0.521087646484375, 0.56109619140625, 0.601104736328125, 0.64111328125, 0.681121826171875, 0.72113037109375, 0.761138916015625, 0.8011474609375, 0.841156005859375, 0.88116455078125, 0.921173095703125, 0.961181640625, 1.001190185546875, 1.04119873046875, 1.081207275390625, 1.1212158203125, 1.161224365234375, 1.20123291015625, 1.241241455078125, 1.28125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 10.0, 24.0, 30.0, 53.0, 110.0, 267.0, 242.0, 101.0, 69.0, 36.0, 11.0, 11.0, 6.0, 9.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007343292236328125, -0.0007164031267166138, -0.000698477029800415, -0.0006805509328842163, -0.0006626248359680176, -0.0006446987390518188, -0.0006267726421356201, -0.0006088465452194214, -0.0005909204483032227, -0.0005729943513870239, -0.0005550682544708252, -0.0005371421575546265, -0.0005192160606384277, -0.000501289963722229, -0.0004833638668060303, -0.00046543776988983154, -0.0004475116729736328, -0.0004295855760574341, -0.00041165947914123535, -0.0003937333822250366, -0.0003758072853088379, -0.00035788118839263916, -0.00033995509147644043, -0.0003220289945602417, -0.00030410289764404297, -0.00028617680072784424, -0.0002682507038116455, -0.0002503246068954468, -0.00023239850997924805, -0.00021447241306304932, -0.00019654631614685059, -0.00017862021923065186, -0.00016069412231445312, -0.0001427680253982544, -0.00012484192848205566, -0.00010691583156585693, -8.89897346496582e-05, -7.106363773345947e-05, -5.313754081726074e-05, -3.521144390106201e-05, -1.728534698486328e-05, 6.407499313354492e-07, 1.856684684753418e-05, 3.649294376373291e-05, 5.441904067993164e-05, 7.234513759613037e-05, 9.02712345123291e-05, 0.00010819733142852783, 0.00012612342834472656, 0.0001440495252609253, 0.00016197562217712402, 0.00017990171909332275, 0.00019782781600952148, 0.00021575391292572021, 0.00023368000984191895, 0.0002516061067581177, 0.0002695322036743164, 0.00028745830059051514, 0.00030538439750671387, 0.0003233104944229126, 0.00034123659133911133, 0.00035916268825531006, 0.0003770887851715088, 0.0003950148820877075, 0.00041294097900390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 6.0, 16.0, 15.0, 16.0, 26.0, 40.0, 44.0, 84.0, 111.0, 180.0, 315.0, 510.0, 920.0, 1770.0, 3949.0, 13190.0, 111073.0, 809630.0, 87721.0, 11441.0, 3604.0, 1665.0, 874.0, 489.0, 323.0, 175.0, 115.0, 75.0, 59.0, 32.0, 29.0, 10.0, 11.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9013671875, -1.8389434814453125, -1.776519775390625, -1.7140960693359375, -1.65167236328125, -1.5892486572265625, -1.526824951171875, -1.4644012451171875, -1.4019775390625, -1.3395538330078125, -1.277130126953125, -1.2147064208984375, -1.15228271484375, -1.0898590087890625, -1.027435302734375, -0.9650115966796875, -0.902587890625, -0.8401641845703125, -0.777740478515625, -0.7153167724609375, -0.65289306640625, -0.5904693603515625, -0.528045654296875, -0.4656219482421875, -0.4031982421875, -0.3407745361328125, -0.278350830078125, -0.2159271240234375, -0.15350341796875, -0.0910797119140625, -0.028656005859375, 0.0337677001953125, 0.09619140625, 0.1586151123046875, 0.221038818359375, 0.2834625244140625, 0.34588623046875, 0.4083099365234375, 0.470733642578125, 0.5331573486328125, 0.5955810546875, 0.6580047607421875, 0.720428466796875, 0.7828521728515625, 0.84527587890625, 0.9076995849609375, 0.970123291015625, 1.0325469970703125, 1.094970703125, 1.1573944091796875, 1.219818115234375, 1.2822418212890625, 1.34466552734375, 1.4070892333984375, 1.469512939453125, 1.5319366455078125, 1.5943603515625, 1.6567840576171875, 1.719207763671875, 1.7816314697265625, 1.84405517578125, 1.9064788818359375, 1.968902587890625, 2.0313262939453125, 2.09375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 7.0, 6.0, 7.0, 23.0, 19.0, 39.0, 47.0, 56.0, 95.0, 116.0, 117.0, 129.0, 98.0, 68.0, 54.0, 34.0, 23.0, 15.0, 7.0, 7.0, 5.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.14453125, -1.11322021484375, -1.0819091796875, -1.05059814453125, -1.019287109375, -0.98797607421875, -0.9566650390625, -0.92535400390625, -0.89404296875, -0.86273193359375, -0.8314208984375, -0.80010986328125, -0.768798828125, -0.73748779296875, -0.7061767578125, -0.67486572265625, -0.6435546875, -0.61224365234375, -0.5809326171875, -0.54962158203125, -0.518310546875, -0.48699951171875, -0.4556884765625, -0.42437744140625, -0.39306640625, -0.36175537109375, -0.3304443359375, -0.29913330078125, -0.267822265625, -0.23651123046875, -0.2052001953125, -0.17388916015625, -0.142578125, -0.11126708984375, -0.0799560546875, -0.04864501953125, -0.017333984375, 0.01397705078125, 0.0452880859375, 0.07659912109375, 0.10791015625, 0.13922119140625, 0.1705322265625, 0.20184326171875, 0.233154296875, 0.26446533203125, 0.2957763671875, 0.32708740234375, 0.3583984375, 0.38970947265625, 0.4210205078125, 0.45233154296875, 0.483642578125, 0.51495361328125, 0.5462646484375, 0.57757568359375, 0.60888671875, 0.64019775390625, 0.6715087890625, 0.70281982421875, 0.734130859375, 0.76544189453125, 0.7967529296875, 0.82806396484375, 0.859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 23.0, 33.0, 56.0, 80.0, 131.0, 178.0, 184.0, 126.0, 79.0, 44.0, 18.0, 13.0, 8.0, 9.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.120553016662598, -13.627817153930664, -13.135082244873047, -12.642346382141113, -12.14961051940918, -11.656875610351562, -11.164139747619629, -10.671403884887695, -10.178668975830078, -9.685933113098145, -9.193198204040527, -8.700462341308594, -8.20772647857666, -7.714991092681885, -7.222255706787109, -6.729519844055176, -6.236783981323242, -5.744048595428467, -5.251312732696533, -4.758577346801758, -4.265841484069824, -3.773106098175049, -3.2803707122802734, -2.787635087966919, -2.2948994636535645, -1.80216383934021, -1.309428334236145, -0.8166928291320801, -0.3239572048187256, 0.1687784194946289, 0.6615138053894043, 1.1542494297027588, 1.6469841003417969, 2.1397197246551514, 2.632455348968506, 3.1251907348632812, 3.6179263591766357, 4.11066198348999, 4.603397369384766, 5.096133232116699, 5.588868618011475, 6.08160400390625, 6.574339866638184, 7.067075252532959, 7.559810638427734, 8.052546501159668, 8.545282363891602, 9.038017272949219, 9.530753135681152, 10.023488998413086, 10.516223907470703, 11.008959770202637, 11.50169563293457, 11.994430541992188, 12.487166404724121, 12.979902267456055, 13.472637176513672, 13.965373039245605, 14.458107948303223, 14.950843811035156, 15.44357967376709, 15.936315536499023, 16.42905044555664, 16.921785354614258, 17.414522171020508]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 2.0, 6.0, 10.0, 14.0, 17.0, 13.0, 18.0, 19.0, 15.0, 19.0, 40.0, 33.0, 44.0, 38.0, 42.0, 51.0, 57.0, 46.0, 58.0, 55.0, 55.0, 47.0, 40.0, 44.0, 29.0, 34.0, 32.0, 19.0, 17.0, 15.0, 16.0, 11.0, 19.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.292389869689941, -10.927141189575195, -10.561893463134766, -10.19664478302002, -9.831396102905273, -9.466148376464844, -9.100899696350098, -8.735651016235352, -8.370403289794922, -8.005154609680176, -7.639906883239746, -7.274658203125, -6.909409999847412, -6.544161796569824, -6.178913116455078, -5.81366491317749, -5.448416709899902, -5.0831685066223145, -4.717920303344727, -4.3526716232299805, -3.9874234199523926, -3.6221752166748047, -3.2569267749786377, -2.8916783332824707, -2.526430130004883, -2.161181926727295, -1.795933485031128, -1.4306851625442505, -1.065436840057373, -0.7001885175704956, -0.33494019508361816, 0.030308246612548828, 0.3955564498901367, 0.7608047723770142, 1.1260530948638916, 1.491301417350769, 1.8565497398376465, 2.2217979431152344, 2.5870463848114014, 2.9522948265075684, 3.3175430297851562, 3.682791233062744, 4.048039436340332, 4.413288116455078, 4.778536319732666, 5.143784523010254, 5.509033203125, 5.874281406402588, 6.239529609680176, 6.604777812957764, 6.970026016235352, 7.335274696350098, 7.7005228996276855, 8.065771102905273, 8.43101978302002, 8.796268463134766, 9.161516189575195, 9.526764869689941, 9.892012596130371, 10.257261276245117, 10.622509002685547, 10.987757682800293, 11.353006362915039, 11.718254089355469, 12.083502769470215]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 7.0, 6.0, 13.0, 16.0, 39.0, 53.0, 107.0, 308.0, 727.0, 2129.0, 7438.0, 41962.0, 4029086.0, 96291.0, 11023.0, 2936.0, 1075.0, 441.0, 229.0, 110.0, 75.0, 43.0, 24.0, 21.0, 18.0, 9.0, 13.0, 10.0, 7.0, 12.0, 8.0, 5.0, 4.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.421875, -2.2445068359375, -2.067138671875, -1.8897705078125, -1.71240234375, -1.5350341796875, -1.357666015625, -1.1802978515625, -1.0029296875, -0.8255615234375, -0.648193359375, -0.4708251953125, -0.29345703125, -0.1160888671875, 0.061279296875, 0.2386474609375, 0.416015625, 0.5933837890625, 0.770751953125, 0.9481201171875, 1.12548828125, 1.3028564453125, 1.480224609375, 1.6575927734375, 1.8349609375, 2.0123291015625, 2.189697265625, 2.3670654296875, 2.54443359375, 2.7218017578125, 2.899169921875, 3.0765380859375, 3.25390625, 3.4312744140625, 3.608642578125, 3.7860107421875, 3.96337890625, 4.1407470703125, 4.318115234375, 4.4954833984375, 4.6728515625, 4.8502197265625, 5.027587890625, 5.2049560546875, 5.38232421875, 5.5596923828125, 5.737060546875, 5.9144287109375, 6.091796875, 6.2691650390625, 6.446533203125, 6.6239013671875, 6.80126953125, 6.9786376953125, 7.156005859375, 7.3333740234375, 7.5107421875, 7.6881103515625, 7.865478515625, 8.0428466796875, 8.22021484375, 8.3975830078125, 8.574951171875, 8.7523193359375, 8.9296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 4.0, 19.0, 25.0, 31.0, 50.0, 49.0, 60.0, 86.0, 80.0, 105.0, 83.0, 73.0, 75.0, 68.0, 48.0, 31.0, 28.0, 24.0, 21.0, 14.0, 11.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477783203125, -0.4569511413574219, -0.43611907958984375, -0.4152870178222656, -0.3944549560546875, -0.3736228942871094, -0.35279083251953125, -0.3319587707519531, -0.311126708984375, -0.2902946472167969, -0.26946258544921875, -0.24863052368164062, -0.2277984619140625, -0.20696640014648438, -0.18613433837890625, -0.16530227661132812, -0.14447021484375, -0.12363815307617188, -0.10280609130859375, -0.08197402954101562, -0.0611419677734375, -0.040309906005859375, -0.01947784423828125, 0.001354217529296875, 0.022186279296875, 0.043018341064453125, 0.06385040283203125, 0.08468246459960938, 0.1055145263671875, 0.12634658813476562, 0.14717864990234375, 0.16801071166992188, 0.1888427734375, 0.20967483520507812, 0.23050689697265625, 0.2513389587402344, 0.2721710205078125, 0.2930030822753906, 0.31383514404296875, 0.3346672058105469, 0.355499267578125, 0.3763313293457031, 0.39716339111328125, 0.4179954528808594, 0.4388275146484375, 0.4596595764160156, 0.48049163818359375, 0.5013236999511719, 0.52215576171875, 0.5429878234863281, 0.5638198852539062, 0.5846519470214844, 0.6054840087890625, 0.6263160705566406, 0.6471481323242188, 0.6679801940917969, 0.688812255859375, 0.7096443176269531, 0.7304763793945312, 0.7513084411621094, 0.7721405029296875, 0.7929725646972656, 0.8138046264648438, 0.8346366882324219, 0.85546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 3.0, 5.0, 9.0, 8.0, 10.0, 19.0, 26.0, 37.0, 35.0, 40.0, 63.0, 84.0, 168.0, 215.0, 294.0, 485.0, 729.0, 1237.0, 2067.0, 3738.0, 7296.0, 17246.0, 66002.0, 3146777.0, 872726.0, 46553.0, 14165.0, 6298.0, 3239.0, 1764.0, 1045.0, 651.0, 417.0, 257.0, 168.0, 131.0, 78.0, 63.0, 46.0, 26.0, 10.0, 12.0, 12.0, 8.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.65625, -2.577880859375, -2.49951171875, -2.421142578125, -2.3427734375, -2.264404296875, -2.18603515625, -2.107666015625, -2.029296875, -1.950927734375, -1.87255859375, -1.794189453125, -1.7158203125, -1.637451171875, -1.55908203125, -1.480712890625, -1.40234375, -1.323974609375, -1.24560546875, -1.167236328125, -1.0888671875, -1.010498046875, -0.93212890625, -0.853759765625, -0.775390625, -0.697021484375, -0.61865234375, -0.540283203125, -0.4619140625, -0.383544921875, -0.30517578125, -0.226806640625, -0.1484375, -0.070068359375, 0.00830078125, 0.086669921875, 0.1650390625, 0.243408203125, 0.32177734375, 0.400146484375, 0.478515625, 0.556884765625, 0.63525390625, 0.713623046875, 0.7919921875, 0.870361328125, 0.94873046875, 1.027099609375, 1.10546875, 1.183837890625, 1.26220703125, 1.340576171875, 1.4189453125, 1.497314453125, 1.57568359375, 1.654052734375, 1.732421875, 1.810791015625, 1.88916015625, 1.967529296875, 2.0458984375, 2.124267578125, 2.20263671875, 2.281005859375, 2.359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 11.0, 14.0, 13.0, 19.0, 20.0, 59.0, 99.0, 239.0, 897.0, 1925.0, 412.0, 145.0, 68.0, 33.0, 25.0, 18.0, 10.0, 15.0, 8.0, 8.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-1.1083984375, -1.083343505859375, -1.05828857421875, -1.033233642578125, -1.0081787109375, -0.983123779296875, -0.95806884765625, -0.933013916015625, -0.907958984375, -0.882904052734375, -0.85784912109375, -0.832794189453125, -0.8077392578125, -0.782684326171875, -0.75762939453125, -0.732574462890625, -0.70751953125, -0.682464599609375, -0.65740966796875, -0.632354736328125, -0.6072998046875, -0.582244873046875, -0.55718994140625, -0.532135009765625, -0.507080078125, -0.482025146484375, -0.45697021484375, -0.431915283203125, -0.4068603515625, -0.381805419921875, -0.35675048828125, -0.331695556640625, -0.306640625, -0.281585693359375, -0.25653076171875, -0.231475830078125, -0.2064208984375, -0.181365966796875, -0.15631103515625, -0.131256103515625, -0.106201171875, -0.081146240234375, -0.05609130859375, -0.031036376953125, -0.0059814453125, 0.019073486328125, 0.04412841796875, 0.069183349609375, 0.09423828125, 0.119293212890625, 0.14434814453125, 0.169403076171875, 0.1944580078125, 0.219512939453125, 0.24456787109375, 0.269622802734375, 0.294677734375, 0.319732666015625, 0.34478759765625, 0.369842529296875, 0.3948974609375, 0.419952392578125, 0.44500732421875, 0.470062255859375, 0.4951171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 12.0, 13.0, 28.0, 58.0, 107.0, 182.0, 245.0, 185.0, 79.0, 39.0, 19.0, 13.0, 6.0, 7.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.503745079040527, -4.318550109863281, -4.133354663848877, -3.948159694671631, -3.7629642486572266, -3.5777692794799805, -3.3925740718841553, -3.20737886428833, -3.022183656692505, -2.8369884490966797, -2.6517932415008545, -2.4665980339050293, -2.281403064727783, -2.096207618713379, -1.9110126495361328, -1.7258174419403076, -1.5406222343444824, -1.3554270267486572, -1.170231819152832, -0.9850367307662964, -0.7998415231704712, -0.614646315574646, -0.42945122718811035, -0.24425601959228516, -0.05906081199645996, 0.12613436579704285, 0.31132954359054565, 0.4965246915817261, 0.6817198991775513, 0.8669151067733765, 1.052110195159912, 1.2373054027557373, 1.4225006103515625, 1.6076958179473877, 1.792891025543213, 1.9780861139297485, 2.1632814407348633, 2.3484764099121094, 2.5336716175079346, 2.7188668251037598, 2.904062032699585, 3.08925724029541, 3.2744524478912354, 3.4596476554870605, 3.6448426246643066, 3.830038070678711, 4.015233039855957, 4.200428009033203, 4.385623455047607, 4.5708184242248535, 4.756013870239258, 4.941208839416504, 5.126404285430908, 5.311599254608154, 5.496794700622559, 5.681989669799805, 5.867184638977051, 6.052379608154297, 6.237575054168701, 6.422770023345947, 6.607965469360352, 6.793160438537598, 6.978355407714844, 7.163550853729248, 7.348746299743652]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 4.0, 10.0, 5.0, 13.0, 17.0, 19.0, 15.0, 11.0, 14.0, 14.0, 24.0, 31.0, 34.0, 39.0, 32.0, 48.0, 42.0, 32.0, 35.0, 39.0, 39.0, 59.0, 37.0, 45.0, 52.0, 46.0, 41.0, 28.0, 33.0, 20.0, 18.0, 19.0, 24.0, 10.0, 10.0, 5.0, 8.0, 3.0, 2.0, 5.0, 5.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.376662492752075, -2.3135604858398438, -2.2504584789276123, -2.187356472015381, -2.1242544651031494, -2.061152458190918, -1.9980504512786865, -1.934948444366455, -1.8718464374542236, -1.8087444305419922, -1.7456424236297607, -1.6825404167175293, -1.6194384098052979, -1.5563364028930664, -1.493234395980835, -1.4301323890686035, -1.367030382156372, -1.3039283752441406, -1.2408263683319092, -1.1777243614196777, -1.1146223545074463, -1.0515203475952148, -0.9884183406829834, -0.925316333770752, -0.8622143268585205, -0.7991123199462891, -0.7360103130340576, -0.6729083061218262, -0.6098062992095947, -0.5467042922973633, -0.48360228538513184, -0.4205002784729004, -0.35739850997924805, -0.2942965030670166, -0.23119449615478516, -0.1680924892425537, -0.10499048233032227, -0.04188847541809082, 0.021213531494140625, 0.08431553840637207, 0.14741754531860352, 0.21051955223083496, 0.2736215591430664, 0.33672356605529785, 0.3998255729675293, 0.46292757987976074, 0.5260295867919922, 0.5891315937042236, 0.6522336006164551, 0.7153356075286865, 0.778437614440918, 0.8415396213531494, 0.9046416282653809, 0.9677436351776123, 1.0308456420898438, 1.0939476490020752, 1.1570496559143066, 1.220151662826538, 1.2832536697387695, 1.346355676651001, 1.4094576835632324, 1.4725596904754639, 1.5356616973876953, 1.5987637042999268, 1.6618657112121582]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 11.0, 8.0, 17.0, 8.0, 26.0, 24.0, 35.0, 56.0, 102.0, 289.0, 1031.0, 5755.0, 95724.0, 874952.0, 64594.0, 4476.0, 895.0, 265.0, 103.0, 51.0, 41.0, 22.0, 22.0, 18.0, 9.0, 10.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.8359375, -6.64306640625, -6.4501953125, -6.25732421875, -6.064453125, -5.87158203125, -5.6787109375, -5.48583984375, -5.29296875, -5.10009765625, -4.9072265625, -4.71435546875, -4.521484375, -4.32861328125, -4.1357421875, -3.94287109375, -3.75, -3.55712890625, -3.3642578125, -3.17138671875, -2.978515625, -2.78564453125, -2.5927734375, -2.39990234375, -2.20703125, -2.01416015625, -1.8212890625, -1.62841796875, -1.435546875, -1.24267578125, -1.0498046875, -0.85693359375, -0.6640625, -0.47119140625, -0.2783203125, -0.08544921875, 0.107421875, 0.30029296875, 0.4931640625, 0.68603515625, 0.87890625, 1.07177734375, 1.2646484375, 1.45751953125, 1.650390625, 1.84326171875, 2.0361328125, 2.22900390625, 2.421875, 2.61474609375, 2.8076171875, 3.00048828125, 3.193359375, 3.38623046875, 3.5791015625, 3.77197265625, 3.96484375, 4.15771484375, 4.3505859375, 4.54345703125, 4.736328125, 4.92919921875, 5.1220703125, 5.31494140625, 5.5078125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 8.0, 9.0, 18.0, 23.0, 47.0, 51.0, 75.0, 73.0, 89.0, 76.0, 92.0, 82.0, 91.0, 66.0, 48.0, 45.0, 26.0, 27.0, 12.0, 11.0, 16.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.449951171875, -0.4287376403808594, -0.40752410888671875, -0.3863105773925781, -0.3650970458984375, -0.3438835144042969, -0.32266998291015625, -0.3014564514160156, -0.280242919921875, -0.2590293884277344, -0.23781585693359375, -0.21660232543945312, -0.1953887939453125, -0.17417526245117188, -0.15296173095703125, -0.13174819946289062, -0.11053466796875, -0.08932113647460938, -0.06810760498046875, -0.046894073486328125, -0.0256805419921875, -0.004467010498046875, 0.01674652099609375, 0.037960052490234375, 0.059173583984375, 0.08038711547851562, 0.10160064697265625, 0.12281417846679688, 0.1440277099609375, 0.16524124145507812, 0.18645477294921875, 0.20766830444335938, 0.2288818359375, 0.2500953674316406, 0.27130889892578125, 0.2925224304199219, 0.3137359619140625, 0.3349494934082031, 0.35616302490234375, 0.3773765563964844, 0.398590087890625, 0.4198036193847656, 0.44101715087890625, 0.4622306823730469, 0.4834442138671875, 0.5046577453613281, 0.5258712768554688, 0.5470848083496094, 0.56829833984375, 0.5895118713378906, 0.6107254028320312, 0.6319389343261719, 0.6531524658203125, 0.6743659973144531, 0.6955795288085938, 0.7167930603027344, 0.738006591796875, 0.7592201232910156, 0.7804336547851562, 0.8016471862792969, 0.8228607177734375, 0.8440742492675781, 0.8652877807617188, 0.8865013122558594, 0.90771484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 14.0, 16.0, 26.0, 41.0, 48.0, 72.0, 105.0, 158.0, 250.0, 449.0, 700.0, 1223.0, 2303.0, 5251.0, 12652.0, 37026.0, 129057.0, 421807.0, 309762.0, 84410.0, 25481.0, 9161.0, 3956.0, 1913.0, 1017.0, 600.0, 351.0, 223.0, 146.0, 100.0, 77.0, 39.0, 34.0, 23.0, 15.0, 13.0, 4.0, 7.0, 5.0, 3.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.970703125, -1.9124603271484375, -1.854217529296875, -1.7959747314453125, -1.73773193359375, -1.6794891357421875, -1.621246337890625, -1.5630035400390625, -1.5047607421875, -1.4465179443359375, -1.388275146484375, -1.3300323486328125, -1.27178955078125, -1.2135467529296875, -1.155303955078125, -1.0970611572265625, -1.038818359375, -0.9805755615234375, -0.922332763671875, -0.8640899658203125, -0.80584716796875, -0.7476043701171875, -0.689361572265625, -0.6311187744140625, -0.5728759765625, -0.5146331787109375, -0.456390380859375, -0.3981475830078125, -0.33990478515625, -0.2816619873046875, -0.223419189453125, -0.1651763916015625, -0.10693359375, -0.0486907958984375, 0.009552001953125, 0.0677947998046875, 0.12603759765625, 0.1842803955078125, 0.242523193359375, 0.3007659912109375, 0.3590087890625, 0.4172515869140625, 0.475494384765625, 0.5337371826171875, 0.59197998046875, 0.6502227783203125, 0.708465576171875, 0.7667083740234375, 0.824951171875, 0.8831939697265625, 0.941436767578125, 0.9996795654296875, 1.05792236328125, 1.1161651611328125, 1.174407958984375, 1.2326507568359375, 1.2908935546875, 1.3491363525390625, 1.407379150390625, 1.4656219482421875, 1.52386474609375, 1.5821075439453125, 1.640350341796875, 1.6985931396484375, 1.7568359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 2.0, 7.0, 4.0, 7.0, 5.0, 12.0, 16.0, 24.0, 23.0, 18.0, 28.0, 25.0, 36.0, 35.0, 33.0, 51.0, 46.0, 36.0, 53.0, 40.0, 47.0, 42.0, 47.0, 47.0, 36.0, 41.0, 28.0, 31.0, 17.0, 26.0, 23.0, 19.0, 12.0, 11.0, 20.0, 14.0, 6.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.54296875, -1.4871826171875, -1.431396484375, -1.3756103515625, -1.31982421875, -1.2640380859375, -1.208251953125, -1.1524658203125, -1.0966796875, -1.0408935546875, -0.985107421875, -0.9293212890625, -0.87353515625, -0.8177490234375, -0.761962890625, -0.7061767578125, -0.650390625, -0.5946044921875, -0.538818359375, -0.4830322265625, -0.42724609375, -0.3714599609375, -0.315673828125, -0.2598876953125, -0.2041015625, -0.1483154296875, -0.092529296875, -0.0367431640625, 0.01904296875, 0.0748291015625, 0.130615234375, 0.1864013671875, 0.2421875, 0.2979736328125, 0.353759765625, 0.4095458984375, 0.46533203125, 0.5211181640625, 0.576904296875, 0.6326904296875, 0.6884765625, 0.7442626953125, 0.800048828125, 0.8558349609375, 0.91162109375, 0.9674072265625, 1.023193359375, 1.0789794921875, 1.134765625, 1.1905517578125, 1.246337890625, 1.3021240234375, 1.35791015625, 1.4136962890625, 1.469482421875, 1.5252685546875, 1.5810546875, 1.6368408203125, 1.692626953125, 1.7484130859375, 1.80419921875, 1.8599853515625, 1.915771484375, 1.9715576171875, 2.02734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 12.0, 5.0, 12.0, 14.0, 22.0, 31.0, 43.0, 55.0, 105.0, 169.0, 251.0, 429.0, 710.0, 1370.0, 2649.0, 5967.0, 18090.0, 85637.0, 544238.0, 320092.0, 47473.0, 11984.0, 4376.0, 2095.0, 1130.0, 601.0, 389.0, 203.0, 128.0, 99.0, 54.0, 35.0, 27.0, 23.0, 14.0, 3.0, 9.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96484375, -0.9363250732421875, -0.907806396484375, -0.8792877197265625, -0.85076904296875, -0.8222503662109375, -0.793731689453125, -0.7652130126953125, -0.7366943359375, -0.7081756591796875, -0.679656982421875, -0.6511383056640625, -0.62261962890625, -0.5941009521484375, -0.565582275390625, -0.5370635986328125, -0.508544921875, -0.4800262451171875, -0.451507568359375, -0.4229888916015625, -0.39447021484375, -0.3659515380859375, -0.337432861328125, -0.3089141845703125, -0.2803955078125, -0.2518768310546875, -0.223358154296875, -0.1948394775390625, -0.16632080078125, -0.1378021240234375, -0.109283447265625, -0.0807647705078125, -0.05224609375, -0.0237274169921875, 0.004791259765625, 0.0333099365234375, 0.06182861328125, 0.0903472900390625, 0.118865966796875, 0.1473846435546875, 0.1759033203125, 0.2044219970703125, 0.232940673828125, 0.2614593505859375, 0.28997802734375, 0.3184967041015625, 0.347015380859375, 0.3755340576171875, 0.404052734375, 0.4325714111328125, 0.461090087890625, 0.4896087646484375, 0.51812744140625, 0.5466461181640625, 0.575164794921875, 0.6036834716796875, 0.6322021484375, 0.6607208251953125, 0.689239501953125, 0.7177581787109375, 0.74627685546875, 0.7747955322265625, 0.803314208984375, 0.8318328857421875, 0.8603515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 20.0, 27.0, 53.0, 121.0, 238.0, 257.0, 122.0, 66.0, 38.0, 23.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005965232849121094, -0.0005804263055324554, -0.0005643293261528015, -0.0005482323467731476, -0.0005321353673934937, -0.0005160383880138397, -0.0004999414086341858, -0.00048384442925453186, -0.00046774744987487793, -0.000451650470495224, -0.00043555349111557007, -0.00041945651173591614, -0.0004033595323562622, -0.0003872625529766083, -0.00037116557359695435, -0.0003550685942173004, -0.0003389716148376465, -0.00032287463545799255, -0.0003067776560783386, -0.0002906806766986847, -0.00027458369731903076, -0.00025848671793937683, -0.0002423897385597229, -0.00022629275918006897, -0.00021019577980041504, -0.0001940988004207611, -0.00017800182104110718, -0.00016190484166145325, -0.00014580786228179932, -0.00012971088290214539, -0.00011361390352249146, -9.751692414283752e-05, -8.14199447631836e-05, -6.532296538352966e-05, -4.922598600387573e-05, -3.31290066242218e-05, -1.703202724456787e-05, -9.350478649139404e-07, 1.516193151473999e-05, 3.125891089439392e-05, 4.735589027404785e-05, 6.345286965370178e-05, 7.954984903335571e-05, 9.564682841300964e-05, 0.00011174380779266357, 0.0001278407871723175, 0.00014393776655197144, 0.00016003474593162537, 0.0001761317253112793, 0.00019222870469093323, 0.00020832568407058716, 0.0002244226634502411, 0.00024051964282989502, 0.00025661662220954895, 0.0002727136015892029, 0.0002888105809688568, 0.00030490756034851074, 0.00032100453972816467, 0.0003371015191078186, 0.00035319849848747253, 0.00036929547786712646, 0.0003853924572467804, 0.0004014894366264343, 0.00041758641600608826, 0.0004336833953857422]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 10.0, 12.0, 16.0, 29.0, 31.0, 47.0, 94.0, 154.0, 287.0, 476.0, 918.0, 1841.0, 3998.0, 10356.0, 34415.0, 170688.0, 601724.0, 170482.0, 34293.0, 10512.0, 4134.0, 1861.0, 948.0, 486.0, 281.0, 153.0, 101.0, 60.0, 46.0, 35.0, 20.0, 10.0, 12.0, 2.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.826171875, -0.800750732421875, -0.77532958984375, -0.749908447265625, -0.7244873046875, -0.699066162109375, -0.67364501953125, -0.648223876953125, -0.622802734375, -0.597381591796875, -0.57196044921875, -0.546539306640625, -0.5211181640625, -0.495697021484375, -0.47027587890625, -0.444854736328125, -0.41943359375, -0.394012451171875, -0.36859130859375, -0.343170166015625, -0.3177490234375, -0.292327880859375, -0.26690673828125, -0.241485595703125, -0.216064453125, -0.190643310546875, -0.16522216796875, -0.139801025390625, -0.1143798828125, -0.088958740234375, -0.06353759765625, -0.038116455078125, -0.0126953125, 0.012725830078125, 0.03814697265625, 0.063568115234375, 0.0889892578125, 0.114410400390625, 0.13983154296875, 0.165252685546875, 0.190673828125, 0.216094970703125, 0.24151611328125, 0.266937255859375, 0.2923583984375, 0.317779541015625, 0.34320068359375, 0.368621826171875, 0.39404296875, 0.419464111328125, 0.44488525390625, 0.470306396484375, 0.4957275390625, 0.521148681640625, 0.54656982421875, 0.571990966796875, 0.597412109375, 0.622833251953125, 0.64825439453125, 0.673675537109375, 0.6990966796875, 0.724517822265625, 0.74993896484375, 0.775360107421875, 0.80078125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 3.0, 3.0, 4.0, 9.0, 17.0, 20.0, 22.0, 36.0, 67.0, 48.0, 54.0, 84.0, 104.0, 106.0, 78.0, 78.0, 49.0, 51.0, 37.0, 24.0, 25.0, 20.0, 15.0, 9.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4704475402832031, -0.45236968994140625, -0.4342918395996094, -0.4162139892578125, -0.3981361389160156, -0.38005828857421875, -0.3619804382324219, -0.343902587890625, -0.3258247375488281, -0.30774688720703125, -0.2896690368652344, -0.2715911865234375, -0.2535133361816406, -0.23543548583984375, -0.21735763549804688, -0.19927978515625, -0.18120193481445312, -0.16312408447265625, -0.14504623413085938, -0.1269683837890625, -0.10889053344726562, -0.09081268310546875, -0.07273483276367188, -0.054656982421875, -0.036579132080078125, -0.01850128173828125, -0.000423431396484375, 0.0176544189453125, 0.035732269287109375, 0.05381011962890625, 0.07188796997070312, 0.0899658203125, 0.10804367065429688, 0.12612152099609375, 0.14419937133789062, 0.1622772216796875, 0.18035507202148438, 0.19843292236328125, 0.21651077270507812, 0.234588623046875, 0.2526664733886719, 0.27074432373046875, 0.2888221740722656, 0.3069000244140625, 0.3249778747558594, 0.34305572509765625, 0.3611335754394531, 0.37921142578125, 0.3972892761230469, 0.41536712646484375, 0.4334449768066406, 0.4515228271484375, 0.4696006774902344, 0.48767852783203125, 0.5057563781738281, 0.523834228515625, 0.5419120788574219, 0.5599899291992188, 0.5780677795410156, 0.5961456298828125, 0.6142234802246094, 0.6323013305664062, 0.6503791809082031, 0.66845703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 9.0, 8.0, 11.0, 38.0, 57.0, 115.0, 156.0, 200.0, 145.0, 130.0, 58.0, 28.0, 16.0, 13.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.807180404663086, -15.2871732711792, -14.767166137695312, -14.247159004211426, -13.727151870727539, -13.207144737243652, -12.687137603759766, -12.167130470275879, -11.647123336791992, -11.127116203308105, -10.607109069824219, -10.087101936340332, -9.567094802856445, -9.047087669372559, -8.527080535888672, -8.007073402404785, -7.487066268920898, -6.967059135437012, -6.447052001953125, -5.927044868469238, -5.407037734985352, -4.887030601501465, -4.367023468017578, -3.8470163345336914, -3.3270092010498047, -2.807002067565918, -2.2869949340820312, -1.7669878005981445, -1.2469806671142578, -0.7269735336303711, -0.20696640014648438, 0.31304073333740234, 0.8330459594726562, 1.353053092956543, 1.8730602264404297, 2.3930673599243164, 2.913074493408203, 3.43308162689209, 3.9530887603759766, 4.473095893859863, 4.99310302734375, 5.513110160827637, 6.033117294311523, 6.55312442779541, 7.073131561279297, 7.593138694763184, 8.11314582824707, 8.633152961730957, 9.153160095214844, 9.67316722869873, 10.193174362182617, 10.713181495666504, 11.23318862915039, 11.753195762634277, 12.273202896118164, 12.79321002960205, 13.313217163085938, 13.833224296569824, 14.353231430053711, 14.873238563537598, 15.393245697021484, 15.913252830505371, 16.433259963989258, 16.953266143798828, 17.47327423095703]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 16.0, 17.0, 21.0, 28.0, 37.0, 44.0, 48.0, 46.0, 59.0, 47.0, 60.0, 65.0, 66.0, 83.0, 54.0, 46.0, 44.0, 31.0, 40.0, 29.0, 27.0, 32.0, 12.0, 7.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.353472709655762, -12.922558784484863, -12.491644859313965, -12.060730934143066, -11.629817008972168, -11.19890308380127, -10.767989158630371, -10.337075233459473, -9.906161308288574, -9.475247383117676, -9.044333457946777, -8.613419532775879, -8.18250560760498, -7.751591682434082, -7.320677757263184, -6.889763832092285, -6.458850383758545, -6.0279364585876465, -5.597022533416748, -5.16610860824585, -4.735194683074951, -4.304281234741211, -3.8733670711517334, -3.442453145980835, -3.0115392208099365, -2.580625295639038, -2.1497113704681396, -1.7187975645065308, -1.2878836393356323, -0.8569698333740234, -0.426055908203125, 0.0048580169677734375, 0.4357719421386719, 0.8666858673095703, 1.2975997924804688, 1.7285135984420776, 2.1594276428222656, 2.590341329574585, 3.0212552547454834, 3.452169179916382, 3.8830831050872803, 4.3139967918396, 4.744910717010498, 5.1758246421813965, 5.606738567352295, 6.037652492523193, 6.468566417694092, 6.89948034286499, 7.330394268035889, 7.761308193206787, 8.192221641540527, 8.623135566711426, 9.054049491882324, 9.484963417053223, 9.915877342224121, 10.34679126739502, 10.777705192565918, 11.208619117736816, 11.639533042907715, 12.070446968078613, 12.501360893249512, 12.93227481842041, 13.363188743591309, 13.794102668762207, 14.225016593933105]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [9.0, 2.0, 15.0, 35.0, 75.0, 145.0, 319.0, 759.0, 2150.0, 7463.0, 36077.0, 3601178.0, 513302.0, 23679.0, 5607.0, 1826.0, 725.0, 311.0, 148.0, 100.0, 77.0, 51.0, 38.0, 17.0, 24.0, 14.0, 16.0, 16.0, 16.0, 9.0, 5.0, 12.0, 7.0, 8.0, 6.0, 4.0, 4.0, 6.0, 8.0, 6.0, 4.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9833984375, -1.8166656494140625, -1.649932861328125, -1.4832000732421875, -1.31646728515625, -1.1497344970703125, -0.983001708984375, -0.8162689208984375, -0.6495361328125, -0.4828033447265625, -0.316070556640625, -0.1493377685546875, 0.01739501953125, 0.1841278076171875, 0.350860595703125, 0.5175933837890625, 0.684326171875, 0.8510589599609375, 1.017791748046875, 1.1845245361328125, 1.35125732421875, 1.5179901123046875, 1.684722900390625, 1.8514556884765625, 2.0181884765625, 2.1849212646484375, 2.351654052734375, 2.5183868408203125, 2.68511962890625, 2.8518524169921875, 3.018585205078125, 3.1853179931640625, 3.35205078125, 3.5187835693359375, 3.685516357421875, 3.8522491455078125, 4.01898193359375, 4.1857147216796875, 4.352447509765625, 4.5191802978515625, 4.6859130859375, 4.8526458740234375, 5.019378662109375, 5.1861114501953125, 5.35284423828125, 5.5195770263671875, 5.686309814453125, 5.8530426025390625, 6.019775390625, 6.1865081787109375, 6.353240966796875, 6.5199737548828125, 6.68670654296875, 6.8534393310546875, 7.020172119140625, 7.1869049072265625, 7.3536376953125, 7.5203704833984375, 7.687103271484375, 7.8538360595703125, 8.02056884765625, 8.187301635742188, 8.354034423828125, 8.520767211914062, 8.6875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 10.0, 24.0, 24.0, 29.0, 38.0, 42.0, 70.0, 84.0, 80.0, 81.0, 94.0, 91.0, 74.0, 70.0, 49.0, 26.0, 32.0, 29.0, 15.0, 10.0, 4.0, 9.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.4436798095703125, -0.422515869140625, -0.4013519287109375, -0.38018798828125, -0.3590240478515625, -0.337860107421875, -0.3166961669921875, -0.2955322265625, -0.2743682861328125, -0.253204345703125, -0.2320404052734375, -0.21087646484375, -0.1897125244140625, -0.168548583984375, -0.1473846435546875, -0.126220703125, -0.1050567626953125, -0.083892822265625, -0.0627288818359375, -0.04156494140625, -0.0204010009765625, 0.000762939453125, 0.0219268798828125, 0.0430908203125, 0.0642547607421875, 0.085418701171875, 0.1065826416015625, 0.12774658203125, 0.1489105224609375, 0.170074462890625, 0.1912384033203125, 0.21240234375, 0.2335662841796875, 0.254730224609375, 0.2758941650390625, 0.29705810546875, 0.3182220458984375, 0.339385986328125, 0.3605499267578125, 0.3817138671875, 0.4028778076171875, 0.424041748046875, 0.4452056884765625, 0.46636962890625, 0.4875335693359375, 0.508697509765625, 0.5298614501953125, 0.551025390625, 0.5721893310546875, 0.593353271484375, 0.6145172119140625, 0.63568115234375, 0.6568450927734375, 0.678009033203125, 0.6991729736328125, 0.7203369140625, 0.7415008544921875, 0.762664794921875, 0.7838287353515625, 0.80499267578125, 0.8261566162109375, 0.847320556640625, 0.8684844970703125, 0.8896484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 16.0, 15.0, 23.0, 33.0, 43.0, 72.0, 168.0, 279.0, 512.0, 982.0, 2700.0, 10109.0, 90500.0, 4023760.0, 51705.0, 8343.0, 2537.0, 1096.0, 585.0, 257.0, 187.0, 129.0, 71.0, 50.0, 25.0, 20.0, 15.0, 6.0, 11.0, 8.0, 4.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.439453125, -5.20703125, -4.974609375, -4.7421875, -4.509765625, -4.27734375, -4.044921875, -3.8125, -3.580078125, -3.34765625, -3.115234375, -2.8828125, -2.650390625, -2.41796875, -2.185546875, -1.953125, -1.720703125, -1.48828125, -1.255859375, -1.0234375, -0.791015625, -0.55859375, -0.326171875, -0.09375, 0.138671875, 0.37109375, 0.603515625, 0.8359375, 1.068359375, 1.30078125, 1.533203125, 1.765625, 1.998046875, 2.23046875, 2.462890625, 2.6953125, 2.927734375, 3.16015625, 3.392578125, 3.625, 3.857421875, 4.08984375, 4.322265625, 4.5546875, 4.787109375, 5.01953125, 5.251953125, 5.484375, 5.716796875, 5.94921875, 6.181640625, 6.4140625, 6.646484375, 6.87890625, 7.111328125, 7.34375, 7.576171875, 7.80859375, 8.041015625, 8.2734375, 8.505859375, 8.73828125, 8.970703125, 9.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 11.0, 18.0, 39.0, 83.0, 188.0, 897.0, 2274.0, 318.0, 89.0, 54.0, 18.0, 21.0, 15.0, 8.0, 8.0, 9.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69921875, -1.63189697265625, -1.5645751953125, -1.49725341796875, -1.429931640625, -1.36260986328125, -1.2952880859375, -1.22796630859375, -1.16064453125, -1.09332275390625, -1.0260009765625, -0.95867919921875, -0.891357421875, -0.82403564453125, -0.7567138671875, -0.68939208984375, -0.6220703125, -0.55474853515625, -0.4874267578125, -0.42010498046875, -0.352783203125, -0.28546142578125, -0.2181396484375, -0.15081787109375, -0.08349609375, -0.01617431640625, 0.0511474609375, 0.11846923828125, 0.185791015625, 0.25311279296875, 0.3204345703125, 0.38775634765625, 0.455078125, 0.52239990234375, 0.5897216796875, 0.65704345703125, 0.724365234375, 0.79168701171875, 0.8590087890625, 0.92633056640625, 0.99365234375, 1.06097412109375, 1.1282958984375, 1.19561767578125, 1.262939453125, 1.33026123046875, 1.3975830078125, 1.46490478515625, 1.5322265625, 1.59954833984375, 1.6668701171875, 1.73419189453125, 1.801513671875, 1.86883544921875, 1.9361572265625, 2.00347900390625, 2.07080078125, 2.13812255859375, 2.2054443359375, 2.27276611328125, 2.340087890625, 2.40740966796875, 2.4747314453125, 2.54205322265625, 2.609375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 24.0, 41.0, 180.0, 453.0, 194.0, 52.0, 30.0, 14.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.857412338256836, -18.12146759033203, -17.38552474975586, -16.649580001831055, -15.91363525390625, -15.177690505981445, -14.441746711730957, -13.705802917480469, -12.969858169555664, -12.23391342163086, -11.497969627380371, -10.762025833129883, -10.026081085205078, -9.290136337280273, -8.554192543029785, -7.818248271942139, -7.082304000854492, -6.346359729766846, -5.610415458679199, -4.874471187591553, -4.138526916503906, -3.4025826454162598, -2.6666383743286133, -1.9306941032409668, -1.1947498321533203, -0.45880556106567383, 0.27713871002197266, 1.0130829811096191, 1.7490272521972656, 2.484971523284912, 3.2209157943725586, 3.956860065460205, 4.692804336547852, 5.428748607635498, 6.1646928787231445, 6.900637149810791, 7.6365814208984375, 8.372526168823242, 9.10846996307373, 9.844413757324219, 10.580358505249023, 11.316303253173828, 12.052247047424316, 12.788190841674805, 13.52413558959961, 14.260080337524414, 14.996024131774902, 15.73196792602539, 16.467912673950195, 17.203857421875, 17.939800262451172, 18.675745010375977, 19.41168975830078, 20.147634506225586, 20.88357925415039, 21.619522094726562, 22.355466842651367, 23.091411590576172, 23.827354431152344, 24.56329917907715, 25.299243927001953, 26.035188674926758, 26.771133422851562, 27.507076263427734, 28.24302101135254]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 9.0, 14.0, 22.0, 50.0, 56.0, 67.0, 107.0, 122.0, 81.0, 105.0, 92.0, 81.0, 48.0, 55.0, 29.0, 24.0, 15.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.242618560791016, -9.925421714782715, -9.608223915100098, -9.291027069091797, -8.97382926940918, -8.656632423400879, -8.339434623718262, -8.022237777709961, -7.705040454864502, -7.387843132019043, -7.070645809173584, -6.753448486328125, -6.436251640319824, -6.119053840637207, -5.801856994628906, -5.484659671783447, -5.167462348937988, -4.850265026092529, -4.53306770324707, -4.215870380401611, -3.8986732959747314, -3.5814759731292725, -3.2642788887023926, -2.9470815658569336, -2.6298842430114746, -2.3126869201660156, -1.9954897165298462, -1.6782925128936768, -1.3610951900482178, -1.0438978672027588, -0.7267006635665894, -0.4095034599304199, -0.09230518341064453, 0.22489207983016968, 0.5420893430709839, 0.8592866063117981, 1.1764838695526123, 1.4936811923980713, 1.8108783960342407, 2.12807559967041, 2.445272922515869, 2.762470245361328, 3.079667568206787, 3.396864652633667, 3.714061975479126, 4.031259536743164, 4.348456382751465, 4.665653705596924, 4.982851028442383, 5.300048351287842, 5.617245674133301, 5.93444299697876, 6.251640319824219, 6.5688371658325195, 6.8860344886779785, 7.2032318115234375, 7.5204291343688965, 7.8376264572143555, 8.154823303222656, 8.472021102905273, 8.789217948913574, 9.106415748596191, 9.423612594604492, 9.74081039428711, 10.05800724029541]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 7.0, 5.0, 17.0, 20.0, 19.0, 36.0, 63.0, 90.0, 149.0, 306.0, 607.0, 1735.0, 6606.0, 61939.0, 812778.0, 148825.0, 11278.0, 2373.0, 850.0, 346.0, 190.0, 100.0, 64.0, 45.0, 31.0, 15.0, 18.0, 15.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0], "bins": [-7.3046875, -7.11566162109375, -6.9266357421875, -6.73760986328125, -6.548583984375, -6.35955810546875, -6.1705322265625, -5.98150634765625, -5.79248046875, -5.60345458984375, -5.4144287109375, -5.22540283203125, -5.036376953125, -4.84735107421875, -4.6583251953125, -4.46929931640625, -4.2802734375, -4.09124755859375, -3.9022216796875, -3.71319580078125, -3.524169921875, -3.33514404296875, -3.1461181640625, -2.95709228515625, -2.76806640625, -2.57904052734375, -2.3900146484375, -2.20098876953125, -2.011962890625, -1.82293701171875, -1.6339111328125, -1.44488525390625, -1.255859375, -1.06683349609375, -0.8778076171875, -0.68878173828125, -0.499755859375, -0.31072998046875, -0.1217041015625, 0.06732177734375, 0.25634765625, 0.44537353515625, 0.6343994140625, 0.82342529296875, 1.012451171875, 1.20147705078125, 1.3905029296875, 1.57952880859375, 1.7685546875, 1.95758056640625, 2.1466064453125, 2.33563232421875, 2.524658203125, 2.71368408203125, 2.9027099609375, 3.09173583984375, 3.28076171875, 3.46978759765625, 3.6588134765625, 3.84783935546875, 4.036865234375, 4.22589111328125, 4.4149169921875, 4.60394287109375, 4.79296875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 14.0, 15.0, 23.0, 24.0, 42.0, 37.0, 51.0, 75.0, 83.0, 91.0, 87.0, 96.0, 65.0, 71.0, 46.0, 49.0, 35.0, 22.0, 27.0, 16.0, 15.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59716796875, -0.576202392578125, -0.55523681640625, -0.534271240234375, -0.5133056640625, -0.492340087890625, -0.47137451171875, -0.450408935546875, -0.429443359375, -0.408477783203125, -0.38751220703125, -0.366546630859375, -0.3455810546875, -0.324615478515625, -0.30364990234375, -0.282684326171875, -0.26171875, -0.240753173828125, -0.21978759765625, -0.198822021484375, -0.1778564453125, -0.156890869140625, -0.13592529296875, -0.114959716796875, -0.093994140625, -0.073028564453125, -0.05206298828125, -0.031097412109375, -0.0101318359375, 0.010833740234375, 0.03179931640625, 0.052764892578125, 0.07373046875, 0.094696044921875, 0.11566162109375, 0.136627197265625, 0.1575927734375, 0.178558349609375, 0.19952392578125, 0.220489501953125, 0.241455078125, 0.262420654296875, 0.28338623046875, 0.304351806640625, 0.3253173828125, 0.346282958984375, 0.36724853515625, 0.388214111328125, 0.4091796875, 0.430145263671875, 0.45111083984375, 0.472076416015625, 0.4930419921875, 0.514007568359375, 0.53497314453125, 0.555938720703125, 0.576904296875, 0.597869873046875, 0.61883544921875, 0.639801025390625, 0.6607666015625, 0.681732177734375, 0.70269775390625, 0.723663330078125, 0.74462890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 11.0, 9.0, 12.0, 23.0, 28.0, 40.0, 74.0, 102.0, 142.0, 173.0, 297.0, 418.0, 622.0, 1040.0, 1605.0, 2755.0, 4730.0, 8852.0, 17057.0, 34292.0, 72928.0, 161574.0, 310552.0, 228520.0, 103218.0, 48053.0, 23716.0, 11984.0, 6472.0, 3548.0, 2051.0, 1305.0, 772.0, 514.0, 316.0, 217.0, 163.0, 95.0, 66.0, 49.0, 37.0, 26.0, 22.0, 14.0, 11.0, 10.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.11328125, -1.0770416259765625, -1.040802001953125, -1.0045623779296875, -0.96832275390625, -0.9320831298828125, -0.895843505859375, -0.8596038818359375, -0.8233642578125, -0.7871246337890625, -0.750885009765625, -0.7146453857421875, -0.67840576171875, -0.6421661376953125, -0.605926513671875, -0.5696868896484375, -0.533447265625, -0.4972076416015625, -0.460968017578125, -0.4247283935546875, -0.38848876953125, -0.3522491455078125, -0.316009521484375, -0.2797698974609375, -0.2435302734375, -0.2072906494140625, -0.171051025390625, -0.1348114013671875, -0.09857177734375, -0.0623321533203125, -0.026092529296875, 0.0101470947265625, 0.04638671875, 0.0826263427734375, 0.118865966796875, 0.1551055908203125, 0.19134521484375, 0.2275848388671875, 0.263824462890625, 0.3000640869140625, 0.3363037109375, 0.3725433349609375, 0.408782958984375, 0.4450225830078125, 0.48126220703125, 0.5175018310546875, 0.553741455078125, 0.5899810791015625, 0.626220703125, 0.6624603271484375, 0.698699951171875, 0.7349395751953125, 0.77117919921875, 0.8074188232421875, 0.843658447265625, 0.8798980712890625, 0.9161376953125, 0.9523773193359375, 0.988616943359375, 1.0248565673828125, 1.06109619140625, 1.0973358154296875, 1.133575439453125, 1.1698150634765625, 1.2060546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 0.0, 3.0, 4.0, 6.0, 8.0, 9.0, 9.0, 10.0, 8.0, 17.0, 21.0, 24.0, 23.0, 29.0, 28.0, 26.0, 33.0, 27.0, 42.0, 41.0, 46.0, 35.0, 28.0, 38.0, 43.0, 43.0, 34.0, 41.0, 28.0, 37.0, 36.0, 26.0, 32.0, 28.0, 12.0, 19.0, 23.0, 25.0, 12.0, 10.0, 10.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8623046875, -1.8105621337890625, -1.758819580078125, -1.7070770263671875, -1.65533447265625, -1.6035919189453125, -1.551849365234375, -1.5001068115234375, -1.4483642578125, -1.3966217041015625, -1.344879150390625, -1.2931365966796875, -1.24139404296875, -1.1896514892578125, -1.137908935546875, -1.0861663818359375, -1.034423828125, -0.9826812744140625, -0.930938720703125, -0.8791961669921875, -0.82745361328125, -0.7757110595703125, -0.723968505859375, -0.6722259521484375, -0.6204833984375, -0.5687408447265625, -0.516998291015625, -0.4652557373046875, -0.41351318359375, -0.3617706298828125, -0.310028076171875, -0.2582855224609375, -0.20654296875, -0.1548004150390625, -0.103057861328125, -0.0513153076171875, 0.00042724609375, 0.0521697998046875, 0.103912353515625, 0.1556549072265625, 0.2073974609375, 0.2591400146484375, 0.310882568359375, 0.3626251220703125, 0.41436767578125, 0.4661102294921875, 0.517852783203125, 0.5695953369140625, 0.621337890625, 0.6730804443359375, 0.724822998046875, 0.7765655517578125, 0.82830810546875, 0.8800506591796875, 0.931793212890625, 0.9835357666015625, 1.0352783203125, 1.0870208740234375, 1.138763427734375, 1.1905059814453125, 1.24224853515625, 1.2939910888671875, 1.345733642578125, 1.3974761962890625, 1.44921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 6.0, 3.0, 10.0, 7.0, 13.0, 24.0, 19.0, 36.0, 61.0, 93.0, 143.0, 257.0, 552.0, 850.0, 1852.0, 4109.0, 11038.0, 36045.0, 179424.0, 631735.0, 135890.0, 29688.0, 9412.0, 3735.0, 1655.0, 816.0, 390.0, 270.0, 145.0, 87.0, 62.0, 41.0, 24.0, 14.0, 12.0, 7.0, 8.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8282012939453125, -0.798004150390625, -0.7678070068359375, -0.73760986328125, -0.7074127197265625, -0.677215576171875, -0.6470184326171875, -0.6168212890625, -0.5866241455078125, -0.556427001953125, -0.5262298583984375, -0.49603271484375, -0.4658355712890625, -0.435638427734375, -0.4054412841796875, -0.375244140625, -0.3450469970703125, -0.314849853515625, -0.2846527099609375, -0.25445556640625, -0.2242584228515625, -0.194061279296875, -0.1638641357421875, -0.1336669921875, -0.1034698486328125, -0.073272705078125, -0.0430755615234375, -0.01287841796875, 0.0173187255859375, 0.047515869140625, 0.0777130126953125, 0.10791015625, 0.1381072998046875, 0.168304443359375, 0.1985015869140625, 0.22869873046875, 0.2588958740234375, 0.289093017578125, 0.3192901611328125, 0.3494873046875, 0.3796844482421875, 0.409881591796875, 0.4400787353515625, 0.47027587890625, 0.5004730224609375, 0.530670166015625, 0.5608673095703125, 0.591064453125, 0.6212615966796875, 0.651458740234375, 0.6816558837890625, 0.71185302734375, 0.7420501708984375, 0.772247314453125, 0.8024444580078125, 0.8326416015625, 0.8628387451171875, 0.893035888671875, 0.9232330322265625, 0.95343017578125, 0.9836273193359375, 1.013824462890625, 1.0440216064453125, 1.07421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 4.0, 10.0, 13.0, 9.0, 25.0, 21.0, 24.0, 44.0, 108.0, 166.0, 223.0, 116.0, 59.0, 50.0, 31.0, 19.0, 29.0, 5.0, 12.0, 13.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00030303001403808594, -0.00029361993074417114, -0.00028420984745025635, -0.00027479976415634155, -0.00026538968086242676, -0.00025597959756851196, -0.00024656951427459717, -0.00023715943098068237, -0.00022774934768676758, -0.00021833926439285278, -0.000208929181098938, -0.0001995190978050232, -0.0001901090145111084, -0.0001806989312171936, -0.0001712888479232788, -0.00016187876462936401, -0.00015246868133544922, -0.00014305859804153442, -0.00013364851474761963, -0.00012423843145370483, -0.00011482834815979004, -0.00010541826486587524, -9.600818157196045e-05, -8.659809827804565e-05, -7.718801498413086e-05, -6.777793169021606e-05, -5.836784839630127e-05, -4.8957765102386475e-05, -3.954768180847168e-05, -3.0137598514556885e-05, -2.072751522064209e-05, -1.1317431926727295e-05, -1.9073486328125e-06, 7.502734661102295e-06, 1.691281795501709e-05, 2.6322901248931885e-05, 3.573298454284668e-05, 4.5143067836761475e-05, 5.455315113067627e-05, 6.396323442459106e-05, 7.337331771850586e-05, 8.278340101242065e-05, 9.219348430633545e-05, 0.00010160356760025024, 0.00011101365089416504, 0.00012042373418807983, 0.00012983381748199463, 0.00013924390077590942, 0.00014865398406982422, 0.00015806406736373901, 0.0001674741506576538, 0.0001768842339515686, 0.0001862943172454834, 0.0001957044005393982, 0.000205114483833313, 0.00021452456712722778, 0.00022393465042114258, 0.00023334473371505737, 0.00024275481700897217, 0.00025216490030288696, 0.00026157498359680176, 0.00027098506689071655, 0.00028039515018463135, 0.00028980523347854614, 0.00029921531677246094]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 16.0, 19.0, 19.0, 42.0, 49.0, 72.0, 124.0, 192.0, 321.0, 705.0, 1562.0, 4021.0, 12441.0, 50966.0, 382087.0, 509106.0, 63859.0, 14738.0, 4812.0, 1767.0, 674.0, 348.0, 204.0, 133.0, 87.0, 63.0, 38.0, 23.0, 19.0, 7.0, 5.0, 7.0, 5.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.1611328125, -1.128021240234375, -1.09490966796875, -1.061798095703125, -1.0286865234375, -0.995574951171875, -0.96246337890625, -0.929351806640625, -0.896240234375, -0.863128662109375, -0.83001708984375, -0.796905517578125, -0.7637939453125, -0.730682373046875, -0.69757080078125, -0.664459228515625, -0.63134765625, -0.598236083984375, -0.56512451171875, -0.532012939453125, -0.4989013671875, -0.465789794921875, -0.43267822265625, -0.399566650390625, -0.366455078125, -0.333343505859375, -0.30023193359375, -0.267120361328125, -0.2340087890625, -0.200897216796875, -0.16778564453125, -0.134674072265625, -0.1015625, -0.068450927734375, -0.03533935546875, -0.002227783203125, 0.0308837890625, 0.063995361328125, 0.09710693359375, 0.130218505859375, 0.163330078125, 0.196441650390625, 0.22955322265625, 0.262664794921875, 0.2957763671875, 0.328887939453125, 0.36199951171875, 0.395111083984375, 0.42822265625, 0.461334228515625, 0.49444580078125, 0.527557373046875, 0.5606689453125, 0.593780517578125, 0.62689208984375, 0.660003662109375, 0.693115234375, 0.726226806640625, 0.75933837890625, 0.792449951171875, 0.8255615234375, 0.858673095703125, 0.89178466796875, 0.924896240234375, 0.9580078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 14.0, 14.0, 15.0, 25.0, 27.0, 50.0, 61.0, 75.0, 117.0, 106.0, 126.0, 100.0, 67.0, 62.0, 30.0, 24.0, 17.0, 13.0, 9.0, 13.0, 11.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.5975341796875, -0.574462890625, -0.5513916015625, -0.5283203125, -0.5052490234375, -0.482177734375, -0.4591064453125, -0.43603515625, -0.4129638671875, -0.389892578125, -0.3668212890625, -0.34375, -0.3206787109375, -0.297607421875, -0.2745361328125, -0.25146484375, -0.2283935546875, -0.205322265625, -0.1822509765625, -0.1591796875, -0.1361083984375, -0.113037109375, -0.0899658203125, -0.06689453125, -0.0438232421875, -0.020751953125, 0.0023193359375, 0.025390625, 0.0484619140625, 0.071533203125, 0.0946044921875, 0.11767578125, 0.1407470703125, 0.163818359375, 0.1868896484375, 0.2099609375, 0.2330322265625, 0.256103515625, 0.2791748046875, 0.30224609375, 0.3253173828125, 0.348388671875, 0.3714599609375, 0.39453125, 0.4176025390625, 0.440673828125, 0.4637451171875, 0.48681640625, 0.5098876953125, 0.532958984375, 0.5560302734375, 0.5791015625, 0.6021728515625, 0.625244140625, 0.6483154296875, 0.67138671875, 0.6944580078125, 0.717529296875, 0.7406005859375, 0.763671875, 0.7867431640625, 0.809814453125, 0.8328857421875, 0.85595703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 10.0, 15.0, 19.0, 41.0, 54.0, 85.0, 122.0, 144.0, 162.0, 110.0, 90.0, 56.0, 37.0, 22.0, 17.0, 3.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.434334754943848, -11.99261474609375, -11.550895690917969, -11.109176635742188, -10.66745662689209, -10.225736618041992, -9.784017562866211, -9.34229850769043, -8.900578498840332, -8.458858489990234, -8.017139434814453, -7.575419902801514, -7.133700370788574, -6.691980838775635, -6.250261306762695, -5.808541774749756, -5.366822242736816, -4.925102710723877, -4.4833831787109375, -4.041663646697998, -3.5999441146850586, -3.158224582672119, -2.7165050506591797, -2.2747855186462402, -1.8330659866333008, -1.3913464546203613, -0.9496269226074219, -0.5079073905944824, -0.06618785858154297, 0.3755316734313965, 0.8172512054443359, 1.2589707374572754, 1.7006902694702148, 2.1424098014831543, 2.5841293334960938, 3.025848865509033, 3.4675683975219727, 3.909287929534912, 4.351007461547852, 4.792726993560791, 5.2344465255737305, 5.67616605758667, 6.117885589599609, 6.559605121612549, 7.001324653625488, 7.443044185638428, 7.884763717651367, 8.326482772827148, 8.768202781677246, 9.209922790527344, 9.651641845703125, 10.093360900878906, 10.535080909729004, 10.976800918579102, 11.418519973754883, 11.860239028930664, 12.301959037780762, 12.74367904663086, 13.18539810180664, 13.627117156982422, 14.06883716583252, 14.510557174682617, 14.952276229858398, 15.39399528503418, 15.835715293884277]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 5.0, 12.0, 12.0, 15.0, 22.0, 23.0, 20.0, 29.0, 22.0, 45.0, 33.0, 37.0, 29.0, 42.0, 43.0, 40.0, 52.0, 45.0, 41.0, 43.0, 41.0, 38.0, 38.0, 41.0, 46.0, 29.0, 25.0, 21.0, 20.0, 17.0, 12.0, 6.0, 12.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.042895317077637, -8.720531463623047, -8.39816665649414, -8.07580280303955, -7.753438949584961, -7.431075096130371, -7.108710765838623, -6.786346435546875, -6.463982582092285, -6.141618728637695, -5.819254398345947, -5.496890068054199, -5.174526214599609, -4.8521623611450195, -4.5297980308532715, -4.207433700561523, -3.8850698471069336, -3.5627057552337646, -3.2403416633605957, -2.9179775714874268, -2.595613479614258, -2.273249387741089, -1.95088529586792, -1.628521203994751, -1.306157112121582, -0.9837930202484131, -0.6614289283752441, -0.3390648365020752, -0.01670074462890625, 0.3056633472442627, 0.6280274391174316, 0.9503915309906006, 1.2727546691894531, 1.595118761062622, 1.917482852935791, 2.23984694480896, 2.562211036682129, 2.884575128555298, 3.206939220428467, 3.5293033123016357, 3.8516674041748047, 4.1740312576293945, 4.496395587921143, 4.818759918212891, 5.1411237716674805, 5.46348762512207, 5.785851955413818, 6.108216285705566, 6.430580139160156, 6.752943992614746, 7.075308322906494, 7.397672653198242, 7.720036506652832, 8.042400360107422, 8.364765167236328, 8.687129020690918, 9.009492874145508, 9.331856727600098, 9.654220581054688, 9.976585388183594, 10.298949241638184, 10.621313095092773, 10.94367790222168, 11.26604175567627, 11.58840560913086]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 8.0, 6.0, 17.0, 17.0, 31.0, 37.0, 71.0, 175.0, 337.0, 878.0, 3093.0, 17224.0, 4044540.0, 117622.0, 7309.0, 1647.0, 637.0, 251.0, 127.0, 72.0, 49.0, 34.0, 28.0, 17.0, 6.0, 10.0, 10.0, 4.0, 6.0, 9.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.80078125, -5.58428955078125, -5.3677978515625, -5.15130615234375, -4.934814453125, -4.71832275390625, -4.5018310546875, -4.28533935546875, -4.06884765625, -3.85235595703125, -3.6358642578125, -3.41937255859375, -3.202880859375, -2.98638916015625, -2.7698974609375, -2.55340576171875, -2.3369140625, -2.12042236328125, -1.9039306640625, -1.68743896484375, -1.470947265625, -1.25445556640625, -1.0379638671875, -0.82147216796875, -0.60498046875, -0.38848876953125, -0.1719970703125, 0.04449462890625, 0.260986328125, 0.47747802734375, 0.6939697265625, 0.91046142578125, 1.126953125, 1.34344482421875, 1.5599365234375, 1.77642822265625, 1.992919921875, 2.20941162109375, 2.4259033203125, 2.64239501953125, 2.85888671875, 3.07537841796875, 3.2918701171875, 3.50836181640625, 3.724853515625, 3.94134521484375, 4.1578369140625, 4.37432861328125, 4.5908203125, 4.80731201171875, 5.0238037109375, 5.24029541015625, 5.456787109375, 5.67327880859375, 5.8897705078125, 6.10626220703125, 6.32275390625, 6.53924560546875, 6.7557373046875, 6.97222900390625, 7.188720703125, 7.40521240234375, 7.6217041015625, 7.83819580078125, 8.0546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 14.0, 11.0, 18.0, 31.0, 31.0, 44.0, 53.0, 61.0, 76.0, 80.0, 78.0, 93.0, 69.0, 68.0, 59.0, 48.0, 40.0, 26.0, 30.0, 23.0, 11.0, 9.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5859375, -0.5650405883789062, -0.5441436767578125, -0.5232467651367188, -0.502349853515625, -0.48145294189453125, -0.4605560302734375, -0.43965911865234375, -0.41876220703125, -0.39786529541015625, -0.3769683837890625, -0.35607147216796875, -0.335174560546875, -0.31427764892578125, -0.2933807373046875, -0.27248382568359375, -0.2515869140625, -0.23069000244140625, -0.2097930908203125, -0.18889617919921875, -0.167999267578125, -0.14710235595703125, -0.1262054443359375, -0.10530853271484375, -0.08441162109375, -0.06351470947265625, -0.0426177978515625, -0.02172088623046875, -0.000823974609375, 0.02007293701171875, 0.0409698486328125, 0.06186676025390625, 0.082763671875, 0.10366058349609375, 0.1245574951171875, 0.14545440673828125, 0.166351318359375, 0.18724822998046875, 0.2081451416015625, 0.22904205322265625, 0.24993896484375, 0.27083587646484375, 0.2917327880859375, 0.31262969970703125, 0.333526611328125, 0.35442352294921875, 0.3753204345703125, 0.39621734619140625, 0.4171142578125, 0.43801116943359375, 0.4589080810546875, 0.47980499267578125, 0.500701904296875, 0.5215988159179688, 0.5424957275390625, 0.5633926391601562, 0.58428955078125, 0.6051864624023438, 0.6260833740234375, 0.6469802856445312, 0.667877197265625, 0.6887741088867188, 0.7096710205078125, 0.7305679321289062, 0.75146484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 10.0, 19.0, 21.0, 38.0, 28.0, 40.0, 70.0, 119.0, 153.0, 239.0, 339.0, 459.0, 703.0, 1088.0, 1714.0, 2668.0, 4590.0, 8258.0, 18154.0, 56948.0, 747190.0, 3211666.0, 91532.0, 23903.0, 10133.0, 5340.0, 3169.0, 1906.0, 1257.0, 809.0, 562.0, 342.0, 231.0, 178.0, 107.0, 78.0, 60.0, 44.0, 31.0, 27.0, 8.0, 11.0, 9.0, 9.0, 9.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.869140625, -1.812744140625, -1.75634765625, -1.699951171875, -1.6435546875, -1.587158203125, -1.53076171875, -1.474365234375, -1.41796875, -1.361572265625, -1.30517578125, -1.248779296875, -1.1923828125, -1.135986328125, -1.07958984375, -1.023193359375, -0.966796875, -0.910400390625, -0.85400390625, -0.797607421875, -0.7412109375, -0.684814453125, -0.62841796875, -0.572021484375, -0.515625, -0.459228515625, -0.40283203125, -0.346435546875, -0.2900390625, -0.233642578125, -0.17724609375, -0.120849609375, -0.064453125, -0.008056640625, 0.04833984375, 0.104736328125, 0.1611328125, 0.217529296875, 0.27392578125, 0.330322265625, 0.38671875, 0.443115234375, 0.49951171875, 0.555908203125, 0.6123046875, 0.668701171875, 0.72509765625, 0.781494140625, 0.837890625, 0.894287109375, 0.95068359375, 1.007080078125, 1.0634765625, 1.119873046875, 1.17626953125, 1.232666015625, 1.2890625, 1.345458984375, 1.40185546875, 1.458251953125, 1.5146484375, 1.571044921875, 1.62744140625, 1.683837890625, 1.740234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 11.0, 9.0, 23.0, 21.0, 29.0, 48.0, 86.0, 190.0, 793.0, 2099.0, 396.0, 137.0, 71.0, 50.0, 19.0, 20.0, 14.0, 6.0, 7.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83935546875, -0.8116455078125, -0.783935546875, -0.7562255859375, -0.728515625, -0.7008056640625, -0.673095703125, -0.6453857421875, -0.61767578125, -0.5899658203125, -0.562255859375, -0.5345458984375, -0.5068359375, -0.4791259765625, -0.451416015625, -0.4237060546875, -0.39599609375, -0.3682861328125, -0.340576171875, -0.3128662109375, -0.28515625, -0.2574462890625, -0.229736328125, -0.2020263671875, -0.17431640625, -0.1466064453125, -0.118896484375, -0.0911865234375, -0.0634765625, -0.0357666015625, -0.008056640625, 0.0196533203125, 0.04736328125, 0.0750732421875, 0.102783203125, 0.1304931640625, 0.158203125, 0.1859130859375, 0.213623046875, 0.2413330078125, 0.26904296875, 0.2967529296875, 0.324462890625, 0.3521728515625, 0.3798828125, 0.4075927734375, 0.435302734375, 0.4630126953125, 0.49072265625, 0.5184326171875, 0.546142578125, 0.5738525390625, 0.6015625, 0.6292724609375, 0.656982421875, 0.6846923828125, 0.71240234375, 0.7401123046875, 0.767822265625, 0.7955322265625, 0.8232421875, 0.8509521484375, 0.878662109375, 0.9063720703125, 0.93408203125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 16.0, 29.0, 61.0, 96.0, 162.0, 229.0, 173.0, 97.0, 52.0, 34.0, 17.0, 9.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.101396560668945, -6.9070281982421875, -6.71265983581543, -6.518291473388672, -6.323923110961914, -6.129554748535156, -5.935186386108398, -5.740818023681641, -5.546449661254883, -5.352081298828125, -5.157712936401367, -4.963344573974609, -4.768976211547852, -4.574607849121094, -4.380239486694336, -4.185871124267578, -3.9915032386779785, -3.7971348762512207, -3.602766513824463, -3.408398151397705, -3.2140297889709473, -3.0196614265441895, -2.8252933025360107, -2.630924940109253, -2.436556577682495, -2.2421882152557373, -2.0478198528289795, -1.8534516096115112, -1.6590832471847534, -1.4647148847579956, -1.2703466415405273, -1.0759782791137695, -0.8816094398498535, -0.6872410774230957, -0.49287277460098267, -0.29850447177886963, -0.10413610935211182, 0.090232253074646, 0.28460049629211426, 0.47896885871887207, 0.6733372211456299, 0.8677055835723877, 1.0620739459991455, 1.2564421892166138, 1.4508105516433716, 1.6451789140701294, 1.8395471572875977, 2.0339155197143555, 2.2282838821411133, 2.422652244567871, 2.617020606994629, 2.8113889694213867, 3.0057573318481445, 3.2001256942749023, 3.394493818283081, 3.588862180709839, 3.7832305431365967, 3.9775989055633545, 4.171967029571533, 4.366335391998291, 4.560703754425049, 4.755072116851807, 4.9494404792785645, 5.143808841705322, 5.33817720413208]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 14.0, 12.0, 16.0, 17.0, 12.0, 26.0, 25.0, 49.0, 48.0, 35.0, 39.0, 38.0, 54.0, 45.0, 48.0, 48.0, 58.0, 46.0, 40.0, 49.0, 39.0, 32.0, 28.0, 25.0, 21.0, 27.0, 10.0, 19.0, 19.0, 10.0, 11.0, 5.0, 8.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.712989568710327, -2.6325080394744873, -2.5520265102386475, -2.4715449810028076, -2.3910634517669678, -2.310581922531128, -2.230100393295288, -2.1496191024780273, -2.0691375732421875, -1.9886560440063477, -1.9081745147705078, -1.827692985534668, -1.7472114562988281, -1.6667299270629883, -1.586248517036438, -1.5057669878005981, -1.4252853393554688, -1.344803810119629, -1.264322280883789, -1.1838407516479492, -1.1033592224121094, -1.0228776931762695, -0.9423962831497192, -0.8619147539138794, -0.7814332246780396, -0.7009516954421997, -0.6204701662063599, -0.5399886965751648, -0.45950716733932495, -0.3790256381034851, -0.29854413866996765, -0.2180626392364502, -0.13758111000061035, -0.0570995956659317, 0.023381918668746948, 0.1038634330034256, 0.18434494733810425, 0.2648264765739441, 0.34530797600746155, 0.425789475440979, 0.5062710046768188, 0.5867525339126587, 0.6672340631484985, 0.7477155327796936, 0.8281970620155334, 0.9086785912513733, 0.9891600608825684, 1.0696415901184082, 1.150123119354248, 1.230604648590088, 1.3110861778259277, 1.3915677070617676, 1.4720492362976074, 1.5525307655334473, 1.6330121755599976, 1.7134937047958374, 1.7939752340316772, 1.874456763267517, 1.954938292503357, 2.0354197025299072, 2.115901231765747, 2.196382761001587, 2.2768642902374268, 2.3573458194732666, 2.4378273487091064]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 10.0, 7.0, 17.0, 27.0, 34.0, 51.0, 72.0, 98.0, 192.0, 344.0, 728.0, 1760.0, 6009.0, 32568.0, 306381.0, 618637.0, 66663.0, 10328.0, 2563.0, 930.0, 454.0, 234.0, 133.0, 97.0, 65.0, 38.0, 28.0, 17.0, 10.0, 10.0, 11.0, 8.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.994140625, -3.861785888671875, -3.72943115234375, -3.597076416015625, -3.4647216796875, -3.332366943359375, -3.20001220703125, -3.067657470703125, -2.935302734375, -2.802947998046875, -2.67059326171875, -2.538238525390625, -2.4058837890625, -2.273529052734375, -2.14117431640625, -2.008819580078125, -1.87646484375, -1.744110107421875, -1.61175537109375, -1.479400634765625, -1.3470458984375, -1.214691162109375, -1.08233642578125, -0.949981689453125, -0.817626953125, -0.685272216796875, -0.55291748046875, -0.420562744140625, -0.2882080078125, -0.155853271484375, -0.02349853515625, 0.108856201171875, 0.2412109375, 0.373565673828125, 0.50592041015625, 0.638275146484375, 0.7706298828125, 0.902984619140625, 1.03533935546875, 1.167694091796875, 1.300048828125, 1.432403564453125, 1.56475830078125, 1.697113037109375, 1.8294677734375, 1.961822509765625, 2.09417724609375, 2.226531982421875, 2.35888671875, 2.491241455078125, 2.62359619140625, 2.755950927734375, 2.8883056640625, 3.020660400390625, 3.15301513671875, 3.285369873046875, 3.417724609375, 3.550079345703125, 3.68243408203125, 3.814788818359375, 3.9471435546875, 4.079498291015625, 4.21185302734375, 4.344207763671875, 4.4765625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 11.0, 17.0, 24.0, 29.0, 49.0, 49.0, 56.0, 77.0, 75.0, 81.0, 68.0, 77.0, 79.0, 58.0, 53.0, 37.0, 39.0, 26.0, 28.0, 22.0, 6.0, 5.0, 6.0, 7.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59912109375, -0.578704833984375, -0.55828857421875, -0.537872314453125, -0.5174560546875, -0.497039794921875, -0.47662353515625, -0.456207275390625, -0.435791015625, -0.415374755859375, -0.39495849609375, -0.374542236328125, -0.3541259765625, -0.333709716796875, -0.31329345703125, -0.292877197265625, -0.2724609375, -0.252044677734375, -0.23162841796875, -0.211212158203125, -0.1907958984375, -0.170379638671875, -0.14996337890625, -0.129547119140625, -0.109130859375, -0.088714599609375, -0.06829833984375, -0.047882080078125, -0.0274658203125, -0.007049560546875, 0.01336669921875, 0.033782958984375, 0.05419921875, 0.074615478515625, 0.09503173828125, 0.115447998046875, 0.1358642578125, 0.156280517578125, 0.17669677734375, 0.197113037109375, 0.217529296875, 0.237945556640625, 0.25836181640625, 0.278778076171875, 0.2991943359375, 0.319610595703125, 0.34002685546875, 0.360443115234375, 0.380859375, 0.401275634765625, 0.42169189453125, 0.442108154296875, 0.4625244140625, 0.482940673828125, 0.50335693359375, 0.523773193359375, 0.544189453125, 0.564605712890625, 0.58502197265625, 0.605438232421875, 0.6258544921875, 0.646270751953125, 0.66668701171875, 0.687103271484375, 0.70751953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 2.0, 10.0, 7.0, 13.0, 17.0, 19.0, 36.0, 52.0, 58.0, 100.0, 142.0, 199.0, 314.0, 534.0, 882.0, 1659.0, 3209.0, 7097.0, 16754.0, 46753.0, 149301.0, 404085.0, 279506.0, 87350.0, 28815.0, 11257.0, 4741.0, 2328.0, 1293.0, 679.0, 429.0, 300.0, 168.0, 143.0, 97.0, 53.0, 40.0, 36.0, 19.0, 12.0, 11.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.47015380859375, -1.4207763671875, -1.37139892578125, -1.322021484375, -1.27264404296875, -1.2232666015625, -1.17388916015625, -1.12451171875, -1.07513427734375, -1.0257568359375, -0.97637939453125, -0.927001953125, -0.87762451171875, -0.8282470703125, -0.77886962890625, -0.7294921875, -0.68011474609375, -0.6307373046875, -0.58135986328125, -0.531982421875, -0.48260498046875, -0.4332275390625, -0.38385009765625, -0.33447265625, -0.28509521484375, -0.2357177734375, -0.18634033203125, -0.136962890625, -0.08758544921875, -0.0382080078125, 0.01116943359375, 0.060546875, 0.10992431640625, 0.1593017578125, 0.20867919921875, 0.258056640625, 0.30743408203125, 0.3568115234375, 0.40618896484375, 0.45556640625, 0.50494384765625, 0.5543212890625, 0.60369873046875, 0.653076171875, 0.70245361328125, 0.7518310546875, 0.80120849609375, 0.8505859375, 0.89996337890625, 0.9493408203125, 0.99871826171875, 1.048095703125, 1.09747314453125, 1.1468505859375, 1.19622802734375, 1.24560546875, 1.29498291015625, 1.3443603515625, 1.39373779296875, 1.443115234375, 1.49249267578125, 1.5418701171875, 1.59124755859375, 1.640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 6.0, 8.0, 16.0, 6.0, 10.0, 22.0, 17.0, 22.0, 20.0, 23.0, 21.0, 30.0, 20.0, 40.0, 35.0, 42.0, 49.0, 32.0, 42.0, 45.0, 30.0, 35.0, 34.0, 42.0, 38.0, 35.0, 27.0, 24.0, 38.0, 21.0, 24.0, 26.0, 17.0, 16.0, 17.0, 11.0, 8.0, 4.0, 5.0, 6.0, 6.0, 7.0, 2.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.5322265625, -1.4854736328125, -1.438720703125, -1.3919677734375, -1.34521484375, -1.2984619140625, -1.251708984375, -1.2049560546875, -1.158203125, -1.1114501953125, -1.064697265625, -1.0179443359375, -0.97119140625, -0.9244384765625, -0.877685546875, -0.8309326171875, -0.7841796875, -0.7374267578125, -0.690673828125, -0.6439208984375, -0.59716796875, -0.5504150390625, -0.503662109375, -0.4569091796875, -0.41015625, -0.3634033203125, -0.316650390625, -0.2698974609375, -0.22314453125, -0.1763916015625, -0.129638671875, -0.0828857421875, -0.0361328125, 0.0106201171875, 0.057373046875, 0.1041259765625, 0.15087890625, 0.1976318359375, 0.244384765625, 0.2911376953125, 0.337890625, 0.3846435546875, 0.431396484375, 0.4781494140625, 0.52490234375, 0.5716552734375, 0.618408203125, 0.6651611328125, 0.7119140625, 0.7586669921875, 0.805419921875, 0.8521728515625, 0.89892578125, 0.9456787109375, 0.992431640625, 1.0391845703125, 1.0859375, 1.1326904296875, 1.179443359375, 1.2261962890625, 1.27294921875, 1.3197021484375, 1.366455078125, 1.4132080078125, 1.4599609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 5.0, 16.0, 23.0, 36.0, 42.0, 68.0, 140.0, 181.0, 320.0, 579.0, 1040.0, 2187.0, 4827.0, 11788.0, 34010.0, 131614.0, 534963.0, 243170.0, 53888.0, 16961.0, 6607.0, 2862.0, 1438.0, 766.0, 397.0, 222.0, 138.0, 87.0, 53.0, 36.0, 26.0, 22.0, 7.0, 7.0, 6.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1103515625, -1.0816497802734375, -1.052947998046875, -1.0242462158203125, -0.99554443359375, -0.9668426513671875, -0.938140869140625, -0.9094390869140625, -0.8807373046875, -0.8520355224609375, -0.823333740234375, -0.7946319580078125, -0.76593017578125, -0.7372283935546875, -0.708526611328125, -0.6798248291015625, -0.651123046875, -0.6224212646484375, -0.593719482421875, -0.5650177001953125, -0.53631591796875, -0.5076141357421875, -0.478912353515625, -0.4502105712890625, -0.4215087890625, -0.3928070068359375, -0.364105224609375, -0.3354034423828125, -0.30670166015625, -0.2779998779296875, -0.249298095703125, -0.2205963134765625, -0.19189453125, -0.1631927490234375, -0.134490966796875, -0.1057891845703125, -0.07708740234375, -0.0483856201171875, -0.019683837890625, 0.0090179443359375, 0.0377197265625, 0.0664215087890625, 0.095123291015625, 0.1238250732421875, 0.15252685546875, 0.1812286376953125, 0.209930419921875, 0.2386322021484375, 0.267333984375, 0.2960357666015625, 0.324737548828125, 0.3534393310546875, 0.38214111328125, 0.4108428955078125, 0.439544677734375, 0.4682464599609375, 0.4969482421875, 0.5256500244140625, 0.554351806640625, 0.5830535888671875, 0.61175537109375, 0.6404571533203125, 0.669158935546875, 0.6978607177734375, 0.7265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 9.0, 13.0, 15.0, 16.0, 29.0, 26.0, 34.0, 42.0, 54.0, 87.0, 99.0, 124.0, 118.0, 80.0, 53.0, 42.0, 45.0, 20.0, 13.0, 11.0, 12.0, 11.0, 4.0, 4.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022172927856445312, -0.00021423399448394775, -0.00020673871040344238, -0.000199243426322937, -0.00019174814224243164, -0.00018425285816192627, -0.0001767575740814209, -0.00016926229000091553, -0.00016176700592041016, -0.00015427172183990479, -0.00014677643775939941, -0.00013928115367889404, -0.00013178586959838867, -0.0001242905855178833, -0.00011679530143737793, -0.00010930001735687256, -0.00010180473327636719, -9.430944919586182e-05, -8.681416511535645e-05, -7.931888103485107e-05, -7.18235969543457e-05, -6.432831287384033e-05, -5.683302879333496e-05, -4.933774471282959e-05, -4.184246063232422e-05, -3.434717655181885e-05, -2.6851892471313477e-05, -1.9356608390808105e-05, -1.1861324310302734e-05, -4.366040229797363e-06, 3.129243850708008e-06, 1.0624527931213379e-05, 1.811981201171875e-05, 2.561509609222412e-05, 3.311038017272949e-05, 4.060566425323486e-05, 4.8100948333740234e-05, 5.5596232414245605e-05, 6.309151649475098e-05, 7.058680057525635e-05, 7.808208465576172e-05, 8.557736873626709e-05, 9.307265281677246e-05, 0.00010056793689727783, 0.0001080632209777832, 0.00011555850505828857, 0.00012305378913879395, 0.00013054907321929932, 0.0001380443572998047, 0.00014553964138031006, 0.00015303492546081543, 0.0001605302095413208, 0.00016802549362182617, 0.00017552077770233154, 0.00018301606178283691, 0.00019051134586334229, 0.00019800662994384766, 0.00020550191402435303, 0.0002129971981048584, 0.00022049248218536377, 0.00022798776626586914, 0.0002354830503463745, 0.00024297833442687988, 0.00025047361850738525, 0.0002579689025878906]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 12.0, 12.0, 22.0, 47.0, 48.0, 70.0, 117.0, 197.0, 313.0, 513.0, 982.0, 2015.0, 4102.0, 10112.0, 29382.0, 115951.0, 593598.0, 219972.0, 45421.0, 14473.0, 5681.0, 2682.0, 1250.0, 606.0, 366.0, 211.0, 123.0, 86.0, 50.0, 41.0, 22.0, 24.0, 13.0, 11.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.986328125, -0.953094482421875, -0.91986083984375, -0.886627197265625, -0.8533935546875, -0.820159912109375, -0.78692626953125, -0.753692626953125, -0.720458984375, -0.687225341796875, -0.65399169921875, -0.620758056640625, -0.5875244140625, -0.554290771484375, -0.52105712890625, -0.487823486328125, -0.45458984375, -0.421356201171875, -0.38812255859375, -0.354888916015625, -0.3216552734375, -0.288421630859375, -0.25518798828125, -0.221954345703125, -0.188720703125, -0.155487060546875, -0.12225341796875, -0.089019775390625, -0.0557861328125, -0.022552490234375, 0.01068115234375, 0.043914794921875, 0.0771484375, 0.110382080078125, 0.14361572265625, 0.176849365234375, 0.2100830078125, 0.243316650390625, 0.27655029296875, 0.309783935546875, 0.343017578125, 0.376251220703125, 0.40948486328125, 0.442718505859375, 0.4759521484375, 0.509185791015625, 0.54241943359375, 0.575653076171875, 0.60888671875, 0.642120361328125, 0.67535400390625, 0.708587646484375, 0.7418212890625, 0.775054931640625, 0.80828857421875, 0.841522216796875, 0.874755859375, 0.907989501953125, 0.94122314453125, 0.974456787109375, 1.0076904296875, 1.040924072265625, 1.07415771484375, 1.107391357421875, 1.140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 7.0, 7.0, 6.0, 8.0, 6.0, 13.0, 15.0, 24.0, 26.0, 17.0, 22.0, 48.0, 58.0, 63.0, 106.0, 90.0, 93.0, 68.0, 58.0, 49.0, 43.0, 23.0, 31.0, 21.0, 15.0, 15.0, 14.0, 9.0, 4.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.65869140625, -0.6386260986328125, -0.618560791015625, -0.5984954833984375, -0.57843017578125, -0.5583648681640625, -0.538299560546875, -0.5182342529296875, -0.4981689453125, -0.4781036376953125, -0.458038330078125, -0.4379730224609375, -0.41790771484375, -0.3978424072265625, -0.377777099609375, -0.3577117919921875, -0.337646484375, -0.3175811767578125, -0.297515869140625, -0.2774505615234375, -0.25738525390625, -0.2373199462890625, -0.217254638671875, -0.1971893310546875, -0.1771240234375, -0.1570587158203125, -0.136993408203125, -0.1169281005859375, -0.09686279296875, -0.0767974853515625, -0.056732177734375, -0.0366668701171875, -0.0166015625, 0.0034637451171875, 0.023529052734375, 0.0435943603515625, 0.06365966796875, 0.0837249755859375, 0.103790283203125, 0.1238555908203125, 0.1439208984375, 0.1639862060546875, 0.184051513671875, 0.2041168212890625, 0.22418212890625, 0.2442474365234375, 0.264312744140625, 0.2843780517578125, 0.304443359375, 0.3245086669921875, 0.344573974609375, 0.3646392822265625, 0.38470458984375, 0.4047698974609375, 0.424835205078125, 0.4449005126953125, 0.4649658203125, 0.4850311279296875, 0.505096435546875, 0.5251617431640625, 0.54522705078125, 0.5652923583984375, 0.585357666015625, 0.6054229736328125, 0.62548828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 4.0, 10.0, 16.0, 13.0, 46.0, 63.0, 107.0, 154.0, 163.0, 147.0, 111.0, 69.0, 40.0, 18.0, 11.0, 8.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6190242767334, -16.1527099609375, -15.686394691467285, -15.22007942199707, -14.753765106201172, -14.287449836730957, -13.821134567260742, -13.354820251464844, -12.888504981994629, -12.422189712524414, -11.955875396728516, -11.4895601272583, -11.023244857788086, -10.556930541992188, -10.090615272521973, -9.624300003051758, -9.15798568725586, -8.691670417785645, -8.225356101989746, -7.759040832519531, -7.292726039886475, -6.826411247253418, -6.360095977783203, -5.8937811851501465, -5.42746639251709, -4.961151599884033, -4.494836807250977, -4.028521537780762, -3.562206745147705, -3.0958919525146484, -2.6295769214630127, -2.163261890411377, -1.696946144104004, -1.2306312322616577, -0.7643163204193115, -0.29800140857696533, 0.16831350326538086, 0.6346282958984375, 1.1009433269500732, 1.567258358001709, 2.0335731506347656, 2.4998879432678223, 2.966202974319458, 3.4325180053710938, 3.8988327980041504, 4.365147590637207, 4.831462860107422, 5.2977776527404785, 5.764092445373535, 6.230407238006592, 6.696722030639648, 7.163037300109863, 7.62935209274292, 8.095666885375977, 8.561982154846191, 9.028297424316406, 9.494611740112305, 9.96092700958252, 10.427241325378418, 10.893556594848633, 11.359870910644531, 11.826186180114746, 12.292501449584961, 12.75881576538086, 13.225131034851074]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 3.0, 9.0, 7.0, 15.0, 17.0, 10.0, 14.0, 26.0, 27.0, 23.0, 24.0, 33.0, 56.0, 40.0, 42.0, 55.0, 52.0, 60.0, 54.0, 34.0, 55.0, 53.0, 39.0, 27.0, 40.0, 30.0, 25.0, 29.0, 20.0, 15.0, 8.0, 16.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.061080932617188, -10.719315528869629, -10.377551078796387, -10.035785675048828, -9.694021224975586, -9.352255821228027, -9.010490417480469, -8.668725967407227, -8.326960563659668, -7.985195636749268, -7.643430709838867, -7.301665306091309, -6.959900379180908, -6.618135452270508, -6.276370525360107, -5.934605598449707, -5.592840671539307, -5.251075744628906, -4.909310817718506, -4.5675458908081055, -4.225780487060547, -3.8840155601501465, -3.542250633239746, -3.2004854679107666, -2.858720541000366, -2.516955614089966, -2.1751904487609863, -1.833425521850586, -1.491660475730896, -1.149895429611206, -0.8081305027008057, -0.46636533737182617, -0.12460041046142578, 0.21716460585594177, 0.5589296221733093, 0.9006946086883545, 1.2424596548080444, 1.5842247009277344, 1.9259896278381348, 2.2677547931671143, 2.6095197200775146, 2.951284646987915, 3.2930498123168945, 3.634814739227295, 3.9765796661376953, 4.318345069885254, 4.660109519958496, 5.001874923706055, 5.343639850616455, 5.6854047775268555, 6.027169704437256, 6.368934631347656, 6.710700035095215, 7.052464962005615, 7.394229888916016, 7.735995292663574, 8.077759742736816, 8.419525146484375, 8.761289596557617, 9.103055000305176, 9.444819450378418, 9.786584854125977, 10.128349304199219, 10.470114707946777, 10.811880111694336]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 10.0, 15.0, 25.0, 55.0, 84.0, 137.0, 286.0, 772.0, 2257.0, 9612.0, 118273.0, 4035319.0, 21613.0, 3770.0, 1042.0, 360.0, 202.0, 119.0, 71.0, 43.0, 37.0, 32.0, 22.0, 19.0, 20.0, 9.0, 12.0, 6.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.3511962890625, -4.155517578125, -3.9598388671875, -3.76416015625, -3.5684814453125, -3.372802734375, -3.1771240234375, -2.9814453125, -2.7857666015625, -2.590087890625, -2.3944091796875, -2.19873046875, -2.0030517578125, -1.807373046875, -1.6116943359375, -1.416015625, -1.2203369140625, -1.024658203125, -0.8289794921875, -0.63330078125, -0.4376220703125, -0.241943359375, -0.0462646484375, 0.1494140625, 0.3450927734375, 0.540771484375, 0.7364501953125, 0.93212890625, 1.1278076171875, 1.323486328125, 1.5191650390625, 1.71484375, 1.9105224609375, 2.106201171875, 2.3018798828125, 2.49755859375, 2.6932373046875, 2.888916015625, 3.0845947265625, 3.2802734375, 3.4759521484375, 3.671630859375, 3.8673095703125, 4.06298828125, 4.2586669921875, 4.454345703125, 4.6500244140625, 4.845703125, 5.0413818359375, 5.237060546875, 5.4327392578125, 5.62841796875, 5.8240966796875, 6.019775390625, 6.2154541015625, 6.4111328125, 6.6068115234375, 6.802490234375, 6.9981689453125, 7.19384765625, 7.3895263671875, 7.585205078125, 7.7808837890625, 7.9765625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 10.0, 8.0, 8.0, 19.0, 22.0, 29.0, 50.0, 54.0, 60.0, 69.0, 79.0, 69.0, 70.0, 88.0, 69.0, 62.0, 44.0, 53.0, 39.0, 29.0, 22.0, 21.0, 9.0, 6.0, 2.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6006011962890625, -0.578643798828125, -0.5566864013671875, -0.53472900390625, -0.5127716064453125, -0.490814208984375, -0.4688568115234375, -0.4468994140625, -0.4249420166015625, -0.402984619140625, -0.3810272216796875, -0.35906982421875, -0.3371124267578125, -0.315155029296875, -0.2931976318359375, -0.271240234375, -0.2492828369140625, -0.227325439453125, -0.2053680419921875, -0.18341064453125, -0.1614532470703125, -0.139495849609375, -0.1175384521484375, -0.0955810546875, -0.0736236572265625, -0.051666259765625, -0.0297088623046875, -0.00775146484375, 0.0142059326171875, 0.036163330078125, 0.0581207275390625, 0.080078125, 0.1020355224609375, 0.123992919921875, 0.1459503173828125, 0.16790771484375, 0.1898651123046875, 0.211822509765625, 0.2337799072265625, 0.2557373046875, 0.2776947021484375, 0.299652099609375, 0.3216094970703125, 0.34356689453125, 0.3655242919921875, 0.387481689453125, 0.4094390869140625, 0.431396484375, 0.4533538818359375, 0.475311279296875, 0.4972686767578125, 0.51922607421875, 0.5411834716796875, 0.563140869140625, 0.5850982666015625, 0.6070556640625, 0.6290130615234375, 0.650970458984375, 0.6729278564453125, 0.69488525390625, 0.7168426513671875, 0.738800048828125, 0.7607574462890625, 0.78271484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 7.0, 5.0, 8.0, 4.0, 7.0, 15.0, 22.0, 20.0, 22.0, 37.0, 72.0, 112.0, 227.0, 430.0, 960.0, 2078.0, 5453.0, 15755.0, 76344.0, 3920298.0, 140170.0, 20696.0, 6615.0, 2576.0, 1175.0, 540.0, 247.0, 115.0, 86.0, 45.0, 32.0, 26.0, 24.0, 17.0, 7.0, 10.0, 7.0, 5.0, 6.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.45135498046875, -3.3421630859375, -3.23297119140625, -3.123779296875, -3.01458740234375, -2.9053955078125, -2.79620361328125, -2.68701171875, -2.57781982421875, -2.4686279296875, -2.35943603515625, -2.250244140625, -2.14105224609375, -2.0318603515625, -1.92266845703125, -1.8134765625, -1.70428466796875, -1.5950927734375, -1.48590087890625, -1.376708984375, -1.26751708984375, -1.1583251953125, -1.04913330078125, -0.93994140625, -0.83074951171875, -0.7215576171875, -0.61236572265625, -0.503173828125, -0.39398193359375, -0.2847900390625, -0.17559814453125, -0.06640625, 0.04278564453125, 0.1519775390625, 0.26116943359375, 0.370361328125, 0.47955322265625, 0.5887451171875, 0.69793701171875, 0.80712890625, 0.91632080078125, 1.0255126953125, 1.13470458984375, 1.243896484375, 1.35308837890625, 1.4622802734375, 1.57147216796875, 1.6806640625, 1.78985595703125, 1.8990478515625, 2.00823974609375, 2.117431640625, 2.22662353515625, 2.3358154296875, 2.44500732421875, 2.55419921875, 2.66339111328125, 2.7725830078125, 2.88177490234375, 2.990966796875, 3.10015869140625, 3.2093505859375, 3.31854248046875, 3.427734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 5.0, 4.0, 18.0, 21.0, 25.0, 43.0, 89.0, 215.0, 1712.0, 1517.0, 219.0, 68.0, 37.0, 25.0, 16.0, 25.0, 10.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.175445556640625, -1.13018798828125, -1.084930419921875, -1.0396728515625, -0.994415283203125, -0.94915771484375, -0.903900146484375, -0.858642578125, -0.813385009765625, -0.76812744140625, -0.722869873046875, -0.6776123046875, -0.632354736328125, -0.58709716796875, -0.541839599609375, -0.49658203125, -0.451324462890625, -0.40606689453125, -0.360809326171875, -0.3155517578125, -0.270294189453125, -0.22503662109375, -0.179779052734375, -0.134521484375, -0.089263916015625, -0.04400634765625, 0.001251220703125, 0.0465087890625, 0.091766357421875, 0.13702392578125, 0.182281494140625, 0.2275390625, 0.272796630859375, 0.31805419921875, 0.363311767578125, 0.4085693359375, 0.453826904296875, 0.49908447265625, 0.544342041015625, 0.589599609375, 0.634857177734375, 0.68011474609375, 0.725372314453125, 0.7706298828125, 0.815887451171875, 0.86114501953125, 0.906402587890625, 0.95166015625, 0.996917724609375, 1.04217529296875, 1.087432861328125, 1.1326904296875, 1.177947998046875, 1.22320556640625, 1.268463134765625, 1.313720703125, 1.358978271484375, 1.40423583984375, 1.449493408203125, 1.4947509765625, 1.540008544921875, 1.58526611328125, 1.630523681640625, 1.67578125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 15.0, 16.0, 40.0, 54.0, 109.0, 216.0, 185.0, 165.0, 77.0, 36.0, 41.0, 18.0, 9.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52201509475708, -6.263278961181641, -6.004543304443359, -5.74580717086792, -5.487071514129639, -5.228335380554199, -4.969599723815918, -4.7108635902404785, -4.452127456665039, -4.1933913230896, -3.9346556663513184, -3.675919532775879, -3.4171838760375977, -3.158447742462158, -2.899711847305298, -2.6409759521484375, -2.3822402954101562, -2.123504400253296, -1.8647685050964355, -1.6060324907302856, -1.3472965955734253, -1.088560700416565, -0.829824686050415, -0.5710887908935547, -0.31235289573669434, -0.0536169707775116, 0.20511895418167114, 0.46385490894317627, 0.7225908041000366, 0.981326699256897, 1.2400627136230469, 1.4987986087799072, 1.7575349807739258, 2.016270875930786, 2.2750067710876465, 2.533742904663086, 2.792478561401367, 3.0512146949768066, 3.309950590133667, 3.5686864852905273, 3.8274223804473877, 4.086158275604248, 4.3448944091796875, 4.603630065917969, 4.862366199493408, 5.1211018562316895, 5.379837989807129, 5.63857364654541, 5.89730978012085, 6.156045913696289, 6.41478157043457, 6.67351770401001, 6.932253360748291, 7.1909894943237305, 7.449725151062012, 7.708461284637451, 7.967197418212891, 8.225933074951172, 8.48466968536377, 8.74340534210205, 9.002140998840332, 9.260876655578613, 9.519613265991211, 9.778348922729492, 10.037084579467773]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 24.0, 23.0, 29.0, 42.0, 46.0, 46.0, 40.0, 67.0, 67.0, 61.0, 52.0, 58.0, 63.0, 52.0, 61.0, 49.0, 44.0, 37.0, 27.0, 28.0, 18.0, 15.0, 13.0, 10.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.184516906738281, -5.043605327606201, -4.902693748474121, -4.761782169342041, -4.620870590209961, -4.479959487915039, -4.339047431945801, -4.198136329650879, -4.057224750518799, -3.9163131713867188, -3.7754015922546387, -3.6344900131225586, -3.4935786724090576, -3.3526670932769775, -3.2117555141448975, -3.0708439350128174, -2.9299323558807373, -2.7890207767486572, -2.648109197616577, -2.507197856903076, -2.366286277770996, -2.225374698638916, -2.084463119506836, -1.9435515403747559, -1.8026400804519653, -1.6617285013198853, -1.5208170413970947, -1.3799054622650146, -1.2389938831329346, -1.098082423210144, -0.957170844078064, -0.8162593245506287, -0.6753480434417725, -0.5344365239143372, -0.39352497458457947, -0.2526134252548218, -0.11170190572738647, 0.029209613800048828, 0.1701211929321289, 0.3110327124595642, 0.4519442319869995, 0.5928557515144348, 0.7337672710418701, 0.8746788501739502, 1.0155904293060303, 1.1565018892288208, 1.2974134683609009, 1.4383249282836914, 1.5792365074157715, 1.7201480865478516, 1.861059546470642, 2.0019712448120117, 2.1428825855255127, 2.2837941646575928, 2.424705743789673, 2.565617322921753, 2.706528663635254, 2.847440242767334, 2.988351821899414, 3.129263401031494, 3.270174741744995, 3.411086320877075, 3.5519979000091553, 3.6929094791412354, 3.8338210582733154]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 7.0, 15.0, 23.0, 32.0, 51.0, 53.0, 108.0, 232.0, 499.0, 1322.0, 4715.0, 32129.0, 709676.0, 278218.0, 16687.0, 3023.0, 920.0, 353.0, 185.0, 96.0, 51.0, 36.0, 29.0, 22.0, 17.0, 8.0, 7.0, 3.0, 4.0, 2.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.16796875, -5.98577880859375, -5.8035888671875, -5.62139892578125, -5.439208984375, -5.25701904296875, -5.0748291015625, -4.89263916015625, -4.71044921875, -4.52825927734375, -4.3460693359375, -4.16387939453125, -3.981689453125, -3.79949951171875, -3.6173095703125, -3.43511962890625, -3.2529296875, -3.07073974609375, -2.8885498046875, -2.70635986328125, -2.524169921875, -2.34197998046875, -2.1597900390625, -1.97760009765625, -1.79541015625, -1.61322021484375, -1.4310302734375, -1.24884033203125, -1.066650390625, -0.88446044921875, -0.7022705078125, -0.52008056640625, -0.337890625, -0.15570068359375, 0.0264892578125, 0.20867919921875, 0.390869140625, 0.57305908203125, 0.7552490234375, 0.93743896484375, 1.11962890625, 1.30181884765625, 1.4840087890625, 1.66619873046875, 1.848388671875, 2.03057861328125, 2.2127685546875, 2.39495849609375, 2.5771484375, 2.75933837890625, 2.9415283203125, 3.12371826171875, 3.305908203125, 3.48809814453125, 3.6702880859375, 3.85247802734375, 4.03466796875, 4.21685791015625, 4.3990478515625, 4.58123779296875, 4.763427734375, 4.94561767578125, 5.1278076171875, 5.30999755859375, 5.4921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 16.0, 16.0, 24.0, 33.0, 54.0, 56.0, 79.0, 58.0, 59.0, 79.0, 77.0, 87.0, 61.0, 62.0, 54.0, 43.0, 30.0, 35.0, 21.0, 8.0, 17.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57080078125, -0.548919677734375, -0.52703857421875, -0.505157470703125, -0.4832763671875, -0.461395263671875, -0.43951416015625, -0.417633056640625, -0.395751953125, -0.373870849609375, -0.35198974609375, -0.330108642578125, -0.3082275390625, -0.286346435546875, -0.26446533203125, -0.242584228515625, -0.220703125, -0.198822021484375, -0.17694091796875, -0.155059814453125, -0.1331787109375, -0.111297607421875, -0.08941650390625, -0.067535400390625, -0.045654296875, -0.023773193359375, -0.00189208984375, 0.019989013671875, 0.0418701171875, 0.063751220703125, 0.08563232421875, 0.107513427734375, 0.12939453125, 0.151275634765625, 0.17315673828125, 0.195037841796875, 0.2169189453125, 0.238800048828125, 0.26068115234375, 0.282562255859375, 0.304443359375, 0.326324462890625, 0.34820556640625, 0.370086669921875, 0.3919677734375, 0.413848876953125, 0.43572998046875, 0.457611083984375, 0.4794921875, 0.501373291015625, 0.52325439453125, 0.545135498046875, 0.5670166015625, 0.588897705078125, 0.61077880859375, 0.632659912109375, 0.654541015625, 0.676422119140625, 0.69830322265625, 0.720184326171875, 0.7420654296875, 0.763946533203125, 0.78582763671875, 0.807708740234375, 0.82958984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 6.0, 11.0, 19.0, 15.0, 27.0, 31.0, 55.0, 76.0, 103.0, 153.0, 241.0, 454.0, 730.0, 1348.0, 3066.0, 7729.0, 25817.0, 117230.0, 568815.0, 253081.0, 48243.0, 12644.0, 4407.0, 1838.0, 974.0, 502.0, 330.0, 198.0, 132.0, 83.0, 58.0, 40.0, 26.0, 19.0, 13.0, 10.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.33984375, -2.27044677734375, -2.2010498046875, -2.13165283203125, -2.062255859375, -1.99285888671875, -1.9234619140625, -1.85406494140625, -1.78466796875, -1.71527099609375, -1.6458740234375, -1.57647705078125, -1.507080078125, -1.43768310546875, -1.3682861328125, -1.29888916015625, -1.2294921875, -1.16009521484375, -1.0906982421875, -1.02130126953125, -0.951904296875, -0.88250732421875, -0.8131103515625, -0.74371337890625, -0.67431640625, -0.60491943359375, -0.5355224609375, -0.46612548828125, -0.396728515625, -0.32733154296875, -0.2579345703125, -0.18853759765625, -0.119140625, -0.04974365234375, 0.0196533203125, 0.08905029296875, 0.158447265625, 0.22784423828125, 0.2972412109375, 0.36663818359375, 0.43603515625, 0.50543212890625, 0.5748291015625, 0.64422607421875, 0.713623046875, 0.78302001953125, 0.8524169921875, 0.92181396484375, 0.9912109375, 1.06060791015625, 1.1300048828125, 1.19940185546875, 1.268798828125, 1.33819580078125, 1.4075927734375, 1.47698974609375, 1.54638671875, 1.61578369140625, 1.6851806640625, 1.75457763671875, 1.823974609375, 1.89337158203125, 1.9627685546875, 2.03216552734375, 2.1015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 7.0, 8.0, 9.0, 17.0, 21.0, 25.0, 25.0, 32.0, 37.0, 40.0, 44.0, 38.0, 44.0, 51.0, 54.0, 50.0, 48.0, 40.0, 53.0, 49.0, 38.0, 46.0, 37.0, 36.0, 15.0, 33.0, 22.0, 18.0, 16.0, 9.0, 4.0, 7.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.349639892578125, -2.28521728515625, -2.220794677734375, -2.1563720703125, -2.091949462890625, -2.02752685546875, -1.963104248046875, -1.898681640625, -1.834259033203125, -1.76983642578125, -1.705413818359375, -1.6409912109375, -1.576568603515625, -1.51214599609375, -1.447723388671875, -1.38330078125, -1.318878173828125, -1.25445556640625, -1.190032958984375, -1.1256103515625, -1.061187744140625, -0.99676513671875, -0.932342529296875, -0.867919921875, -0.803497314453125, -0.73907470703125, -0.674652099609375, -0.6102294921875, -0.545806884765625, -0.48138427734375, -0.416961669921875, -0.3525390625, -0.288116455078125, -0.22369384765625, -0.159271240234375, -0.0948486328125, -0.030426025390625, 0.03399658203125, 0.098419189453125, 0.162841796875, 0.227264404296875, 0.29168701171875, 0.356109619140625, 0.4205322265625, 0.484954833984375, 0.54937744140625, 0.613800048828125, 0.67822265625, 0.742645263671875, 0.80706787109375, 0.871490478515625, 0.9359130859375, 1.000335693359375, 1.06475830078125, 1.129180908203125, 1.193603515625, 1.258026123046875, 1.32244873046875, 1.386871337890625, 1.4512939453125, 1.515716552734375, 1.58013916015625, 1.644561767578125, 1.708984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 10.0, 16.0, 25.0, 38.0, 55.0, 62.0, 105.0, 249.0, 433.0, 893.0, 2126.0, 5807.0, 20737.0, 110671.0, 755471.0, 119791.0, 21856.0, 6020.0, 2254.0, 928.0, 416.0, 253.0, 115.0, 79.0, 42.0, 32.0, 21.0, 14.0, 12.0, 5.0, 1.0, 4.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.1474227905273438, -1.1141815185546875, -1.0809402465820312, -1.047698974609375, -1.0144577026367188, -0.9812164306640625, -0.9479751586914062, -0.91473388671875, -0.8814926147460938, -0.8482513427734375, -0.8150100708007812, -0.781768798828125, -0.7485275268554688, -0.7152862548828125, -0.6820449829101562, -0.6488037109375, -0.6155624389648438, -0.5823211669921875, -0.5490798950195312, -0.515838623046875, -0.48259735107421875, -0.4493560791015625, -0.41611480712890625, -0.38287353515625, -0.34963226318359375, -0.3163909912109375, -0.28314971923828125, -0.249908447265625, -0.21666717529296875, -0.1834259033203125, -0.15018463134765625, -0.116943359375, -0.08370208740234375, -0.0504608154296875, -0.01721954345703125, 0.016021728515625, 0.04926300048828125, 0.0825042724609375, 0.11574554443359375, 0.14898681640625, 0.18222808837890625, 0.2154693603515625, 0.24871063232421875, 0.281951904296875, 0.31519317626953125, 0.3484344482421875, 0.38167572021484375, 0.4149169921875, 0.44815826416015625, 0.4813995361328125, 0.5146408081054688, 0.547882080078125, 0.5811233520507812, 0.6143646240234375, 0.6476058959960938, 0.68084716796875, 0.7140884399414062, 0.7473297119140625, 0.7805709838867188, 0.813812255859375, 0.8470535278320312, 0.8802947998046875, 0.9135360717773438, 0.94677734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 10.0, 16.0, 13.0, 21.0, 23.0, 42.0, 62.0, 121.0, 330.0, 175.0, 52.0, 53.0, 24.0, 19.0, 14.0, 8.0, 5.0, 7.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004076957702636719, -0.0003952011466026306, -0.00038270652294158936, -0.0003702118992805481, -0.00035771727561950684, -0.0003452226519584656, -0.0003327280282974243, -0.00032023340463638306, -0.0003077387809753418, -0.00029524415731430054, -0.0002827495336532593, -0.000270254909992218, -0.00025776028633117676, -0.0002452656626701355, -0.00023277103900909424, -0.00022027641534805298, -0.00020778179168701172, -0.00019528716802597046, -0.0001827925443649292, -0.00017029792070388794, -0.00015780329704284668, -0.00014530867338180542, -0.00013281404972076416, -0.0001203194260597229, -0.00010782480239868164, -9.533017873764038e-05, -8.283555507659912e-05, -7.034093141555786e-05, -5.78463077545166e-05, -4.535168409347534e-05, -3.285706043243408e-05, -2.0362436771392822e-05, -7.867813110351562e-06, 4.626810550689697e-06, 1.7121434211730957e-05, 2.9616057872772217e-05, 4.2110681533813477e-05, 5.4605305194854736e-05, 6.7099928855896e-05, 7.959455251693726e-05, 9.208917617797852e-05, 0.00010458379983901978, 0.00011707842350006104, 0.0001295730471611023, 0.00014206767082214355, 0.00015456229448318481, 0.00016705691814422607, 0.00017955154180526733, 0.0001920461654663086, 0.00020454078912734985, 0.0002170354127883911, 0.00022953003644943237, 0.00024202466011047363, 0.0002545192837715149, 0.00026701390743255615, 0.0002795085310935974, 0.00029200315475463867, 0.00030449777841567993, 0.0003169924020767212, 0.00032948702573776245, 0.0003419816493988037, 0.00035447627305984497, 0.00036697089672088623, 0.0003794655203819275, 0.00039196014404296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 8.0, 13.0, 13.0, 22.0, 29.0, 35.0, 60.0, 110.0, 150.0, 273.0, 474.0, 912.0, 1875.0, 4592.0, 14824.0, 68769.0, 674414.0, 232898.0, 34418.0, 8631.0, 3047.0, 1415.0, 651.0, 364.0, 186.0, 117.0, 74.0, 53.0, 33.0, 25.0, 16.0, 15.0, 11.0, 2.0, 9.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.0478515625, -1.017730712890625, -0.98760986328125, -0.957489013671875, -0.9273681640625, -0.897247314453125, -0.86712646484375, -0.837005615234375, -0.806884765625, -0.776763916015625, -0.74664306640625, -0.716522216796875, -0.6864013671875, -0.656280517578125, -0.62615966796875, -0.596038818359375, -0.56591796875, -0.535797119140625, -0.50567626953125, -0.475555419921875, -0.4454345703125, -0.415313720703125, -0.38519287109375, -0.355072021484375, -0.324951171875, -0.294830322265625, -0.26470947265625, -0.234588623046875, -0.2044677734375, -0.174346923828125, -0.14422607421875, -0.114105224609375, -0.083984375, -0.053863525390625, -0.02374267578125, 0.006378173828125, 0.0364990234375, 0.066619873046875, 0.09674072265625, 0.126861572265625, 0.156982421875, 0.187103271484375, 0.21722412109375, 0.247344970703125, 0.2774658203125, 0.307586669921875, 0.33770751953125, 0.367828369140625, 0.39794921875, 0.428070068359375, 0.45819091796875, 0.488311767578125, 0.5184326171875, 0.548553466796875, 0.57867431640625, 0.608795166015625, 0.638916015625, 0.669036865234375, 0.69915771484375, 0.729278564453125, 0.7593994140625, 0.789520263671875, 0.81964111328125, 0.849761962890625, 0.8798828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 5.0, 6.0, 11.0, 8.0, 9.0, 19.0, 27.0, 22.0, 47.0, 81.0, 130.0, 167.0, 145.0, 108.0, 73.0, 33.0, 33.0, 23.0, 8.0, 14.0, 10.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.7846450805664062, -0.7606964111328125, -0.7367477416992188, -0.712799072265625, -0.6888504028320312, -0.6649017333984375, -0.6409530639648438, -0.61700439453125, -0.5930557250976562, -0.5691070556640625, -0.5451583862304688, -0.521209716796875, -0.49726104736328125, -0.4733123779296875, -0.44936370849609375, -0.4254150390625, -0.40146636962890625, -0.3775177001953125, -0.35356903076171875, -0.329620361328125, -0.30567169189453125, -0.2817230224609375, -0.25777435302734375, -0.23382568359375, -0.20987701416015625, -0.1859283447265625, -0.16197967529296875, -0.138031005859375, -0.11408233642578125, -0.0901336669921875, -0.06618499755859375, -0.042236328125, -0.01828765869140625, 0.0056610107421875, 0.02960968017578125, 0.053558349609375, 0.07750701904296875, 0.1014556884765625, 0.12540435791015625, 0.14935302734375, 0.17330169677734375, 0.1972503662109375, 0.22119903564453125, 0.245147705078125, 0.26909637451171875, 0.2930450439453125, 0.31699371337890625, 0.3409423828125, 0.36489105224609375, 0.3888397216796875, 0.41278839111328125, 0.436737060546875, 0.46068572998046875, 0.4846343994140625, 0.5085830688476562, 0.53253173828125, 0.5564804077148438, 0.5804290771484375, 0.6043777465820312, 0.628326416015625, 0.6522750854492188, 0.6762237548828125, 0.7001724243164062, 0.72412109375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 12.0, 12.0, 12.0, 41.0, 64.0, 89.0, 111.0, 160.0, 164.0, 127.0, 75.0, 53.0, 35.0, 26.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-21.52381134033203, -21.076377868652344, -20.62894630432129, -20.181514739990234, -19.734081268310547, -19.28664779663086, -18.839216232299805, -18.39178466796875, -17.944351196289062, -17.496917724609375, -17.04948616027832, -16.602054595947266, -16.154621124267578, -15.707188606262207, -15.259756088256836, -14.812323570251465, -14.364891052246094, -13.917458534240723, -13.470026016235352, -13.02259349822998, -12.57516098022461, -12.127728462219238, -11.680295944213867, -11.232863426208496, -10.785430908203125, -10.337998390197754, -9.890565872192383, -9.443133354187012, -8.99570083618164, -8.54826831817627, -8.100835800170898, -7.653403282165527, -7.205970764160156, -6.758538246154785, -6.311105728149414, -5.863673210144043, -5.416240692138672, -4.968808174133301, -4.52137565612793, -4.073943138122559, -3.6265106201171875, -3.1790781021118164, -2.7316455841064453, -2.284213066101074, -1.8367805480957031, -1.389348030090332, -0.9419155120849609, -0.49448299407958984, -0.04705047607421875, 0.40038204193115234, 0.8478145599365234, 1.2952470779418945, 1.7426795959472656, 2.1901121139526367, 2.637544631958008, 3.084977149963379, 3.53240966796875, 3.979842185974121, 4.427274703979492, 4.874707221984863, 5.322139739990234, 5.7695722579956055, 6.217004776000977, 6.664437294006348, 7.111869812011719]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 10.0, 13.0, 9.0, 16.0, 14.0, 16.0, 24.0, 33.0, 21.0, 23.0, 40.0, 40.0, 37.0, 40.0, 33.0, 38.0, 42.0, 47.0, 49.0, 43.0, 36.0, 30.0, 38.0, 31.0, 33.0, 32.0, 23.0, 19.0, 22.0, 18.0, 20.0, 14.0, 16.0, 7.0, 16.0, 13.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-9.522441864013672, -9.247241973876953, -8.972042083740234, -8.696842193603516, -8.421642303466797, -8.146442413330078, -7.871243000030518, -7.596043109893799, -7.32084321975708, -7.045643329620361, -6.770443439483643, -6.495243549346924, -6.220044136047363, -5.9448442459106445, -5.669644355773926, -5.394444465637207, -5.119244575500488, -4.8440446853637695, -4.568844795227051, -4.293644905090332, -4.018445014953613, -3.7432453632354736, -3.468045711517334, -3.1928458213806152, -2.9176459312438965, -2.6424460411071777, -2.367246150970459, -2.0920464992523193, -1.8168466091156006, -1.5416467189788818, -1.2664469480514526, -0.9912471771240234, -0.7160482406616211, -0.4408484101295471, -0.16564857959747314, 0.10955125093460083, 0.3847510814666748, 0.6599509716033936, 0.9351507425308228, 1.210350513458252, 1.4855504035949707, 1.7607502937316895, 2.035950183868408, 2.311149835586548, 2.5863497257232666, 2.8615496158599854, 3.136749267578125, 3.4119491577148438, 3.6871490478515625, 3.9623489379882812, 4.237548828125, 4.512748718261719, 4.7879486083984375, 5.063148498535156, 5.338347911834717, 5.6135478019714355, 5.888747692108154, 6.163947582244873, 6.439147472381592, 6.7143473625183105, 6.989546775817871, 7.26474666595459, 7.539946556091309, 7.815146446228027, 8.090346336364746]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 15.0, 15.0, 6.0, 31.0, 30.0, 81.0, 132.0, 294.0, 713.0, 2225.0, 10919.0, 4067414.0, 104054.0, 5810.0, 1489.0, 488.0, 229.0, 100.0, 65.0, 45.0, 23.0, 19.0, 20.0, 9.0, 9.0, 7.0, 9.0, 5.0, 1.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.6656494140625, -6.385986328125, -6.1063232421875, -5.82666015625, -5.5469970703125, -5.267333984375, -4.9876708984375, -4.7080078125, -4.4283447265625, -4.148681640625, -3.8690185546875, -3.58935546875, -3.3096923828125, -3.030029296875, -2.7503662109375, -2.470703125, -2.1910400390625, -1.911376953125, -1.6317138671875, -1.35205078125, -1.0723876953125, -0.792724609375, -0.5130615234375, -0.2333984375, 0.0462646484375, 0.325927734375, 0.6055908203125, 0.88525390625, 1.1649169921875, 1.444580078125, 1.7242431640625, 2.00390625, 2.2835693359375, 2.563232421875, 2.8428955078125, 3.12255859375, 3.4022216796875, 3.681884765625, 3.9615478515625, 4.2412109375, 4.5208740234375, 4.800537109375, 5.0802001953125, 5.35986328125, 5.6395263671875, 5.919189453125, 6.1988525390625, 6.478515625, 6.7581787109375, 7.037841796875, 7.3175048828125, 7.59716796875, 7.8768310546875, 8.156494140625, 8.4361572265625, 8.7158203125, 8.9954833984375, 9.275146484375, 9.5548095703125, 9.83447265625, 10.1141357421875, 10.393798828125, 10.6734619140625, 10.953125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 14.0, 19.0, 14.0, 27.0, 28.0, 34.0, 50.0, 63.0, 62.0, 64.0, 65.0, 68.0, 75.0, 75.0, 63.0, 58.0, 53.0, 43.0, 30.0, 21.0, 27.0, 13.0, 5.0, 13.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5476226806640625, -0.525421142578125, -0.5032196044921875, -0.48101806640625, -0.4588165283203125, -0.436614990234375, -0.4144134521484375, -0.3922119140625, -0.3700103759765625, -0.347808837890625, -0.3256072998046875, -0.30340576171875, -0.2812042236328125, -0.259002685546875, -0.2368011474609375, -0.214599609375, -0.1923980712890625, -0.170196533203125, -0.1479949951171875, -0.12579345703125, -0.1035919189453125, -0.081390380859375, -0.0591888427734375, -0.0369873046875, -0.0147857666015625, 0.007415771484375, 0.0296173095703125, 0.05181884765625, 0.0740203857421875, 0.096221923828125, 0.1184234619140625, 0.140625, 0.1628265380859375, 0.185028076171875, 0.2072296142578125, 0.22943115234375, 0.2516326904296875, 0.273834228515625, 0.2960357666015625, 0.3182373046875, 0.3404388427734375, 0.362640380859375, 0.3848419189453125, 0.40704345703125, 0.4292449951171875, 0.451446533203125, 0.4736480712890625, 0.495849609375, 0.5180511474609375, 0.540252685546875, 0.5624542236328125, 0.58465576171875, 0.6068572998046875, 0.629058837890625, 0.6512603759765625, 0.6734619140625, 0.6956634521484375, 0.717864990234375, 0.7400665283203125, 0.76226806640625, 0.7844696044921875, 0.806671142578125, 0.8288726806640625, 0.85107421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 13.0, 8.0, 16.0, 22.0, 24.0, 27.0, 42.0, 53.0, 90.0, 161.0, 300.0, 619.0, 1504.0, 4147.0, 16292.0, 599729.0, 3543010.0, 20316.0, 4660.0, 1671.0, 653.0, 337.0, 187.0, 94.0, 55.0, 38.0, 34.0, 30.0, 26.0, 14.0, 23.0, 14.0, 10.0, 7.0, 6.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.3338623046875, -4.179443359375, -4.0250244140625, -3.87060546875, -3.7161865234375, -3.561767578125, -3.4073486328125, -3.2529296875, -3.0985107421875, -2.944091796875, -2.7896728515625, -2.63525390625, -2.4808349609375, -2.326416015625, -2.1719970703125, -2.017578125, -1.8631591796875, -1.708740234375, -1.5543212890625, -1.39990234375, -1.2454833984375, -1.091064453125, -0.9366455078125, -0.7822265625, -0.6278076171875, -0.473388671875, -0.3189697265625, -0.16455078125, -0.0101318359375, 0.144287109375, 0.2987060546875, 0.453125, 0.6075439453125, 0.761962890625, 0.9163818359375, 1.07080078125, 1.2252197265625, 1.379638671875, 1.5340576171875, 1.6884765625, 1.8428955078125, 1.997314453125, 2.1517333984375, 2.30615234375, 2.4605712890625, 2.614990234375, 2.7694091796875, 2.923828125, 3.0782470703125, 3.232666015625, 3.3870849609375, 3.54150390625, 3.6959228515625, 3.850341796875, 4.0047607421875, 4.1591796875, 4.3135986328125, 4.468017578125, 4.6224365234375, 4.77685546875, 4.9312744140625, 5.085693359375, 5.2401123046875, 5.39453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 6.0, 9.0, 8.0, 20.0, 22.0, 37.0, 85.0, 417.0, 2934.0, 370.0, 66.0, 35.0, 28.0, 14.0, 11.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.7328338623046875, -0.685394287109375, -0.6379547119140625, -0.59051513671875, -0.5430755615234375, -0.495635986328125, -0.4481964111328125, -0.4007568359375, -0.3533172607421875, -0.305877685546875, -0.2584381103515625, -0.21099853515625, -0.1635589599609375, -0.116119384765625, -0.0686798095703125, -0.021240234375, 0.0261993408203125, 0.073638916015625, 0.1210784912109375, 0.16851806640625, 0.2159576416015625, 0.263397216796875, 0.3108367919921875, 0.3582763671875, 0.4057159423828125, 0.453155517578125, 0.5005950927734375, 0.54803466796875, 0.5954742431640625, 0.642913818359375, 0.6903533935546875, 0.73779296875, 0.7852325439453125, 0.832672119140625, 0.8801116943359375, 0.92755126953125, 0.9749908447265625, 1.022430419921875, 1.0698699951171875, 1.1173095703125, 1.1647491455078125, 1.212188720703125, 1.2596282958984375, 1.30706787109375, 1.3545074462890625, 1.401947021484375, 1.4493865966796875, 1.496826171875, 1.5442657470703125, 1.591705322265625, 1.6391448974609375, 1.68658447265625, 1.7340240478515625, 1.781463623046875, 1.8289031982421875, 1.8763427734375, 1.9237823486328125, 1.971221923828125, 2.0186614990234375, 2.06610107421875, 2.1135406494140625, 2.160980224609375, 2.2084197998046875, 2.255859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 9.0, 20.0, 40.0, 111.0, 318.0, 293.0, 135.0, 41.0, 16.0, 5.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.804039001464844, -10.486967086791992, -10.16989517211914, -9.852823257446289, -9.535750389099121, -9.21867847442627, -8.901606559753418, -8.584534645080566, -8.267462730407715, -7.950390815734863, -7.6333184242248535, -7.316246509552002, -6.99917459487915, -6.682102203369141, -6.365030288696289, -6.0479583740234375, -5.730885982513428, -5.413814067840576, -5.096741676330566, -4.779669761657715, -4.462597846984863, -4.145525932312012, -3.828453540802002, -3.5113816261291504, -3.1943094730377197, -2.877237319946289, -2.5601654052734375, -2.243093252182007, -1.9260212182998657, -1.6089491844177246, -1.291877031326294, -0.9748051166534424, -0.6577329635620117, -0.3406608998775482, -0.023588836193084717, 0.29348325729370117, 0.6105552911758423, 0.9276273250579834, 1.244699478149414, 1.5617713928222656, 1.8788435459136963, 2.195915699005127, 2.5129876136779785, 2.830059766769409, 3.14713191986084, 3.4642038345336914, 3.781275987625122, 4.0983476638793945, 4.415420055389404, 4.732491970062256, 5.049564361572266, 5.366636276245117, 5.683708190917969, 6.00078010559082, 6.31785249710083, 6.634924411773682, 6.951996803283691, 7.269068717956543, 7.586141109466553, 7.903213024139404, 8.220285415649414, 8.537357330322266, 8.854429244995117, 9.171501159667969, 9.48857307434082]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 10.0, 18.0, 16.0, 28.0, 35.0, 42.0, 51.0, 70.0, 58.0, 84.0, 82.0, 73.0, 95.0, 88.0, 60.0, 50.0, 44.0, 37.0, 17.0, 22.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.007857799530029, -3.8816070556640625, -3.7553560733795166, -3.62910532951355, -3.502854347229004, -3.376603603363037, -3.2503528594970703, -3.1241021156311035, -2.9978511333465576, -2.871600389480591, -2.745349407196045, -2.619098663330078, -2.4928479194641113, -2.3665969371795654, -2.2403461933135986, -2.1140952110290527, -1.987844467163086, -1.8615936040878296, -1.7353427410125732, -1.6090919971466064, -1.48284113407135, -1.3565902709960938, -1.230339527130127, -1.1040886640548706, -0.9778378009796143, -0.8515869379043579, -0.7253361344337463, -0.5990853309631348, -0.4728344678878784, -0.34658360481262207, -0.2203328013420105, -0.09408199787139893, 0.03216886520385742, 0.15841969847679138, 0.28467053174972534, 0.4109213650226593, 0.5371721982955933, 0.6634230613708496, 0.7896738648414612, 0.9159246683120728, 1.042175531387329, 1.1684263944625854, 1.2946772575378418, 1.4209280014038086, 1.547178864479065, 1.6734297275543213, 1.799680471420288, 1.9259313344955444, 2.052182197570801, 2.1784329414367676, 2.3046839237213135, 2.4309346675872803, 2.557185649871826, 2.683436393737793, 2.8096871376037598, 2.9359378814697266, 3.0621888637542725, 3.1884396076202393, 3.314690589904785, 3.440941333770752, 3.5671920776367188, 3.6934430599212646, 3.8196938037872314, 3.9459447860717773, 4.072195529937744]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 12.0, 7.0, 30.0, 33.0, 48.0, 70.0, 168.0, 339.0, 906.0, 3286.0, 20678.0, 393304.0, 595224.0, 28591.0, 3997.0, 1054.0, 361.0, 170.0, 92.0, 47.0, 32.0, 21.0, 20.0, 9.0, 11.0, 6.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.63995361328125, -3.4947509765625, -3.34954833984375, -3.204345703125, -3.05914306640625, -2.9139404296875, -2.76873779296875, -2.62353515625, -2.47833251953125, -2.3331298828125, -2.18792724609375, -2.042724609375, -1.89752197265625, -1.7523193359375, -1.60711669921875, -1.4619140625, -1.31671142578125, -1.1715087890625, -1.02630615234375, -0.881103515625, -0.73590087890625, -0.5906982421875, -0.44549560546875, -0.30029296875, -0.15509033203125, -0.0098876953125, 0.13531494140625, 0.280517578125, 0.42572021484375, 0.5709228515625, 0.71612548828125, 0.861328125, 1.00653076171875, 1.1517333984375, 1.29693603515625, 1.442138671875, 1.58734130859375, 1.7325439453125, 1.87774658203125, 2.02294921875, 2.16815185546875, 2.3133544921875, 2.45855712890625, 2.603759765625, 2.74896240234375, 2.8941650390625, 3.03936767578125, 3.1845703125, 3.32977294921875, 3.4749755859375, 3.62017822265625, 3.765380859375, 3.91058349609375, 4.0557861328125, 4.20098876953125, 4.34619140625, 4.49139404296875, 4.6365966796875, 4.78179931640625, 4.927001953125, 5.07220458984375, 5.2174072265625, 5.36260986328125, 5.5078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 10.0, 12.0, 15.0, 23.0, 33.0, 36.0, 47.0, 72.0, 76.0, 76.0, 78.0, 80.0, 73.0, 86.0, 66.0, 46.0, 45.0, 33.0, 30.0, 22.0, 11.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59033203125, -0.5659713745117188, -0.5416107177734375, -0.5172500610351562, -0.492889404296875, -0.46852874755859375, -0.4441680908203125, -0.41980743408203125, -0.39544677734375, -0.37108612060546875, -0.3467254638671875, -0.32236480712890625, -0.298004150390625, -0.27364349365234375, -0.2492828369140625, -0.22492218017578125, -0.2005615234375, -0.17620086669921875, -0.1518402099609375, -0.12747955322265625, -0.103118896484375, -0.07875823974609375, -0.0543975830078125, -0.03003692626953125, -0.00567626953125, 0.01868438720703125, 0.0430450439453125, 0.06740570068359375, 0.091766357421875, 0.11612701416015625, 0.1404876708984375, 0.16484832763671875, 0.189208984375, 0.21356964111328125, 0.2379302978515625, 0.26229095458984375, 0.286651611328125, 0.31101226806640625, 0.3353729248046875, 0.35973358154296875, 0.38409423828125, 0.40845489501953125, 0.4328155517578125, 0.45717620849609375, 0.481536865234375, 0.5058975219726562, 0.5302581787109375, 0.5546188354492188, 0.5789794921875, 0.6033401489257812, 0.6277008056640625, 0.6520614624023438, 0.676422119140625, 0.7007827758789062, 0.7251434326171875, 0.7495040893554688, 0.77386474609375, 0.7982254028320312, 0.8225860595703125, 0.8469467163085938, 0.871307373046875, 0.8956680297851562, 0.9200286865234375, 0.9443893432617188, 0.96875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 11.0, 10.0, 11.0, 12.0, 26.0, 29.0, 42.0, 48.0, 59.0, 95.0, 165.0, 256.0, 423.0, 782.0, 1548.0, 3187.0, 7576.0, 20041.0, 62649.0, 230542.0, 487478.0, 160650.0, 46217.0, 15218.0, 5974.0, 2540.0, 1267.0, 621.0, 377.0, 234.0, 133.0, 97.0, 58.0, 43.0, 28.0, 26.0, 19.0, 11.0, 13.0, 8.0, 10.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3916015625, -1.3457794189453125, -1.299957275390625, -1.2541351318359375, -1.20831298828125, -1.1624908447265625, -1.116668701171875, -1.0708465576171875, -1.0250244140625, -0.9792022705078125, -0.933380126953125, -0.8875579833984375, -0.84173583984375, -0.7959136962890625, -0.750091552734375, -0.7042694091796875, -0.658447265625, -0.6126251220703125, -0.566802978515625, -0.5209808349609375, -0.47515869140625, -0.4293365478515625, -0.383514404296875, -0.3376922607421875, -0.2918701171875, -0.2460479736328125, -0.200225830078125, -0.1544036865234375, -0.10858154296875, -0.0627593994140625, -0.016937255859375, 0.0288848876953125, 0.07470703125, 0.1205291748046875, 0.166351318359375, 0.2121734619140625, 0.25799560546875, 0.3038177490234375, 0.349639892578125, 0.3954620361328125, 0.4412841796875, 0.4871063232421875, 0.532928466796875, 0.5787506103515625, 0.62457275390625, 0.6703948974609375, 0.716217041015625, 0.7620391845703125, 0.807861328125, 0.8536834716796875, 0.899505615234375, 0.9453277587890625, 0.99114990234375, 1.0369720458984375, 1.082794189453125, 1.1286163330078125, 1.1744384765625, 1.2202606201171875, 1.266082763671875, 1.3119049072265625, 1.35772705078125, 1.4035491943359375, 1.449371337890625, 1.4951934814453125, 1.541015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 0.0, 3.0, 4.0, 6.0, 9.0, 9.0, 9.0, 5.0, 20.0, 19.0, 24.0, 27.0, 25.0, 30.0, 36.0, 31.0, 44.0, 52.0, 39.0, 42.0, 42.0, 49.0, 36.0, 48.0, 40.0, 45.0, 39.0, 35.0, 36.0, 29.0, 20.0, 25.0, 21.0, 15.0, 17.0, 11.0, 23.0, 7.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.892578125, -1.8363037109375, -1.780029296875, -1.7237548828125, -1.66748046875, -1.6112060546875, -1.554931640625, -1.4986572265625, -1.4423828125, -1.3861083984375, -1.329833984375, -1.2735595703125, -1.21728515625, -1.1610107421875, -1.104736328125, -1.0484619140625, -0.9921875, -0.9359130859375, -0.879638671875, -0.8233642578125, -0.76708984375, -0.7108154296875, -0.654541015625, -0.5982666015625, -0.5419921875, -0.4857177734375, -0.429443359375, -0.3731689453125, -0.31689453125, -0.2606201171875, -0.204345703125, -0.1480712890625, -0.091796875, -0.0355224609375, 0.020751953125, 0.0770263671875, 0.13330078125, 0.1895751953125, 0.245849609375, 0.3021240234375, 0.3583984375, 0.4146728515625, 0.470947265625, 0.5272216796875, 0.58349609375, 0.6397705078125, 0.696044921875, 0.7523193359375, 0.80859375, 0.8648681640625, 0.921142578125, 0.9774169921875, 1.03369140625, 1.0899658203125, 1.146240234375, 1.2025146484375, 1.2587890625, 1.3150634765625, 1.371337890625, 1.4276123046875, 1.48388671875, 1.5401611328125, 1.596435546875, 1.6527099609375, 1.708984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 10.0, 15.0, 14.0, 16.0, 22.0, 35.0, 54.0, 107.0, 244.0, 536.0, 1235.0, 3711.0, 12598.0, 56389.0, 590550.0, 329439.0, 39286.0, 9586.0, 2779.0, 1048.0, 415.0, 182.0, 105.0, 50.0, 40.0, 33.0, 19.0, 12.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.884765625, -0.8586578369140625, -0.832550048828125, -0.8064422607421875, -0.78033447265625, -0.7542266845703125, -0.728118896484375, -0.7020111083984375, -0.6759033203125, -0.6497955322265625, -0.623687744140625, -0.5975799560546875, -0.57147216796875, -0.5453643798828125, -0.519256591796875, -0.4931488037109375, -0.467041015625, -0.4409332275390625, -0.414825439453125, -0.3887176513671875, -0.36260986328125, -0.3365020751953125, -0.310394287109375, -0.2842864990234375, -0.2581787109375, -0.2320709228515625, -0.205963134765625, -0.1798553466796875, -0.15374755859375, -0.1276397705078125, -0.101531982421875, -0.0754241943359375, -0.04931640625, -0.0232086181640625, 0.002899169921875, 0.0290069580078125, 0.05511474609375, 0.0812225341796875, 0.107330322265625, 0.1334381103515625, 0.1595458984375, 0.1856536865234375, 0.211761474609375, 0.2378692626953125, 0.26397705078125, 0.2900848388671875, 0.316192626953125, 0.3423004150390625, 0.368408203125, 0.3945159912109375, 0.420623779296875, 0.4467315673828125, 0.47283935546875, 0.4989471435546875, 0.525054931640625, 0.5511627197265625, 0.5772705078125, 0.6033782958984375, 0.629486083984375, 0.6555938720703125, 0.68170166015625, 0.7078094482421875, 0.733917236328125, 0.7600250244140625, 0.7861328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 9.0, 9.0, 8.0, 15.0, 19.0, 12.0, 22.0, 27.0, 81.0, 182.0, 264.0, 153.0, 50.0, 33.0, 23.0, 13.0, 17.0, 18.0, 7.0, 12.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0002913475036621094, -0.00028412602841854095, -0.00027690455317497253, -0.0002696830779314041, -0.0002624616026878357, -0.0002552401274442673, -0.00024801865220069885, -0.00024079717695713043, -0.000233575701713562, -0.0002263542264699936, -0.00021913275122642517, -0.00021191127598285675, -0.00020468980073928833, -0.0001974683254957199, -0.0001902468502521515, -0.00018302537500858307, -0.00017580389976501465, -0.00016858242452144623, -0.0001613609492778778, -0.0001541394740343094, -0.00014691799879074097, -0.00013969652354717255, -0.00013247504830360413, -0.0001252535730600357, -0.00011803209781646729, -0.00011081062257289886, -0.00010358914732933044, -9.636767208576202e-05, -8.91461968421936e-05, -8.192472159862518e-05, -7.470324635505676e-05, -6.748177111148834e-05, -6.026029586791992e-05, -5.30388206243515e-05, -4.581734538078308e-05, -3.859587013721466e-05, -3.137439489364624e-05, -2.415291965007782e-05, -1.69314444065094e-05, -9.709969162940979e-06, -2.4884939193725586e-06, 4.732981324195862e-06, 1.1954456567764282e-05, 1.9175931811332703e-05, 2.6397407054901123e-05, 3.3618882298469543e-05, 4.0840357542037964e-05, 4.8061832785606384e-05, 5.5283308029174805e-05, 6.250478327274323e-05, 6.972625851631165e-05, 7.694773375988007e-05, 8.416920900344849e-05, 9.13906842470169e-05, 9.861215949058533e-05, 0.00010583363473415375, 0.00011305510997772217, 0.00012027658522129059, 0.000127498060464859, 0.00013471953570842743, 0.00014194101095199585, 0.00014916248619556427, 0.0001563839614391327, 0.0001636054366827011, 0.00017082691192626953]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 8.0, 16.0, 27.0, 45.0, 42.0, 98.0, 170.0, 325.0, 725.0, 1807.0, 5669.0, 20972.0, 110820.0, 756676.0, 119949.0, 22003.0, 5913.0, 1837.0, 686.0, 306.0, 172.0, 86.0, 66.0, 34.0, 27.0, 14.0, 18.0, 5.0, 11.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.82861328125, -0.803131103515625, -0.77764892578125, -0.752166748046875, -0.7266845703125, -0.701202392578125, -0.67572021484375, -0.650238037109375, -0.624755859375, -0.599273681640625, -0.57379150390625, -0.548309326171875, -0.5228271484375, -0.497344970703125, -0.47186279296875, -0.446380615234375, -0.4208984375, -0.395416259765625, -0.36993408203125, -0.344451904296875, -0.3189697265625, -0.293487548828125, -0.26800537109375, -0.242523193359375, -0.217041015625, -0.191558837890625, -0.16607666015625, -0.140594482421875, -0.1151123046875, -0.089630126953125, -0.06414794921875, -0.038665771484375, -0.01318359375, 0.012298583984375, 0.03778076171875, 0.063262939453125, 0.0887451171875, 0.114227294921875, 0.13970947265625, 0.165191650390625, 0.190673828125, 0.216156005859375, 0.24163818359375, 0.267120361328125, 0.2926025390625, 0.318084716796875, 0.34356689453125, 0.369049072265625, 0.39453125, 0.420013427734375, 0.44549560546875, 0.470977783203125, 0.4964599609375, 0.521942138671875, 0.54742431640625, 0.572906494140625, 0.598388671875, 0.623870849609375, 0.64935302734375, 0.674835205078125, 0.7003173828125, 0.725799560546875, 0.75128173828125, 0.776763916015625, 0.80224609375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 12.0, 8.0, 15.0, 16.0, 25.0, 42.0, 74.0, 132.0, 201.0, 218.0, 107.0, 54.0, 34.0, 18.0, 14.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.5416641235351562, -0.5144805908203125, -0.48729705810546875, -0.460113525390625, -0.43292999267578125, -0.4057464599609375, -0.37856292724609375, -0.35137939453125, -0.32419586181640625, -0.2970123291015625, -0.26982879638671875, -0.242645263671875, -0.21546173095703125, -0.1882781982421875, -0.16109466552734375, -0.1339111328125, -0.10672760009765625, -0.0795440673828125, -0.05236053466796875, -0.025177001953125, 0.00200653076171875, 0.0291900634765625, 0.05637359619140625, 0.08355712890625, 0.11074066162109375, 0.1379241943359375, 0.16510772705078125, 0.192291259765625, 0.21947479248046875, 0.2466583251953125, 0.27384185791015625, 0.301025390625, 0.32820892333984375, 0.3553924560546875, 0.38257598876953125, 0.409759521484375, 0.43694305419921875, 0.4641265869140625, 0.49131011962890625, 0.51849365234375, 0.5456771850585938, 0.5728607177734375, 0.6000442504882812, 0.627227783203125, 0.6544113159179688, 0.6815948486328125, 0.7087783813476562, 0.7359619140625, 0.7631454467773438, 0.7903289794921875, 0.8175125122070312, 0.844696044921875, 0.8718795776367188, 0.8990631103515625, 0.9262466430664062, 0.95343017578125, 0.9806137084960938, 1.0077972412109375, 1.0349807739257812, 1.062164306640625, 1.0893478393554688, 1.1165313720703125, 1.1437149047851562, 1.1708984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 9.0, 8.0, 19.0, 38.0, 62.0, 98.0, 137.0, 168.0, 154.0, 116.0, 78.0, 43.0, 35.0, 14.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.06808853149414, -16.658336639404297, -16.248584747314453, -15.83883285522461, -15.429080963134766, -15.019329071044922, -14.609577178955078, -14.199825286865234, -13.79007339477539, -13.380321502685547, -12.970569610595703, -12.56081771850586, -12.151065826416016, -11.741313934326172, -11.331562042236328, -10.921810150146484, -10.512057304382324, -10.10230541229248, -9.692553520202637, -9.282801628112793, -8.87304973602295, -8.463297843933105, -8.053544998168945, -7.64379358291626, -7.234041690826416, -6.824289798736572, -6.4145379066467285, -6.004785537719727, -5.595033645629883, -5.185281753540039, -4.775529861450195, -4.365777969360352, -3.956026077270508, -3.546274185180664, -3.1365222930908203, -2.7267701625823975, -2.3170182704925537, -1.90726637840271, -1.497514247894287, -1.0877623558044434, -0.6780104637145996, -0.2682585120201111, 0.14149343967437744, 0.5512454509735107, 0.9609973430633545, 1.3707492351531982, 1.780501365661621, 2.190253257751465, 2.6000051498413086, 3.0097570419311523, 3.419508934020996, 3.829261064529419, 4.239012718200684, 4.648764610290527, 5.058516979217529, 5.468268871307373, 5.878020763397217, 6.2877726554870605, 6.697524547576904, 7.107276916503906, 7.51702880859375, 7.926780700683594, 8.336532592773438, 8.746284484863281, 9.156036376953125]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 10.0, 5.0, 12.0, 11.0, 19.0, 21.0, 19.0, 22.0, 29.0, 28.0, 39.0, 30.0, 40.0, 48.0, 43.0, 38.0, 59.0, 54.0, 43.0, 50.0, 30.0, 42.0, 31.0, 25.0, 37.0, 30.0, 18.0, 26.0, 20.0, 15.0, 22.0, 19.0, 14.0, 16.0, 9.0, 9.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.673399925231934, -9.401901245117188, -9.130402565002441, -8.858902931213379, -8.587404251098633, -8.315905570983887, -8.04440689086914, -7.7729082107543945, -7.50140905380249, -7.229910373687744, -6.95841121673584, -6.686912536621094, -6.415413856506348, -6.143914699554443, -5.872416019439697, -5.600916862487793, -5.329418182373047, -5.057919502258301, -4.7864203453063965, -4.51492166519165, -4.243422508239746, -3.971923828125, -3.700425148010254, -3.4289262294769287, -3.1574273109436035, -2.8859283924102783, -2.614429473876953, -2.342930793762207, -2.071431875228882, -1.7999329566955566, -1.528434157371521, -1.2569353580474854, -0.9854373931884766, -0.7139385342597961, -0.4424396753311157, -0.1709408164024353, 0.10055804252624512, 0.3720569610595703, 0.643555760383606, 0.9150545597076416, 1.1865534782409668, 1.458052396774292, 1.7295511960983276, 2.0010499954223633, 2.2725489139556885, 2.5440478324890137, 2.8155465126037598, 3.087045431137085, 3.35854434967041, 3.6300432682037354, 3.9015421867370605, 4.173040866851807, 4.444540023803711, 4.716038703918457, 4.987537384033203, 5.259036064147949, 5.5305352210998535, 5.8020339012146, 6.073533058166504, 6.34503173828125, 6.616530418395996, 6.8880295753479, 7.1595282554626465, 7.431027412414551, 7.702526092529297]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 14.0, 16.0, 14.0, 47.0, 63.0, 146.0, 299.0, 645.0, 1986.0, 8962.0, 1205745.0, 2964658.0, 8511.0, 1817.0, 656.0, 304.0, 135.0, 66.0, 54.0, 32.0, 25.0, 17.0, 9.0, 8.0, 9.0, 1.0, 6.0, 9.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.86328125, -5.61907958984375, -5.3748779296875, -5.13067626953125, -4.886474609375, -4.64227294921875, -4.3980712890625, -4.15386962890625, -3.90966796875, -3.66546630859375, -3.4212646484375, -3.17706298828125, -2.932861328125, -2.68865966796875, -2.4444580078125, -2.20025634765625, -1.9560546875, -1.71185302734375, -1.4676513671875, -1.22344970703125, -0.979248046875, -0.73504638671875, -0.4908447265625, -0.24664306640625, -0.00244140625, 0.24176025390625, 0.4859619140625, 0.73016357421875, 0.974365234375, 1.21856689453125, 1.4627685546875, 1.70697021484375, 1.951171875, 2.19537353515625, 2.4395751953125, 2.68377685546875, 2.927978515625, 3.17218017578125, 3.4163818359375, 3.66058349609375, 3.90478515625, 4.14898681640625, 4.3931884765625, 4.63739013671875, 4.881591796875, 5.12579345703125, 5.3699951171875, 5.61419677734375, 5.8583984375, 6.10260009765625, 6.3468017578125, 6.59100341796875, 6.835205078125, 7.07940673828125, 7.3236083984375, 7.56781005859375, 7.81201171875, 8.05621337890625, 8.3004150390625, 8.54461669921875, 8.788818359375, 9.03302001953125, 9.2772216796875, 9.52142333984375, 9.765625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 13.0, 10.0, 17.0, 18.0, 27.0, 24.0, 40.0, 40.0, 45.0, 66.0, 65.0, 74.0, 86.0, 73.0, 60.0, 70.0, 48.0, 50.0, 39.0, 43.0, 29.0, 21.0, 13.0, 7.0, 9.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61865234375, -0.59637451171875, -0.5740966796875, -0.55181884765625, -0.529541015625, -0.50726318359375, -0.4849853515625, -0.46270751953125, -0.4404296875, -0.41815185546875, -0.3958740234375, -0.37359619140625, -0.351318359375, -0.32904052734375, -0.3067626953125, -0.28448486328125, -0.26220703125, -0.23992919921875, -0.2176513671875, -0.19537353515625, -0.173095703125, -0.15081787109375, -0.1285400390625, -0.10626220703125, -0.083984375, -0.06170654296875, -0.0394287109375, -0.01715087890625, 0.005126953125, 0.02740478515625, 0.0496826171875, 0.07196044921875, 0.09423828125, 0.11651611328125, 0.1387939453125, 0.16107177734375, 0.183349609375, 0.20562744140625, 0.2279052734375, 0.25018310546875, 0.2724609375, 0.29473876953125, 0.3170166015625, 0.33929443359375, 0.361572265625, 0.38385009765625, 0.4061279296875, 0.42840576171875, 0.45068359375, 0.47296142578125, 0.4952392578125, 0.51751708984375, 0.539794921875, 0.56207275390625, 0.5843505859375, 0.60662841796875, 0.62890625, 0.65118408203125, 0.6734619140625, 0.69573974609375, 0.718017578125, 0.74029541015625, 0.7625732421875, 0.78485107421875, 0.80712890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 6.0, 9.0, 8.0, 8.0, 18.0, 26.0, 30.0, 34.0, 68.0, 115.0, 152.0, 265.0, 396.0, 732.0, 1332.0, 2764.0, 6310.0, 19195.0, 194400.0, 3892632.0, 55262.0, 11514.0, 4430.0, 2018.0, 1101.0, 533.0, 343.0, 207.0, 118.0, 69.0, 58.0, 34.0, 25.0, 9.0, 17.0, 14.0, 1.0, 11.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.638671875, -3.5260009765625, -3.413330078125, -3.3006591796875, -3.18798828125, -3.0753173828125, -2.962646484375, -2.8499755859375, -2.7373046875, -2.6246337890625, -2.511962890625, -2.3992919921875, -2.28662109375, -2.1739501953125, -2.061279296875, -1.9486083984375, -1.8359375, -1.7232666015625, -1.610595703125, -1.4979248046875, -1.38525390625, -1.2725830078125, -1.159912109375, -1.0472412109375, -0.9345703125, -0.8218994140625, -0.709228515625, -0.5965576171875, -0.48388671875, -0.3712158203125, -0.258544921875, -0.1458740234375, -0.033203125, 0.0794677734375, 0.192138671875, 0.3048095703125, 0.41748046875, 0.5301513671875, 0.642822265625, 0.7554931640625, 0.8681640625, 0.9808349609375, 1.093505859375, 1.2061767578125, 1.31884765625, 1.4315185546875, 1.544189453125, 1.6568603515625, 1.76953125, 1.8822021484375, 1.994873046875, 2.1075439453125, 2.22021484375, 2.3328857421875, 2.445556640625, 2.5582275390625, 2.6708984375, 2.7835693359375, 2.896240234375, 3.0089111328125, 3.12158203125, 3.2342529296875, 3.346923828125, 3.4595947265625, 3.572265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 8.0, 19.0, 31.0, 37.0, 77.0, 205.0, 1150.0, 2113.0, 222.0, 75.0, 38.0, 20.0, 12.0, 10.0, 5.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4990234375, -1.4616317749023438, -1.4242401123046875, -1.3868484497070312, -1.349456787109375, -1.3120651245117188, -1.2746734619140625, -1.2372817993164062, -1.19989013671875, -1.1624984741210938, -1.1251068115234375, -1.0877151489257812, -1.050323486328125, -1.0129318237304688, -0.9755401611328125, -0.9381484985351562, -0.9007568359375, -0.8633651733398438, -0.8259735107421875, -0.7885818481445312, -0.751190185546875, -0.7137985229492188, -0.6764068603515625, -0.6390151977539062, -0.60162353515625, -0.5642318725585938, -0.5268402099609375, -0.48944854736328125, -0.452056884765625, -0.41466522216796875, -0.3772735595703125, -0.33988189697265625, -0.302490234375, -0.26509857177734375, -0.2277069091796875, -0.19031524658203125, -0.152923583984375, -0.11553192138671875, -0.0781402587890625, -0.04074859619140625, -0.00335693359375, 0.03403472900390625, 0.0714263916015625, 0.10881805419921875, 0.146209716796875, 0.18360137939453125, 0.2209930419921875, 0.25838470458984375, 0.2957763671875, 0.33316802978515625, 0.3705596923828125, 0.40795135498046875, 0.445343017578125, 0.48273468017578125, 0.5201263427734375, 0.5575180053710938, 0.59490966796875, 0.6323013305664062, 0.6696929931640625, 0.7070846557617188, 0.744476318359375, 0.7818679809570312, 0.8192596435546875, 0.8566513061523438, 0.89404296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 21.0, 53.0, 153.0, 292.0, 302.0, 118.0, 38.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.315021514892578, -14.97471809387207, -14.634413719177246, -14.294110298156738, -13.953805923461914, -13.613502502441406, -13.273199081420898, -12.93289566040039, -12.592591285705566, -12.252287864685059, -11.911983489990234, -11.571680068969727, -11.231376647949219, -10.891072273254395, -10.550768852233887, -10.210464477539062, -9.870161056518555, -9.529857635498047, -9.189553260803223, -8.849249839782715, -8.50894546508789, -8.168642044067383, -7.828338623046875, -7.488034725189209, -7.147730827331543, -6.807426929473877, -6.467123031616211, -6.126819610595703, -5.786515712738037, -5.446211814880371, -5.105908393859863, -4.765604496002197, -4.425299644470215, -4.084995746612549, -3.744692087173462, -3.404388427734375, -3.064084529876709, -2.723780632019043, -2.383476972579956, -2.043173313140869, -1.7028694152832031, -1.3625656366348267, -1.0222618579864502, -0.6819580793380737, -0.34165430068969727, -0.0013505220413208008, 0.33895325660705566, 0.6792569160461426, 1.0195608139038086, 1.359864592552185, 1.7001683712005615, 2.0404720306396484, 2.3807759284973145, 2.7210798263549805, 3.0613834857940674, 3.4016871452331543, 3.7419910430908203, 4.082294940948486, 4.422598838806152, 4.76290225982666, 5.103206157684326, 5.443510055541992, 5.7838134765625, 6.124117374420166, 6.464421272277832]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 12.0, 7.0, 12.0, 14.0, 23.0, 24.0, 40.0, 45.0, 55.0, 66.0, 57.0, 64.0, 65.0, 70.0, 78.0, 65.0, 69.0, 51.0, 47.0, 39.0, 29.0, 18.0, 17.0, 8.0, 10.0, 11.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.167564392089844, -4.048315048217773, -3.929065465927124, -3.8098158836364746, -3.6905665397644043, -3.571316957473755, -3.4520673751831055, -3.332818031311035, -3.2135684490203857, -3.0943188667297363, -2.975069522857666, -2.8558199405670166, -2.7365705966949463, -2.617321014404297, -2.4980716705322266, -2.378822088241577, -2.2595725059509277, -2.1403229236602783, -2.021073579788208, -1.9018239974975586, -1.7825745344161987, -1.6633250713348389, -1.544075608253479, -1.4248261451721191, -1.3055768013000488, -1.186327338218689, -1.067077875137329, -0.9478283524513245, -0.8285788297653198, -0.70932936668396, -0.5900799036026001, -0.47083038091659546, -0.3515808582305908, -0.23233136534690857, -0.11308188736438751, 0.006167590618133545, 0.1254170835018158, 0.24466657638549805, 0.3639160394668579, 0.48316556215286255, 0.6024150252342224, 0.7216644883155823, 0.8409140110015869, 0.9601634740829468, 1.0794129371643066, 1.198662519454956, 1.3179118633270264, 1.4371614456176758, 1.5564109086990356, 1.6756603717803955, 1.7949098348617554, 1.9141592979431152, 2.0334088802337646, 2.152658462524414, 2.2719078063964844, 2.391157388687134, 2.510406732559204, 2.6296563148498535, 2.748905658721924, 2.8681552410125732, 2.9874045848846436, 3.106654167175293, 3.2259035110473633, 3.3451530933380127, 3.464402675628662]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 10.0, 12.0, 14.0, 19.0, 21.0, 45.0, 69.0, 74.0, 139.0, 229.0, 440.0, 1045.0, 3018.0, 13827.0, 101167.0, 693554.0, 204066.0, 23593.0, 4552.0, 1359.0, 583.0, 257.0, 150.0, 98.0, 61.0, 37.0, 27.0, 21.0, 10.0, 13.0, 11.0, 5.0, 9.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.73675537109375, -3.6063232421875, -3.47589111328125, -3.345458984375, -3.21502685546875, -3.0845947265625, -2.95416259765625, -2.82373046875, -2.69329833984375, -2.5628662109375, -2.43243408203125, -2.302001953125, -2.17156982421875, -2.0411376953125, -1.91070556640625, -1.7802734375, -1.64984130859375, -1.5194091796875, -1.38897705078125, -1.258544921875, -1.12811279296875, -0.9976806640625, -0.86724853515625, -0.73681640625, -0.60638427734375, -0.4759521484375, -0.34552001953125, -0.215087890625, -0.08465576171875, 0.0457763671875, 0.17620849609375, 0.306640625, 0.43707275390625, 0.5675048828125, 0.69793701171875, 0.828369140625, 0.95880126953125, 1.0892333984375, 1.21966552734375, 1.35009765625, 1.48052978515625, 1.6109619140625, 1.74139404296875, 1.871826171875, 2.00225830078125, 2.1326904296875, 2.26312255859375, 2.3935546875, 2.52398681640625, 2.6544189453125, 2.78485107421875, 2.915283203125, 3.04571533203125, 3.1761474609375, 3.30657958984375, 3.43701171875, 3.56744384765625, 3.6978759765625, 3.82830810546875, 3.958740234375, 4.08917236328125, 4.2196044921875, 4.35003662109375, 4.48046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 9.0, 13.0, 15.0, 21.0, 29.0, 47.0, 57.0, 43.0, 59.0, 64.0, 86.0, 90.0, 75.0, 64.0, 65.0, 55.0, 45.0, 48.0, 38.0, 26.0, 15.0, 15.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63623046875, -0.612335205078125, -0.58843994140625, -0.564544677734375, -0.5406494140625, -0.516754150390625, -0.49285888671875, -0.468963623046875, -0.445068359375, -0.421173095703125, -0.39727783203125, -0.373382568359375, -0.3494873046875, -0.325592041015625, -0.30169677734375, -0.277801513671875, -0.25390625, -0.230010986328125, -0.20611572265625, -0.182220458984375, -0.1583251953125, -0.134429931640625, -0.11053466796875, -0.086639404296875, -0.062744140625, -0.038848876953125, -0.01495361328125, 0.008941650390625, 0.0328369140625, 0.056732177734375, 0.08062744140625, 0.104522705078125, 0.12841796875, 0.152313232421875, 0.17620849609375, 0.200103759765625, 0.2239990234375, 0.247894287109375, 0.27178955078125, 0.295684814453125, 0.319580078125, 0.343475341796875, 0.36737060546875, 0.391265869140625, 0.4151611328125, 0.439056396484375, 0.46295166015625, 0.486846923828125, 0.5107421875, 0.534637451171875, 0.55853271484375, 0.582427978515625, 0.6063232421875, 0.630218505859375, 0.65411376953125, 0.678009033203125, 0.701904296875, 0.725799560546875, 0.74969482421875, 0.773590087890625, 0.7974853515625, 0.821380615234375, 0.84527587890625, 0.869171142578125, 0.89306640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 8.0, 11.0, 16.0, 26.0, 27.0, 49.0, 63.0, 92.0, 152.0, 180.0, 254.0, 398.0, 609.0, 1185.0, 2263.0, 5428.0, 15050.0, 50282.0, 191536.0, 489770.0, 208764.0, 55177.0, 15908.0, 5697.0, 2425.0, 1180.0, 643.0, 476.0, 264.0, 168.0, 118.0, 99.0, 70.0, 40.0, 31.0, 20.0, 23.0, 12.0, 15.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7626953125, -1.7085113525390625, -1.654327392578125, -1.6001434326171875, -1.54595947265625, -1.4917755126953125, -1.437591552734375, -1.3834075927734375, -1.3292236328125, -1.2750396728515625, -1.220855712890625, -1.1666717529296875, -1.11248779296875, -1.0583038330078125, -1.004119873046875, -0.9499359130859375, -0.895751953125, -0.8415679931640625, -0.787384033203125, -0.7332000732421875, -0.67901611328125, -0.6248321533203125, -0.570648193359375, -0.5164642333984375, -0.4622802734375, -0.4080963134765625, -0.353912353515625, -0.2997283935546875, -0.24554443359375, -0.1913604736328125, -0.137176513671875, -0.0829925537109375, -0.02880859375, 0.0253753662109375, 0.079559326171875, 0.1337432861328125, 0.18792724609375, 0.2421112060546875, 0.296295166015625, 0.3504791259765625, 0.4046630859375, 0.4588470458984375, 0.513031005859375, 0.5672149658203125, 0.62139892578125, 0.6755828857421875, 0.729766845703125, 0.7839508056640625, 0.838134765625, 0.8923187255859375, 0.946502685546875, 1.0006866455078125, 1.05487060546875, 1.1090545654296875, 1.163238525390625, 1.2174224853515625, 1.2716064453125, 1.3257904052734375, 1.379974365234375, 1.4341583251953125, 1.48834228515625, 1.5425262451171875, 1.596710205078125, 1.6508941650390625, 1.705078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 4.0, 7.0, 10.0, 8.0, 9.0, 17.0, 17.0, 20.0, 20.0, 23.0, 31.0, 30.0, 35.0, 37.0, 43.0, 42.0, 33.0, 44.0, 39.0, 38.0, 53.0, 52.0, 41.0, 43.0, 28.0, 38.0, 27.0, 32.0, 22.0, 16.0, 17.0, 15.0, 16.0, 12.0, 13.0, 10.0, 12.0, 4.0, 12.0, 1.0, 7.0, 3.0, 0.0, 4.0, 3.0, 4.0, 1.0, 2.0], "bins": [-2.0234375, -1.96575927734375, -1.9080810546875, -1.85040283203125, -1.792724609375, -1.73504638671875, -1.6773681640625, -1.61968994140625, -1.56201171875, -1.50433349609375, -1.4466552734375, -1.38897705078125, -1.331298828125, -1.27362060546875, -1.2159423828125, -1.15826416015625, -1.1005859375, -1.04290771484375, -0.9852294921875, -0.92755126953125, -0.869873046875, -0.81219482421875, -0.7545166015625, -0.69683837890625, -0.63916015625, -0.58148193359375, -0.5238037109375, -0.46612548828125, -0.408447265625, -0.35076904296875, -0.2930908203125, -0.23541259765625, -0.177734375, -0.12005615234375, -0.0623779296875, -0.00469970703125, 0.052978515625, 0.11065673828125, 0.1683349609375, 0.22601318359375, 0.28369140625, 0.34136962890625, 0.3990478515625, 0.45672607421875, 0.514404296875, 0.57208251953125, 0.6297607421875, 0.68743896484375, 0.7451171875, 0.80279541015625, 0.8604736328125, 0.91815185546875, 0.975830078125, 1.03350830078125, 1.0911865234375, 1.14886474609375, 1.20654296875, 1.26422119140625, 1.3218994140625, 1.37957763671875, 1.437255859375, 1.49493408203125, 1.5526123046875, 1.61029052734375, 1.66796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 1.0, 6.0, 7.0, 12.0, 22.0, 27.0, 36.0, 63.0, 94.0, 152.0, 231.0, 363.0, 670.0, 1082.0, 2130.0, 4162.0, 8898.0, 21212.0, 64778.0, 239945.0, 518957.0, 122732.0, 36823.0, 13573.0, 5977.0, 2898.0, 1484.0, 886.0, 495.0, 290.0, 177.0, 124.0, 78.0, 48.0, 37.0, 20.0, 15.0, 12.0, 11.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7998046875, -0.7733688354492188, -0.7469329833984375, -0.7204971313476562, -0.694061279296875, -0.6676254272460938, -0.6411895751953125, -0.6147537231445312, -0.58831787109375, -0.5618820190429688, -0.5354461669921875, -0.5090103149414062, -0.482574462890625, -0.45613861083984375, -0.4297027587890625, -0.40326690673828125, -0.3768310546875, -0.35039520263671875, -0.3239593505859375, -0.29752349853515625, -0.271087646484375, -0.24465179443359375, -0.2182159423828125, -0.19178009033203125, -0.16534423828125, -0.13890838623046875, -0.1124725341796875, -0.08603668212890625, -0.059600830078125, -0.03316497802734375, -0.0067291259765625, 0.01970672607421875, 0.046142578125, 0.07257843017578125, 0.0990142822265625, 0.12545013427734375, 0.151885986328125, 0.17832183837890625, 0.2047576904296875, 0.23119354248046875, 0.25762939453125, 0.28406524658203125, 0.3105010986328125, 0.33693695068359375, 0.363372802734375, 0.38980865478515625, 0.4162445068359375, 0.44268035888671875, 0.4691162109375, 0.49555206298828125, 0.5219879150390625, 0.5484237670898438, 0.574859619140625, 0.6012954711914062, 0.6277313232421875, 0.6541671752929688, 0.68060302734375, 0.7070388793945312, 0.7334747314453125, 0.7599105834960938, 0.786346435546875, 0.8127822875976562, 0.8392181396484375, 0.8656539916992188, 0.89208984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 2.0, 6.0, 3.0, 11.0, 11.0, 14.0, 24.0, 19.0, 31.0, 27.0, 38.0, 51.0, 85.0, 118.0, 145.0, 97.0, 68.0, 46.0, 39.0, 28.0, 22.0, 18.0, 13.0, 15.0, 13.0, 8.0, 3.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0002770423889160156, -0.00026959553360939026, -0.0002621486783027649, -0.0002547018229961395, -0.00024725496768951416, -0.0002398081123828888, -0.00023236125707626343, -0.00022491440176963806, -0.0002174675464630127, -0.00021002069115638733, -0.00020257383584976196, -0.0001951269805431366, -0.00018768012523651123, -0.00018023326992988586, -0.0001727864146232605, -0.00016533955931663513, -0.00015789270401000977, -0.0001504458487033844, -0.00014299899339675903, -0.00013555213809013367, -0.0001281052827835083, -0.00012065842747688293, -0.00011321157217025757, -0.0001057647168636322, -9.831786155700684e-05, -9.087100625038147e-05, -8.34241509437561e-05, -7.597729563713074e-05, -6.853044033050537e-05, -6.108358502388e-05, -5.363672971725464e-05, -4.618987441062927e-05, -3.8743019104003906e-05, -3.129616379737854e-05, -2.3849308490753174e-05, -1.6402453184127808e-05, -8.955597877502441e-06, -1.5087425708770752e-06, 5.938112735748291e-06, 1.3384968042373657e-05, 2.0831823348999023e-05, 2.827867865562439e-05, 3.5725533962249756e-05, 4.317238926887512e-05, 5.061924457550049e-05, 5.8066099882125854e-05, 6.551295518875122e-05, 7.295981049537659e-05, 8.040666580200195e-05, 8.785352110862732e-05, 9.530037641525269e-05, 0.00010274723172187805, 0.00011019408702850342, 0.00011764094233512878, 0.00012508779764175415, 0.00013253465294837952, 0.00013998150825500488, 0.00014742836356163025, 0.00015487521886825562, 0.00016232207417488098, 0.00016976892948150635, 0.00017721578478813171, 0.00018466264009475708, 0.00019210949540138245, 0.0001995563507080078]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 17.0, 16.0, 44.0, 56.0, 67.0, 157.0, 231.0, 450.0, 836.0, 1994.0, 5935.0, 27045.0, 207505.0, 684245.0, 97942.0, 15111.0, 3832.0, 1501.0, 653.0, 356.0, 212.0, 97.0, 78.0, 45.0, 31.0, 27.0, 20.0, 7.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.23602294921875, -1.1907958984375, -1.14556884765625, -1.100341796875, -1.05511474609375, -1.0098876953125, -0.96466064453125, -0.91943359375, -0.87420654296875, -0.8289794921875, -0.78375244140625, -0.738525390625, -0.69329833984375, -0.6480712890625, -0.60284423828125, -0.5576171875, -0.51239013671875, -0.4671630859375, -0.42193603515625, -0.376708984375, -0.33148193359375, -0.2862548828125, -0.24102783203125, -0.19580078125, -0.15057373046875, -0.1053466796875, -0.06011962890625, -0.014892578125, 0.03033447265625, 0.0755615234375, 0.12078857421875, 0.166015625, 0.21124267578125, 0.2564697265625, 0.30169677734375, 0.346923828125, 0.39215087890625, 0.4373779296875, 0.48260498046875, 0.52783203125, 0.57305908203125, 0.6182861328125, 0.66351318359375, 0.708740234375, 0.75396728515625, 0.7991943359375, 0.84442138671875, 0.8896484375, 0.93487548828125, 0.9801025390625, 1.02532958984375, 1.070556640625, 1.11578369140625, 1.1610107421875, 1.20623779296875, 1.25146484375, 1.29669189453125, 1.3419189453125, 1.38714599609375, 1.432373046875, 1.47760009765625, 1.5228271484375, 1.56805419921875, 1.61328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 6.0, 16.0, 10.0, 26.0, 22.0, 48.0, 63.0, 64.0, 99.0, 119.0, 114.0, 112.0, 93.0, 58.0, 43.0, 28.0, 19.0, 19.0, 12.0, 11.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.6724624633789062, -0.6354522705078125, -0.5984420776367188, -0.561431884765625, -0.5244216918945312, -0.4874114990234375, -0.45040130615234375, -0.41339111328125, -0.37638092041015625, -0.3393707275390625, -0.30236053466796875, -0.265350341796875, -0.22834014892578125, -0.1913299560546875, -0.15431976318359375, -0.1173095703125, -0.08029937744140625, -0.0432891845703125, -0.00627899169921875, 0.030731201171875, 0.06774139404296875, 0.1047515869140625, 0.14176177978515625, 0.17877197265625, 0.21578216552734375, 0.2527923583984375, 0.28980255126953125, 0.326812744140625, 0.36382293701171875, 0.4008331298828125, 0.43784332275390625, 0.474853515625, 0.5118637084960938, 0.5488739013671875, 0.5858840942382812, 0.622894287109375, 0.6599044799804688, 0.6969146728515625, 0.7339248657226562, 0.77093505859375, 0.8079452514648438, 0.8449554443359375, 0.8819656372070312, 0.918975830078125, 0.9559860229492188, 0.9929962158203125, 1.0300064086914062, 1.0670166015625, 1.1040267944335938, 1.1410369873046875, 1.1780471801757812, 1.215057373046875, 1.2520675659179688, 1.2890777587890625, 1.3260879516601562, 1.36309814453125, 1.4001083374023438, 1.4371185302734375, 1.4741287231445312, 1.511138916015625, 1.5481491088867188, 1.5851593017578125, 1.6221694946289062, 1.6591796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 13.0, 29.0, 44.0, 83.0, 105.0, 138.0, 155.0, 112.0, 107.0, 78.0, 46.0, 29.0, 17.0, 14.0, 8.0, 11.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.745893478393555, -16.24556541442871, -15.7452392578125, -15.244912147521973, -14.744585037231445, -14.244256973266602, -13.743929862976074, -13.243602752685547, -12.74327564239502, -12.242948532104492, -11.742621421813965, -11.242294311523438, -10.741966247558594, -10.241640090942383, -9.741312026977539, -9.240984916687012, -8.740657806396484, -8.240330696105957, -7.74000358581543, -7.239675998687744, -6.739348888397217, -6.2390217781066895, -5.738694190979004, -5.238367080688477, -4.738039970397949, -4.237712860107422, -3.7373855113983154, -3.237058162689209, -2.7367310523986816, -2.2364039421081543, -1.7360765933990479, -1.2357492446899414, -0.7354240417480469, -0.23509681224822998, 0.2652304172515869, 0.7655576467514038, 1.2658848762512207, 1.766211986541748, 2.2665393352508545, 2.766866683959961, 3.2671937942504883, 3.7675209045410156, 4.267848014831543, 4.7681756019592285, 5.268502712249756, 5.768829822540283, 6.269157409667969, 6.769484519958496, 7.269811630249023, 7.770138740539551, 8.270465850830078, 8.770792961120605, 9.271120071411133, 9.771448135375977, 10.271775245666504, 10.772102355957031, 11.272429466247559, 11.772756576538086, 12.273083686828613, 12.77341079711914, 13.273738861083984, 13.774065017700195, 14.274393081665039, 14.774720191955566, 15.275047302246094]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 9.0, 8.0, 11.0, 18.0, 11.0, 16.0, 19.0, 17.0, 26.0, 26.0, 30.0, 30.0, 36.0, 50.0, 39.0, 40.0, 36.0, 35.0, 45.0, 50.0, 44.0, 44.0, 43.0, 35.0, 36.0, 37.0, 37.0, 28.0, 19.0, 29.0, 25.0, 11.0, 8.0, 13.0, 7.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.537372589111328, -11.192741394042969, -10.848111152648926, -10.503479957580566, -10.158849716186523, -9.814218521118164, -9.469587326049805, -9.124957084655762, -8.780325889587402, -8.435694694519043, -8.091064453125, -7.746433258056641, -7.4018025398254395, -7.057171821594238, -6.712541103363037, -6.367910385131836, -6.023279666900635, -5.678648948669434, -5.334018230438232, -4.989387512207031, -4.644756317138672, -4.300125598907471, -3.9554948806762695, -3.6108639240264893, -3.266233205795288, -2.921602487564087, -2.5769715309143066, -2.2323408126831055, -1.8877099752426147, -1.543079137802124, -1.1984484195709229, -0.8538174629211426, -0.5091867446899414, -0.16455593705177307, 0.18007487058639526, 0.5247056484222412, 0.8693364858627319, 1.2139673233032227, 1.5585980415344238, 1.903228998184204, 2.2478597164154053, 2.5924904346466064, 2.9371213912963867, 3.281752109527588, 3.626382827758789, 3.9710137844085693, 4.315644264221191, 4.660275459289551, 5.004906177520752, 5.349536895751953, 5.694167613983154, 6.0387983322143555, 6.383429527282715, 6.728060245513916, 7.072690963745117, 7.417322158813477, 7.7619524002075195, 8.106583595275879, 8.451213836669922, 8.795845031738281, 9.140475273132324, 9.485106468200684, 9.829736709594727, 10.174367904663086, 10.518999099731445]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 9.0, 18.0, 34.0, 66.0, 141.0, 282.0, 974.0, 5558.0, 3311044.0, 869922.0, 4643.0, 911.0, 307.0, 146.0, 89.0, 38.0, 26.0, 23.0, 15.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.38519287109375, -6.0946044921875, -5.80401611328125, -5.513427734375, -5.22283935546875, -4.9322509765625, -4.64166259765625, -4.35107421875, -4.06048583984375, -3.7698974609375, -3.47930908203125, -3.188720703125, -2.89813232421875, -2.6075439453125, -2.31695556640625, -2.0263671875, -1.73577880859375, -1.4451904296875, -1.15460205078125, -0.864013671875, -0.57342529296875, -0.2828369140625, 0.00775146484375, 0.29833984375, 0.58892822265625, 0.8795166015625, 1.17010498046875, 1.460693359375, 1.75128173828125, 2.0418701171875, 2.33245849609375, 2.623046875, 2.91363525390625, 3.2042236328125, 3.49481201171875, 3.785400390625, 4.07598876953125, 4.3665771484375, 4.65716552734375, 4.94775390625, 5.23834228515625, 5.5289306640625, 5.81951904296875, 6.110107421875, 6.40069580078125, 6.6912841796875, 6.98187255859375, 7.2724609375, 7.56304931640625, 7.8536376953125, 8.14422607421875, 8.434814453125, 8.72540283203125, 9.0159912109375, 9.30657958984375, 9.59716796875, 9.88775634765625, 10.1783447265625, 10.46893310546875, 10.759521484375, 11.05010986328125, 11.3406982421875, 11.63128662109375, 11.921875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 11.0, 6.0, 20.0, 26.0, 28.0, 35.0, 41.0, 49.0, 53.0, 55.0, 75.0, 75.0, 73.0, 63.0, 72.0, 53.0, 42.0, 41.0, 44.0, 31.0, 28.0, 19.0, 15.0, 5.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.5566787719726562, -0.5337677001953125, -0.5108566284179688, -0.487945556640625, -0.46503448486328125, -0.4421234130859375, -0.41921234130859375, -0.39630126953125, -0.37339019775390625, -0.3504791259765625, -0.32756805419921875, -0.304656982421875, -0.28174591064453125, -0.2588348388671875, -0.23592376708984375, -0.2130126953125, -0.19010162353515625, -0.1671905517578125, -0.14427947998046875, -0.121368408203125, -0.09845733642578125, -0.0755462646484375, -0.05263519287109375, -0.02972412109375, -0.00681304931640625, 0.0160980224609375, 0.03900909423828125, 0.061920166015625, 0.08483123779296875, 0.1077423095703125, 0.13065338134765625, 0.153564453125, 0.17647552490234375, 0.1993865966796875, 0.22229766845703125, 0.245208740234375, 0.26811981201171875, 0.2910308837890625, 0.31394195556640625, 0.33685302734375, 0.35976409912109375, 0.3826751708984375, 0.40558624267578125, 0.428497314453125, 0.45140838623046875, 0.4743194580078125, 0.49723052978515625, 0.5201416015625, 0.5430526733398438, 0.5659637451171875, 0.5888748168945312, 0.611785888671875, 0.6346969604492188, 0.6576080322265625, 0.6805191040039062, 0.70343017578125, 0.7263412475585938, 0.7492523193359375, 0.7721633911132812, 0.795074462890625, 0.8179855346679688, 0.8408966064453125, 0.8638076782226562, 0.88671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 11.0, 20.0, 19.0, 25.0, 38.0, 60.0, 91.0, 96.0, 184.0, 280.0, 450.0, 741.0, 1345.0, 2651.0, 6770.0, 28919.0, 2943987.0, 1172214.0, 24371.0, 6309.0, 2530.0, 1242.0, 685.0, 424.0, 256.0, 163.0, 124.0, 72.0, 63.0, 47.0, 25.0, 17.0, 10.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.8211669921875, -3.689208984375, -3.5572509765625, -3.42529296875, -3.2933349609375, -3.161376953125, -3.0294189453125, -2.8974609375, -2.7655029296875, -2.633544921875, -2.5015869140625, -2.36962890625, -2.2376708984375, -2.105712890625, -1.9737548828125, -1.841796875, -1.7098388671875, -1.577880859375, -1.4459228515625, -1.31396484375, -1.1820068359375, -1.050048828125, -0.9180908203125, -0.7861328125, -0.6541748046875, -0.522216796875, -0.3902587890625, -0.25830078125, -0.1263427734375, 0.005615234375, 0.1375732421875, 0.26953125, 0.4014892578125, 0.533447265625, 0.6654052734375, 0.79736328125, 0.9293212890625, 1.061279296875, 1.1932373046875, 1.3251953125, 1.4571533203125, 1.589111328125, 1.7210693359375, 1.85302734375, 1.9849853515625, 2.116943359375, 2.2489013671875, 2.380859375, 2.5128173828125, 2.644775390625, 2.7767333984375, 2.90869140625, 3.0406494140625, 3.172607421875, 3.3045654296875, 3.4365234375, 3.5684814453125, 3.700439453125, 3.8323974609375, 3.96435546875, 4.0963134765625, 4.228271484375, 4.3602294921875, 4.4921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 16.0, 25.0, 39.0, 53.0, 141.0, 509.0, 2398.0, 584.0, 160.0, 55.0, 25.0, 15.0, 13.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.703125, -1.6491546630859375, -1.595184326171875, -1.5412139892578125, -1.48724365234375, -1.4332733154296875, -1.379302978515625, -1.3253326416015625, -1.2713623046875, -1.2173919677734375, -1.163421630859375, -1.1094512939453125, -1.05548095703125, -1.0015106201171875, -0.947540283203125, -0.8935699462890625, -0.839599609375, -0.7856292724609375, -0.731658935546875, -0.6776885986328125, -0.62371826171875, -0.5697479248046875, -0.515777587890625, -0.4618072509765625, -0.4078369140625, -0.3538665771484375, -0.299896240234375, -0.2459259033203125, -0.19195556640625, -0.1379852294921875, -0.084014892578125, -0.0300445556640625, 0.02392578125, 0.0778961181640625, 0.131866455078125, 0.1858367919921875, 0.23980712890625, 0.2937774658203125, 0.347747802734375, 0.4017181396484375, 0.4556884765625, 0.5096588134765625, 0.563629150390625, 0.6175994873046875, 0.67156982421875, 0.7255401611328125, 0.779510498046875, 0.8334808349609375, 0.887451171875, 0.9414215087890625, 0.995391845703125, 1.0493621826171875, 1.10333251953125, 1.1573028564453125, 1.211273193359375, 1.2652435302734375, 1.3192138671875, 1.3731842041015625, 1.427154541015625, 1.4811248779296875, 1.53509521484375, 1.5890655517578125, 1.643035888671875, 1.6970062255859375, 1.7509765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 39.0, 173.0, 434.0, 252.0, 62.0, 22.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.91795539855957, -28.240795135498047, -27.563636779785156, -26.886476516723633, -26.20931625366211, -25.532155990600586, -24.854995727539062, -24.177837371826172, -23.50067710876465, -22.823516845703125, -22.146358489990234, -21.46919822692871, -20.792037963867188, -20.114877700805664, -19.43771743774414, -18.76055908203125, -18.083398818969727, -17.406238555908203, -16.729080200195312, -16.05191993713379, -15.374759674072266, -14.697599411010742, -14.020440101623535, -13.343280792236328, -12.666120529174805, -11.988960266113281, -11.311800956726074, -10.634641647338867, -9.957481384277344, -9.28032112121582, -8.603161811828613, -7.926002025604248, -7.248844146728516, -6.57168436050415, -5.894524574279785, -5.21736478805542, -4.540205001831055, -3.8630452156066895, -3.185885429382324, -2.508725643157959, -1.8315658569335938, -1.1544060707092285, -0.4772462844848633, 0.19991350173950195, 0.8770732879638672, 1.5542330741882324, 2.2313928604125977, 2.908552646636963, 3.585712432861328, 4.262872219085693, 4.940032005310059, 5.617191791534424, 6.294351577758789, 6.971511363983154, 7.6486711502075195, 8.325830459594727, 9.00299072265625, 9.680150985717773, 10.35731029510498, 11.034469604492188, 11.711629867553711, 12.388790130615234, 13.065949440002441, 13.743108749389648, 14.420269012451172]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 17.0, 19.0, 36.0, 31.0, 47.0, 54.0, 67.0, 63.0, 71.0, 70.0, 57.0, 65.0, 62.0, 61.0, 52.0, 46.0, 38.0, 27.0, 30.0, 15.0, 16.0, 11.0, 11.0, 6.0, 6.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.689672470092773, -5.532442092895508, -5.375211238861084, -5.217980861663818, -5.060750484466553, -4.903519630432129, -4.746289253234863, -4.589058876037598, -4.431828498840332, -4.274598121643066, -4.117367267608643, -3.960136890411377, -3.8029065132141113, -3.6456758975982666, -3.488445281982422, -3.3312149047851562, -3.1739840507507324, -3.0167534351348877, -2.859523057937622, -2.7022924423217773, -2.5450620651245117, -2.387831449508667, -2.2306008338928223, -2.0733704566955566, -1.916139841079712, -1.7589093446731567, -1.6016788482666016, -1.4444482326507568, -1.2872177362442017, -1.1299872398376465, -0.9727566838264465, -0.8155261278152466, -0.6582956314086914, -0.5010651350021362, -0.3438345789909363, -0.18660405278205872, -0.029373526573181152, 0.12785696983337402, 0.285087525844574, 0.4423180818557739, 0.5995485782623291, 0.7567790746688843, 0.9140096306800842, 1.0712401866912842, 1.2284706830978394, 1.3857011795043945, 1.5429317951202393, 1.7001622915267944, 1.8573927879333496, 2.0146234035491943, 2.17185378074646, 2.3290843963623047, 2.4863147735595703, 2.643545389175415, 2.8007760047912598, 2.9580063819885254, 3.11523699760437, 3.272467613220215, 3.4296979904174805, 3.586928606033325, 3.74415922164917, 3.9013895988464355, 4.058619976043701, 4.215850830078125, 4.373081207275391]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 4.0, 9.0, 14.0, 21.0, 19.0, 33.0, 35.0, 73.0, 103.0, 164.0, 314.0, 632.0, 1691.0, 5132.0, 22804.0, 161861.0, 634994.0, 186065.0, 25663.0, 5532.0, 1820.0, 716.0, 330.0, 185.0, 91.0, 75.0, 51.0, 28.0, 23.0, 14.0, 14.0, 8.0, 10.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.511932373046875, -3.39691162109375, -3.281890869140625, -3.1668701171875, -3.051849365234375, -2.93682861328125, -2.821807861328125, -2.706787109375, -2.591766357421875, -2.47674560546875, -2.361724853515625, -2.2467041015625, -2.131683349609375, -2.01666259765625, -1.901641845703125, -1.78662109375, -1.671600341796875, -1.55657958984375, -1.441558837890625, -1.3265380859375, -1.211517333984375, -1.09649658203125, -0.981475830078125, -0.866455078125, -0.751434326171875, -0.63641357421875, -0.521392822265625, -0.4063720703125, -0.291351318359375, -0.17633056640625, -0.061309814453125, 0.0537109375, 0.168731689453125, 0.28375244140625, 0.398773193359375, 0.5137939453125, 0.628814697265625, 0.74383544921875, 0.858856201171875, 0.973876953125, 1.088897705078125, 1.20391845703125, 1.318939208984375, 1.4339599609375, 1.548980712890625, 1.66400146484375, 1.779022216796875, 1.89404296875, 2.009063720703125, 2.12408447265625, 2.239105224609375, 2.3541259765625, 2.469146728515625, 2.58416748046875, 2.699188232421875, 2.814208984375, 2.929229736328125, 3.04425048828125, 3.159271240234375, 3.2742919921875, 3.389312744140625, 3.50433349609375, 3.619354248046875, 3.734375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 14.0, 15.0, 21.0, 30.0, 31.0, 43.0, 59.0, 58.0, 56.0, 82.0, 68.0, 79.0, 68.0, 69.0, 57.0, 57.0, 38.0, 35.0, 31.0, 26.0, 14.0, 9.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.654296875, -0.629241943359375, -0.60418701171875, -0.579132080078125, -0.5540771484375, -0.529022216796875, -0.50396728515625, -0.478912353515625, -0.453857421875, -0.428802490234375, -0.40374755859375, -0.378692626953125, -0.3536376953125, -0.328582763671875, -0.30352783203125, -0.278472900390625, -0.25341796875, -0.228363037109375, -0.20330810546875, -0.178253173828125, -0.1531982421875, -0.128143310546875, -0.10308837890625, -0.078033447265625, -0.052978515625, -0.027923583984375, -0.00286865234375, 0.022186279296875, 0.0472412109375, 0.072296142578125, 0.09735107421875, 0.122406005859375, 0.1474609375, 0.172515869140625, 0.19757080078125, 0.222625732421875, 0.2476806640625, 0.272735595703125, 0.29779052734375, 0.322845458984375, 0.347900390625, 0.372955322265625, 0.39801025390625, 0.423065185546875, 0.4481201171875, 0.473175048828125, 0.49822998046875, 0.523284912109375, 0.54833984375, 0.573394775390625, 0.59844970703125, 0.623504638671875, 0.6485595703125, 0.673614501953125, 0.69866943359375, 0.723724365234375, 0.748779296875, 0.773834228515625, 0.79888916015625, 0.823944091796875, 0.8489990234375, 0.874053955078125, 0.89910888671875, 0.924163818359375, 0.94921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 9.0, 4.0, 18.0, 12.0, 29.0, 18.0, 34.0, 47.0, 60.0, 112.0, 144.0, 170.0, 262.0, 401.0, 593.0, 988.0, 1855.0, 4132.0, 10388.0, 32786.0, 128884.0, 443370.0, 311336.0, 77124.0, 21332.0, 7302.0, 3143.0, 1465.0, 835.0, 491.0, 339.0, 233.0, 196.0, 132.0, 89.0, 67.0, 42.0, 33.0, 20.0, 13.0, 10.0, 10.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.296875, -2.2309112548828125, -2.164947509765625, -2.0989837646484375, -2.03302001953125, -1.9670562744140625, -1.901092529296875, -1.8351287841796875, -1.7691650390625, -1.7032012939453125, -1.637237548828125, -1.5712738037109375, -1.50531005859375, -1.4393463134765625, -1.373382568359375, -1.3074188232421875, -1.241455078125, -1.1754913330078125, -1.109527587890625, -1.0435638427734375, -0.97760009765625, -0.9116363525390625, -0.845672607421875, -0.7797088623046875, -0.7137451171875, -0.6477813720703125, -0.581817626953125, -0.5158538818359375, -0.44989013671875, -0.3839263916015625, -0.317962646484375, -0.2519989013671875, -0.18603515625, -0.1200714111328125, -0.054107666015625, 0.0118560791015625, 0.07781982421875, 0.1437835693359375, 0.209747314453125, 0.2757110595703125, 0.3416748046875, 0.4076385498046875, 0.473602294921875, 0.5395660400390625, 0.60552978515625, 0.6714935302734375, 0.737457275390625, 0.8034210205078125, 0.869384765625, 0.9353485107421875, 1.001312255859375, 1.0672760009765625, 1.13323974609375, 1.1992034912109375, 1.265167236328125, 1.3311309814453125, 1.3970947265625, 1.4630584716796875, 1.529022216796875, 1.5949859619140625, 1.66094970703125, 1.7269134521484375, 1.792877197265625, 1.8588409423828125, 1.9248046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 5.0, 15.0, 17.0, 9.0, 22.0, 22.0, 25.0, 30.0, 23.0, 34.0, 41.0, 45.0, 51.0, 39.0, 42.0, 56.0, 56.0, 42.0, 38.0, 43.0, 41.0, 40.0, 33.0, 37.0, 29.0, 20.0, 20.0, 18.0, 11.0, 23.0, 16.0, 4.0, 9.0, 4.0, 5.0, 10.0, 5.0, 3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.65625, -2.57373046875, -2.4912109375, -2.40869140625, -2.326171875, -2.24365234375, -2.1611328125, -2.07861328125, -1.99609375, -1.91357421875, -1.8310546875, -1.74853515625, -1.666015625, -1.58349609375, -1.5009765625, -1.41845703125, -1.3359375, -1.25341796875, -1.1708984375, -1.08837890625, -1.005859375, -0.92333984375, -0.8408203125, -0.75830078125, -0.67578125, -0.59326171875, -0.5107421875, -0.42822265625, -0.345703125, -0.26318359375, -0.1806640625, -0.09814453125, -0.015625, 0.06689453125, 0.1494140625, 0.23193359375, 0.314453125, 0.39697265625, 0.4794921875, 0.56201171875, 0.64453125, 0.72705078125, 0.8095703125, 0.89208984375, 0.974609375, 1.05712890625, 1.1396484375, 1.22216796875, 1.3046875, 1.38720703125, 1.4697265625, 1.55224609375, 1.634765625, 1.71728515625, 1.7998046875, 1.88232421875, 1.96484375, 2.04736328125, 2.1298828125, 2.21240234375, 2.294921875, 2.37744140625, 2.4599609375, 2.54248046875, 2.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 2.0, 8.0, 16.0, 15.0, 42.0, 86.0, 128.0, 273.0, 543.0, 1346.0, 3514.0, 10765.0, 40547.0, 188173.0, 529474.0, 210125.0, 45427.0, 11710.0, 3745.0, 1481.0, 571.0, 246.0, 140.0, 75.0, 37.0, 21.0, 12.0, 9.0, 9.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0625, -1.02880859375, -0.9951171875, -0.96142578125, -0.927734375, -0.89404296875, -0.8603515625, -0.82666015625, -0.79296875, -0.75927734375, -0.7255859375, -0.69189453125, -0.658203125, -0.62451171875, -0.5908203125, -0.55712890625, -0.5234375, -0.48974609375, -0.4560546875, -0.42236328125, -0.388671875, -0.35498046875, -0.3212890625, -0.28759765625, -0.25390625, -0.22021484375, -0.1865234375, -0.15283203125, -0.119140625, -0.08544921875, -0.0517578125, -0.01806640625, 0.015625, 0.04931640625, 0.0830078125, 0.11669921875, 0.150390625, 0.18408203125, 0.2177734375, 0.25146484375, 0.28515625, 0.31884765625, 0.3525390625, 0.38623046875, 0.419921875, 0.45361328125, 0.4873046875, 0.52099609375, 0.5546875, 0.58837890625, 0.6220703125, 0.65576171875, 0.689453125, 0.72314453125, 0.7568359375, 0.79052734375, 0.82421875, 0.85791015625, 0.8916015625, 0.92529296875, 0.958984375, 0.99267578125, 1.0263671875, 1.06005859375, 1.09375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 12.0, 12.0, 24.0, 41.0, 66.0, 71.0, 136.0, 148.0, 137.0, 107.0, 78.0, 43.0, 33.0, 31.0, 11.0, 15.0, 4.0, 5.0, 5.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004012584686279297, -0.0003890208899974823, -0.0003767833113670349, -0.0003645457327365875, -0.00035230815410614014, -0.00034007057547569275, -0.00032783299684524536, -0.000315595418214798, -0.0003033578395843506, -0.0002911202609539032, -0.0002788826823234558, -0.0002666451036930084, -0.00025440752506256104, -0.00024216994643211365, -0.00022993236780166626, -0.00021769478917121887, -0.00020545721054077148, -0.0001932196319103241, -0.0001809820532798767, -0.00016874447464942932, -0.00015650689601898193, -0.00014426931738853455, -0.00013203173875808716, -0.00011979416012763977, -0.00010755658149719238, -9.5319002866745e-05, -8.308142423629761e-05, -7.084384560585022e-05, -5.860626697540283e-05, -4.6368688344955444e-05, -3.413110971450806e-05, -2.189353108406067e-05, -9.655952453613281e-06, 2.5816261768341064e-06, 1.4819204807281494e-05, 2.7056783437728882e-05, 3.929436206817627e-05, 5.153194069862366e-05, 6.376951932907104e-05, 7.600709795951843e-05, 8.824467658996582e-05, 0.00010048225522041321, 0.0001127198338508606, 0.00012495741248130798, 0.00013719499111175537, 0.00014943256974220276, 0.00016167014837265015, 0.00017390772700309753, 0.00018614530563354492, 0.0001983828842639923, 0.0002106204628944397, 0.00022285804152488708, 0.00023509562015533447, 0.00024733319878578186, 0.00025957077741622925, 0.00027180835604667664, 0.000284045934677124, 0.0002962835133075714, 0.0003085210919380188, 0.0003207586705684662, 0.0003329962491989136, 0.00034523382782936096, 0.00035747140645980835, 0.00036970898509025574, 0.0003819465637207031]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 25.0, 29.0, 55.0, 73.0, 133.0, 248.0, 427.0, 926.0, 2301.0, 7471.0, 40485.0, 314128.0, 570524.0, 91726.0, 13816.0, 3462.0, 1296.0, 621.0, 286.0, 185.0, 132.0, 58.0, 42.0, 24.0, 15.0, 11.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.732421875, -1.68707275390625, -1.6417236328125, -1.59637451171875, -1.551025390625, -1.50567626953125, -1.4603271484375, -1.41497802734375, -1.36962890625, -1.32427978515625, -1.2789306640625, -1.23358154296875, -1.188232421875, -1.14288330078125, -1.0975341796875, -1.05218505859375, -1.0068359375, -0.96148681640625, -0.9161376953125, -0.87078857421875, -0.825439453125, -0.78009033203125, -0.7347412109375, -0.68939208984375, -0.64404296875, -0.59869384765625, -0.5533447265625, -0.50799560546875, -0.462646484375, -0.41729736328125, -0.3719482421875, -0.32659912109375, -0.28125, -0.23590087890625, -0.1905517578125, -0.14520263671875, -0.099853515625, -0.05450439453125, -0.0091552734375, 0.03619384765625, 0.08154296875, 0.12689208984375, 0.1722412109375, 0.21759033203125, 0.262939453125, 0.30828857421875, 0.3536376953125, 0.39898681640625, 0.4443359375, 0.48968505859375, 0.5350341796875, 0.58038330078125, 0.625732421875, 0.67108154296875, 0.7164306640625, 0.76177978515625, 0.80712890625, 0.85247802734375, 0.8978271484375, 0.94317626953125, 0.988525390625, 1.03387451171875, 1.0792236328125, 1.12457275390625, 1.169921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 11.0, 3.0, 9.0, 13.0, 18.0, 27.0, 26.0, 29.0, 37.0, 49.0, 58.0, 62.0, 77.0, 65.0, 81.0, 78.0, 81.0, 73.0, 38.0, 44.0, 36.0, 23.0, 15.0, 14.0, 10.0, 11.0, 6.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.6953964233398438, -0.6666717529296875, -0.6379470825195312, -0.609222412109375, -0.5804977416992188, -0.5517730712890625, -0.5230484008789062, -0.49432373046875, -0.46559906005859375, -0.4368743896484375, -0.40814971923828125, -0.379425048828125, -0.35070037841796875, -0.3219757080078125, -0.29325103759765625, -0.2645263671875, -0.23580169677734375, -0.2070770263671875, -0.17835235595703125, -0.149627685546875, -0.12090301513671875, -0.0921783447265625, -0.06345367431640625, -0.03472900390625, -0.00600433349609375, 0.0227203369140625, 0.05144500732421875, 0.080169677734375, 0.10889434814453125, 0.1376190185546875, 0.16634368896484375, 0.195068359375, 0.22379302978515625, 0.2525177001953125, 0.28124237060546875, 0.309967041015625, 0.33869171142578125, 0.3674163818359375, 0.39614105224609375, 0.42486572265625, 0.45359039306640625, 0.4823150634765625, 0.5110397338867188, 0.539764404296875, 0.5684890747070312, 0.5972137451171875, 0.6259384155273438, 0.6546630859375, 0.6833877563476562, 0.7121124267578125, 0.7408370971679688, 0.769561767578125, 0.7982864379882812, 0.8270111083984375, 0.8557357788085938, 0.88446044921875, 0.9131851196289062, 0.9419097900390625, 0.9706344604492188, 0.999359130859375, 1.0280838012695312, 1.0568084716796875, 1.0855331420898438, 1.1142578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 9.0, 36.0, 81.0, 201.0, 287.0, 213.0, 102.0, 44.0, 17.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.44586181640625, -25.375865936279297, -24.30586814880371, -23.235872268676758, -22.165874481201172, -21.09587860107422, -20.025882720947266, -18.95588493347168, -17.885887145996094, -16.81589126586914, -15.745893478393555, -14.675897598266602, -13.605899810791016, -12.535903930664062, -11.465907096862793, -10.395910263061523, -9.32591438293457, -8.2559175491333, -7.185920715332031, -6.11592435836792, -5.04592752456665, -3.975930690765381, -2.9059343338012695, -1.8359375, -0.7659406661987305, 0.3040560483932495, 1.3740527629852295, 2.44404935836792, 3.5140461921691895, 4.584043025970459, 5.65403938293457, 6.72403621673584, 7.794033050537109, 8.864029884338379, 9.934026718139648, 11.004022598266602, 12.074020385742188, 13.14401626586914, 14.21401309967041, 15.28400993347168, 16.354007720947266, 17.42400360107422, 18.494001388549805, 19.563997268676758, 20.633995056152344, 21.703990936279297, 22.77398681640625, 23.843984603881836, 24.91398048400879, 25.983976364135742, 27.053974151611328, 28.12397003173828, 29.193967819213867, 30.26396369934082, 31.333961486816406, 32.40395736694336, 33.47395324707031, 34.543949127197266, 35.61394500732422, 36.68394470214844, 37.75394058227539, 38.823936462402344, 39.8939323425293, 40.96392822265625, 42.03392791748047]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 9.0, 5.0, 2.0, 3.0, 3.0, 7.0, 11.0, 19.0, 13.0, 19.0, 16.0, 12.0, 15.0, 24.0, 30.0, 29.0, 24.0, 31.0, 35.0, 42.0, 39.0, 28.0, 38.0, 38.0, 41.0, 43.0, 32.0, 37.0, 45.0, 35.0, 34.0, 30.0, 37.0, 24.0, 29.0, 9.0, 25.0, 15.0, 7.0, 18.0, 9.0, 8.0, 7.0, 6.0, 3.0, 8.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-10.763351440429688, -10.42521858215332, -10.087085723876953, -9.74895191192627, -9.410819053649902, -9.072686195373535, -8.734553337097168, -8.396419525146484, -8.058286666870117, -7.72015380859375, -7.382020473480225, -7.043887615203857, -6.705754280090332, -6.367621421813965, -6.029488563537598, -5.691355228424072, -5.353222370147705, -5.015089511871338, -4.6769561767578125, -4.338823318481445, -4.00068998336792, -3.6625571250915527, -3.3244240283966064, -2.98629093170166, -2.648157835006714, -2.3100247383117676, -1.9718916416168213, -1.6337586641311646, -1.2956255674362183, -0.957492470741272, -0.6193594932556152, -0.28122639656066895, 0.056906700134277344, 0.39503976702690125, 0.7331728339195251, 1.0713058710098267, 1.409438967704773, 1.7475720643997192, 2.085705041885376, 2.4238381385803223, 2.7619712352752686, 3.100104331970215, 3.438237428665161, 3.7763705253601074, 4.114503383636475, 4.45263671875, 4.790769577026367, 5.128902435302734, 5.46703577041626, 5.805168628692627, 6.143301963806152, 6.4814348220825195, 6.819568157196045, 7.157701015472412, 7.4958343505859375, 7.833967208862305, 8.172100067138672, 8.510232925415039, 8.848365783691406, 9.18649959564209, 9.524632453918457, 9.862765312194824, 10.200898170471191, 10.539031982421875, 10.877164840698242]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 10.0, 18.0, 34.0, 48.0, 112.0, 266.0, 1045.0, 4178918.0, 12917.0, 583.0, 166.0, 73.0, 40.0, 21.0, 12.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -15.8369140625, -15.111328125, -14.3857421875, -13.66015625, -12.9345703125, -12.208984375, -11.4833984375, -10.7578125, -10.0322265625, -9.306640625, -8.5810546875, -7.85546875, -7.1298828125, -6.404296875, -5.6787109375, -4.953125, -4.2275390625, -3.501953125, -2.7763671875, -2.05078125, -1.3251953125, -0.599609375, 0.1259765625, 0.8515625, 1.5771484375, 2.302734375, 3.0283203125, 3.75390625, 4.4794921875, 5.205078125, 5.9306640625, 6.65625, 7.3818359375, 8.107421875, 8.8330078125, 9.55859375, 10.2841796875, 11.009765625, 11.7353515625, 12.4609375, 13.1865234375, 13.912109375, 14.6376953125, 15.36328125, 16.0888671875, 16.814453125, 17.5400390625, 18.265625, 18.9912109375, 19.716796875, 20.4423828125, 21.16796875, 21.8935546875, 22.619140625, 23.3447265625, 24.0703125, 24.7958984375, 25.521484375, 26.2470703125, 26.97265625, 27.6982421875, 28.423828125, 29.1494140625, 29.875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 15.0, 16.0, 15.0, 23.0, 20.0, 32.0, 38.0, 45.0, 49.0, 48.0, 53.0, 53.0, 71.0, 66.0, 58.0, 59.0, 52.0, 47.0, 46.0, 35.0, 28.0, 28.0, 20.0, 21.0, 12.0, 7.0, 12.0, 12.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.626953125, -0.602142333984375, -0.57733154296875, -0.552520751953125, -0.5277099609375, -0.502899169921875, -0.47808837890625, -0.453277587890625, -0.428466796875, -0.403656005859375, -0.37884521484375, -0.354034423828125, -0.3292236328125, -0.304412841796875, -0.27960205078125, -0.254791259765625, -0.22998046875, -0.205169677734375, -0.18035888671875, -0.155548095703125, -0.1307373046875, -0.105926513671875, -0.08111572265625, -0.056304931640625, -0.031494140625, -0.006683349609375, 0.01812744140625, 0.042938232421875, 0.0677490234375, 0.092559814453125, 0.11737060546875, 0.142181396484375, 0.1669921875, 0.191802978515625, 0.21661376953125, 0.241424560546875, 0.2662353515625, 0.291046142578125, 0.31585693359375, 0.340667724609375, 0.365478515625, 0.390289306640625, 0.41510009765625, 0.439910888671875, 0.4647216796875, 0.489532470703125, 0.51434326171875, 0.539154052734375, 0.56396484375, 0.588775634765625, 0.61358642578125, 0.638397216796875, 0.6632080078125, 0.688018798828125, 0.71282958984375, 0.737640380859375, 0.762451171875, 0.787261962890625, 0.81207275390625, 0.836883544921875, 0.8616943359375, 0.886505126953125, 0.91131591796875, 0.936126708984375, 0.9609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 8.0, 3.0, 12.0, 16.0, 21.0, 22.0, 27.0, 34.0, 33.0, 61.0, 75.0, 95.0, 168.0, 175.0, 240.0, 343.0, 587.0, 1261.0, 4378.0, 38392.0, 4060103.0, 78377.0, 6188.0, 1513.0, 699.0, 375.0, 284.0, 189.0, 142.0, 106.0, 73.0, 59.0, 51.0, 43.0, 31.0, 19.0, 19.0, 13.0, 8.0, 14.0, 6.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.994140625, -3.875274658203125, -3.75640869140625, -3.637542724609375, -3.5186767578125, -3.399810791015625, -3.28094482421875, -3.162078857421875, -3.043212890625, -2.924346923828125, -2.80548095703125, -2.686614990234375, -2.5677490234375, -2.448883056640625, -2.33001708984375, -2.211151123046875, -2.09228515625, -1.973419189453125, -1.85455322265625, -1.735687255859375, -1.6168212890625, -1.497955322265625, -1.37908935546875, -1.260223388671875, -1.141357421875, -1.022491455078125, -0.90362548828125, -0.784759521484375, -0.6658935546875, -0.547027587890625, -0.42816162109375, -0.309295654296875, -0.1904296875, -0.071563720703125, 0.04730224609375, 0.166168212890625, 0.2850341796875, 0.403900146484375, 0.52276611328125, 0.641632080078125, 0.760498046875, 0.879364013671875, 0.99822998046875, 1.117095947265625, 1.2359619140625, 1.354827880859375, 1.47369384765625, 1.592559814453125, 1.71142578125, 1.830291748046875, 1.94915771484375, 2.068023681640625, 2.1868896484375, 2.305755615234375, 2.42462158203125, 2.543487548828125, 2.662353515625, 2.781219482421875, 2.90008544921875, 3.018951416015625, 3.1378173828125, 3.256683349609375, 3.37554931640625, 3.494415283203125, 3.61328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 9.0, 20.0, 39.0, 98.0, 701.0, 2978.0, 147.0, 41.0, 18.0, 8.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0658798217773438, -1.0399627685546875, -1.0140457153320312, -0.988128662109375, -0.9622116088867188, -0.9362945556640625, -0.9103775024414062, -0.88446044921875, -0.8585433959960938, -0.8326263427734375, -0.8067092895507812, -0.780792236328125, -0.7548751831054688, -0.7289581298828125, -0.7030410766601562, -0.6771240234375, -0.6512069702148438, -0.6252899169921875, -0.5993728637695312, -0.573455810546875, -0.5475387573242188, -0.5216217041015625, -0.49570465087890625, -0.46978759765625, -0.44387054443359375, -0.4179534912109375, -0.39203643798828125, -0.366119384765625, -0.34020233154296875, -0.3142852783203125, -0.28836822509765625, -0.262451171875, -0.23653411865234375, -0.2106170654296875, -0.18470001220703125, -0.158782958984375, -0.13286590576171875, -0.1069488525390625, -0.08103179931640625, -0.05511474609375, -0.02919769287109375, -0.0032806396484375, 0.02263641357421875, 0.048553466796875, 0.07447052001953125, 0.1003875732421875, 0.12630462646484375, 0.1522216796875, 0.17813873291015625, 0.2040557861328125, 0.22997283935546875, 0.255889892578125, 0.28180694580078125, 0.3077239990234375, 0.33364105224609375, 0.35955810546875, 0.38547515869140625, 0.4113922119140625, 0.43730926513671875, 0.463226318359375, 0.48914337158203125, 0.5150604248046875, 0.5409774780273438, 0.56689453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 6.0, 6.0, 10.0, 19.0, 39.0, 76.0, 95.0, 160.0, 146.0, 153.0, 106.0, 74.0, 41.0, 27.0, 13.0, 12.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.014194488525391, -3.932225227355957, -3.8502559661865234, -3.768286943435669, -3.6863176822662354, -3.6043484210968018, -3.522379159927368, -3.4404101371765137, -3.35844087600708, -3.2764716148376465, -3.194502353668213, -3.1125333309173584, -3.030564069747925, -2.948594808578491, -2.8666255474090576, -2.784656524658203, -2.7026872634887695, -2.620718002319336, -2.5387487411499023, -2.456779718399048, -2.3748104572296143, -2.2928411960601807, -2.210871934890747, -2.1289029121398926, -2.04693341255188, -1.9649641513824463, -1.8829950094223022, -1.8010257482528687, -1.7190566062927246, -1.637087345123291, -1.5551180839538574, -1.4731489419937134, -1.3911798000335693, -1.3092105388641357, -1.2272413969039917, -1.145272135734558, -1.063302993774414, -0.9813337326049805, -0.8993645310401917, -0.8173953294754028, -0.735426127910614, -0.6534569263458252, -0.5714877247810364, -0.48951849341392517, -0.40754929184913635, -0.32558009028434753, -0.24361085891723633, -0.1616416573524475, -0.07967245578765869, 0.002296753227710724, 0.08426596224308014, 0.16623517870903015, 0.24820438027381897, 0.3301735818386078, 0.412142813205719, 0.4941120147705078, 0.5760812163352966, 0.6580504179000854, 0.7400196194648743, 0.8219888210296631, 0.9039580821990967, 0.9859272241592407, 1.0678964853286743, 1.1498656272888184, 1.231834888458252]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 8.0, 5.0, 8.0, 8.0, 11.0, 15.0, 15.0, 14.0, 19.0, 33.0, 21.0, 45.0, 39.0, 47.0, 46.0, 68.0, 60.0, 54.0, 47.0, 48.0, 50.0, 45.0, 41.0, 41.0, 38.0, 29.0, 27.0, 22.0, 17.0, 21.0, 17.0, 11.0, 10.0, 7.0, 4.0, 3.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3710527420043945, -1.332878828048706, -1.2947050333023071, -1.2565312385559082, -1.2183573246002197, -1.1801834106445312, -1.1420096158981323, -1.1038358211517334, -1.065661907196045, -1.0274879932403564, -0.9893141984939575, -0.9511403441429138, -0.9129664897918701, -0.8747926354408264, -0.8366187810897827, -0.798444926738739, -0.7602710723876953, -0.7220972180366516, -0.6839233636856079, -0.6457495093345642, -0.6075756549835205, -0.5694018006324768, -0.5312279462814331, -0.4930540919303894, -0.4548802375793457, -0.416706383228302, -0.3785325288772583, -0.3403586745262146, -0.3021848201751709, -0.2640109658241272, -0.2258371114730835, -0.1876632571220398, -0.1494894027709961, -0.11131554841995239, -0.07314169406890869, -0.03496783971786499, 0.003206014633178711, 0.04137986898422241, 0.07955372333526611, 0.11772757768630981, 0.15590143203735352, 0.19407528638839722, 0.23224914073944092, 0.2704229950904846, 0.3085968494415283, 0.346770703792572, 0.3849445581436157, 0.4231184124946594, 0.4612922668457031, 0.4994661211967468, 0.5376399755477905, 0.5758138298988342, 0.6139876842498779, 0.6521615386009216, 0.6903353929519653, 0.728509247303009, 0.7666831016540527, 0.8048569560050964, 0.8430308103561401, 0.8812046647071838, 0.9193785190582275, 0.9575523734092712, 0.9957262277603149, 1.0339000225067139, 1.0720739364624023]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 2.0, 7.0, 13.0, 4.0, 11.0, 25.0, 34.0, 73.0, 87.0, 113.0, 182.0, 362.0, 744.0, 1802.0, 5824.0, 23841.0, 144971.0, 592936.0, 229381.0, 35812.0, 7872.0, 2397.0, 967.0, 451.0, 237.0, 119.0, 98.0, 57.0, 30.0, 22.0, 13.0, 8.0, 10.0, 16.0, 6.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.791015625, -3.678253173828125, -3.56549072265625, -3.452728271484375, -3.3399658203125, -3.227203369140625, -3.11444091796875, -3.001678466796875, -2.888916015625, -2.776153564453125, -2.66339111328125, -2.550628662109375, -2.4378662109375, -2.325103759765625, -2.21234130859375, -2.099578857421875, -1.98681640625, -1.874053955078125, -1.76129150390625, -1.648529052734375, -1.5357666015625, -1.423004150390625, -1.31024169921875, -1.197479248046875, -1.084716796875, -0.971954345703125, -0.85919189453125, -0.746429443359375, -0.6336669921875, -0.520904541015625, -0.40814208984375, -0.295379638671875, -0.1826171875, -0.069854736328125, 0.04290771484375, 0.155670166015625, 0.2684326171875, 0.381195068359375, 0.49395751953125, 0.606719970703125, 0.719482421875, 0.832244873046875, 0.94500732421875, 1.057769775390625, 1.1705322265625, 1.283294677734375, 1.39605712890625, 1.508819580078125, 1.62158203125, 1.734344482421875, 1.84710693359375, 1.959869384765625, 2.0726318359375, 2.185394287109375, 2.29815673828125, 2.410919189453125, 2.523681640625, 2.636444091796875, 2.74920654296875, 2.861968994140625, 2.9747314453125, 3.087493896484375, 3.20025634765625, 3.313018798828125, 3.42578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 15.0, 14.0, 24.0, 23.0, 31.0, 45.0, 22.0, 25.0, 34.0, 64.0, 55.0, 47.0, 61.0, 60.0, 62.0, 48.0, 50.0, 45.0, 39.0, 46.0, 29.0, 26.0, 20.0, 16.0, 20.0, 17.0, 14.0, 6.0, 9.0, 8.0, 8.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.617828369140625, -0.59454345703125, -0.571258544921875, -0.5479736328125, -0.524688720703125, -0.50140380859375, -0.478118896484375, -0.454833984375, -0.431549072265625, -0.40826416015625, -0.384979248046875, -0.3616943359375, -0.338409423828125, -0.31512451171875, -0.291839599609375, -0.2685546875, -0.245269775390625, -0.22198486328125, -0.198699951171875, -0.1754150390625, -0.152130126953125, -0.12884521484375, -0.105560302734375, -0.082275390625, -0.058990478515625, -0.03570556640625, -0.012420654296875, 0.0108642578125, 0.034149169921875, 0.05743408203125, 0.080718994140625, 0.10400390625, 0.127288818359375, 0.15057373046875, 0.173858642578125, 0.1971435546875, 0.220428466796875, 0.24371337890625, 0.266998291015625, 0.290283203125, 0.313568115234375, 0.33685302734375, 0.360137939453125, 0.3834228515625, 0.406707763671875, 0.42999267578125, 0.453277587890625, 0.4765625, 0.499847412109375, 0.52313232421875, 0.546417236328125, 0.5697021484375, 0.592987060546875, 0.61627197265625, 0.639556884765625, 0.662841796875, 0.686126708984375, 0.70941162109375, 0.732696533203125, 0.7559814453125, 0.779266357421875, 0.80255126953125, 0.825836181640625, 0.84912109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 18.0, 18.0, 39.0, 52.0, 73.0, 94.0, 167.0, 260.0, 417.0, 744.0, 1502.0, 3945.0, 15484.0, 94641.0, 603176.0, 278059.0, 37402.0, 7679.0, 2276.0, 1016.0, 565.0, 318.0, 201.0, 140.0, 87.0, 61.0, 42.0, 25.0, 14.0, 11.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.287109375, -3.192535400390625, -3.09796142578125, -3.003387451171875, -2.9088134765625, -2.814239501953125, -2.71966552734375, -2.625091552734375, -2.530517578125, -2.435943603515625, -2.34136962890625, -2.246795654296875, -2.1522216796875, -2.057647705078125, -1.96307373046875, -1.868499755859375, -1.77392578125, -1.679351806640625, -1.58477783203125, -1.490203857421875, -1.3956298828125, -1.301055908203125, -1.20648193359375, -1.111907958984375, -1.017333984375, -0.922760009765625, -0.82818603515625, -0.733612060546875, -0.6390380859375, -0.544464111328125, -0.44989013671875, -0.355316162109375, -0.2607421875, -0.166168212890625, -0.07159423828125, 0.022979736328125, 0.1175537109375, 0.212127685546875, 0.30670166015625, 0.401275634765625, 0.495849609375, 0.590423583984375, 0.68499755859375, 0.779571533203125, 0.8741455078125, 0.968719482421875, 1.06329345703125, 1.157867431640625, 1.25244140625, 1.347015380859375, 1.44158935546875, 1.536163330078125, 1.6307373046875, 1.725311279296875, 1.81988525390625, 1.914459228515625, 2.009033203125, 2.103607177734375, 2.19818115234375, 2.292755126953125, 2.3873291015625, 2.481903076171875, 2.57647705078125, 2.671051025390625, 2.765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 3.0, 6.0, 6.0, 8.0, 6.0, 13.0, 19.0, 11.0, 18.0, 21.0, 31.0, 23.0, 31.0, 33.0, 40.0, 37.0, 49.0, 45.0, 46.0, 47.0, 47.0, 33.0, 50.0, 38.0, 43.0, 46.0, 31.0, 24.0, 22.0, 17.0, 28.0, 17.0, 13.0, 21.0, 18.0, 9.0, 11.0, 9.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.96875, -2.8795166015625, -2.790283203125, -2.7010498046875, -2.61181640625, -2.5225830078125, -2.433349609375, -2.3441162109375, -2.2548828125, -2.1656494140625, -2.076416015625, -1.9871826171875, -1.89794921875, -1.8087158203125, -1.719482421875, -1.6302490234375, -1.541015625, -1.4517822265625, -1.362548828125, -1.2733154296875, -1.18408203125, -1.0948486328125, -1.005615234375, -0.9163818359375, -0.8271484375, -0.7379150390625, -0.648681640625, -0.5594482421875, -0.47021484375, -0.3809814453125, -0.291748046875, -0.2025146484375, -0.11328125, -0.0240478515625, 0.065185546875, 0.1544189453125, 0.24365234375, 0.3328857421875, 0.422119140625, 0.5113525390625, 0.6005859375, 0.6898193359375, 0.779052734375, 0.8682861328125, 0.95751953125, 1.0467529296875, 1.135986328125, 1.2252197265625, 1.314453125, 1.4036865234375, 1.492919921875, 1.5821533203125, 1.67138671875, 1.7606201171875, 1.849853515625, 1.9390869140625, 2.0283203125, 2.1175537109375, 2.206787109375, 2.2960205078125, 2.38525390625, 2.4744873046875, 2.563720703125, 2.6529541015625, 2.7421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 23.0, 36.0, 61.0, 110.0, 175.0, 393.0, 917.0, 2223.0, 6243.0, 28850.0, 406520.0, 555613.0, 35655.0, 7306.0, 2435.0, 986.0, 473.0, 229.0, 111.0, 69.0, 36.0, 22.0, 17.0, 10.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.810546875, -1.75030517578125, -1.6900634765625, -1.62982177734375, -1.569580078125, -1.50933837890625, -1.4490966796875, -1.38885498046875, -1.32861328125, -1.26837158203125, -1.2081298828125, -1.14788818359375, -1.087646484375, -1.02740478515625, -0.9671630859375, -0.90692138671875, -0.8466796875, -0.78643798828125, -0.7261962890625, -0.66595458984375, -0.605712890625, -0.54547119140625, -0.4852294921875, -0.42498779296875, -0.36474609375, -0.30450439453125, -0.2442626953125, -0.18402099609375, -0.123779296875, -0.06353759765625, -0.0032958984375, 0.05694580078125, 0.1171875, 0.17742919921875, 0.2376708984375, 0.29791259765625, 0.358154296875, 0.41839599609375, 0.4786376953125, 0.53887939453125, 0.59912109375, 0.65936279296875, 0.7196044921875, 0.77984619140625, 0.840087890625, 0.90032958984375, 0.9605712890625, 1.02081298828125, 1.0810546875, 1.14129638671875, 1.2015380859375, 1.26177978515625, 1.322021484375, 1.38226318359375, 1.4425048828125, 1.50274658203125, 1.56298828125, 1.62322998046875, 1.6834716796875, 1.74371337890625, 1.803955078125, 1.86419677734375, 1.9244384765625, 1.98468017578125, 2.044921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 15.0, 13.0, 25.0, 22.0, 35.0, 55.0, 56.0, 85.0, 92.0, 105.0, 112.0, 78.0, 76.0, 46.0, 43.0, 38.0, 19.0, 17.0, 16.0, 8.0, 9.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.000209808349609375, -0.0002022385597229004, -0.00019466876983642578, -0.00018709897994995117, -0.00017952919006347656, -0.00017195940017700195, -0.00016438961029052734, -0.00015681982040405273, -0.00014925003051757812, -0.00014168024063110352, -0.0001341104507446289, -0.0001265406608581543, -0.00011897087097167969, -0.00011140108108520508, -0.00010383129119873047, -9.626150131225586e-05, -8.869171142578125e-05, -8.112192153930664e-05, -7.355213165283203e-05, -6.598234176635742e-05, -5.841255187988281e-05, -5.08427619934082e-05, -4.3272972106933594e-05, -3.5703182220458984e-05, -2.8133392333984375e-05, -2.0563602447509766e-05, -1.2993812561035156e-05, -5.424022674560547e-06, 2.1457672119140625e-06, 9.715557098388672e-06, 1.728534698486328e-05, 2.485513687133789e-05, 3.24249267578125e-05, 3.999471664428711e-05, 4.756450653076172e-05, 5.513429641723633e-05, 6.270408630371094e-05, 7.027387619018555e-05, 7.784366607666016e-05, 8.541345596313477e-05, 9.298324584960938e-05, 0.00010055303573608398, 0.0001081228256225586, 0.0001156926155090332, 0.0001232624053955078, 0.00013083219528198242, 0.00013840198516845703, 0.00014597177505493164, 0.00015354156494140625, 0.00016111135482788086, 0.00016868114471435547, 0.00017625093460083008, 0.0001838207244873047, 0.0001913905143737793, 0.0001989603042602539, 0.00020653009414672852, 0.00021409988403320312, 0.00022166967391967773, 0.00022923946380615234, 0.00023680925369262695, 0.00024437904357910156, 0.00025194883346557617, 0.0002595186233520508, 0.0002670884132385254, 0.000274658203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 11.0, 7.0, 11.0, 17.0, 28.0, 36.0, 48.0, 63.0, 135.0, 194.0, 368.0, 720.0, 1712.0, 4369.0, 14038.0, 83231.0, 752519.0, 160904.0, 20287.0, 5797.0, 2051.0, 920.0, 423.0, 261.0, 125.0, 73.0, 47.0, 36.0, 28.0, 25.0, 11.0, 12.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.8349609375, -1.778717041015625, -1.72247314453125, -1.666229248046875, -1.6099853515625, -1.553741455078125, -1.49749755859375, -1.441253662109375, -1.385009765625, -1.328765869140625, -1.27252197265625, -1.216278076171875, -1.1600341796875, -1.103790283203125, -1.04754638671875, -0.991302490234375, -0.93505859375, -0.878814697265625, -0.82257080078125, -0.766326904296875, -0.7100830078125, -0.653839111328125, -0.59759521484375, -0.541351318359375, -0.485107421875, -0.428863525390625, -0.37261962890625, -0.316375732421875, -0.2601318359375, -0.203887939453125, -0.14764404296875, -0.091400146484375, -0.03515625, 0.021087646484375, 0.07733154296875, 0.133575439453125, 0.1898193359375, 0.246063232421875, 0.30230712890625, 0.358551025390625, 0.414794921875, 0.471038818359375, 0.52728271484375, 0.583526611328125, 0.6397705078125, 0.696014404296875, 0.75225830078125, 0.808502197265625, 0.86474609375, 0.920989990234375, 0.97723388671875, 1.033477783203125, 1.0897216796875, 1.145965576171875, 1.20220947265625, 1.258453369140625, 1.314697265625, 1.370941162109375, 1.42718505859375, 1.483428955078125, 1.5396728515625, 1.595916748046875, 1.65216064453125, 1.708404541015625, 1.7646484375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 8.0, 10.0, 21.0, 13.0, 31.0, 46.0, 65.0, 104.0, 141.0, 178.0, 125.0, 85.0, 52.0, 43.0, 25.0, 12.0, 13.0, 4.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.146484375, -2.0840606689453125, -2.021636962890625, -1.9592132568359375, -1.89678955078125, -1.8343658447265625, -1.771942138671875, -1.7095184326171875, -1.6470947265625, -1.5846710205078125, -1.522247314453125, -1.4598236083984375, -1.39739990234375, -1.3349761962890625, -1.272552490234375, -1.2101287841796875, -1.147705078125, -1.0852813720703125, -1.022857666015625, -0.9604339599609375, -0.89801025390625, -0.8355865478515625, -0.773162841796875, -0.7107391357421875, -0.6483154296875, -0.5858917236328125, -0.523468017578125, -0.4610443115234375, -0.39862060546875, -0.3361968994140625, -0.273773193359375, -0.2113494873046875, -0.14892578125, -0.0865020751953125, -0.024078369140625, 0.0383453369140625, 0.10076904296875, 0.1631927490234375, 0.225616455078125, 0.2880401611328125, 0.3504638671875, 0.4128875732421875, 0.475311279296875, 0.5377349853515625, 0.60015869140625, 0.6625823974609375, 0.725006103515625, 0.7874298095703125, 0.849853515625, 0.9122772216796875, 0.974700927734375, 1.0371246337890625, 1.09954833984375, 1.1619720458984375, 1.224395751953125, 1.2868194580078125, 1.3492431640625, 1.4116668701171875, 1.474090576171875, 1.5365142822265625, 1.59893798828125, 1.6613616943359375, 1.723785400390625, 1.7862091064453125, 1.8486328125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 14.0, 25.0, 51.0, 79.0, 111.0, 149.0, 133.0, 157.0, 84.0, 67.0, 49.0, 32.0, 14.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-33.18993377685547, -32.51729965209961, -31.844667434692383, -31.172035217285156, -30.499401092529297, -29.82676887512207, -29.154136657714844, -28.481502532958984, -27.808868408203125, -27.1362361907959, -26.46360206604004, -25.790969848632812, -25.118335723876953, -24.445703506469727, -23.7730712890625, -23.10043716430664, -22.427804946899414, -21.755172729492188, -21.082538604736328, -20.4099063873291, -19.737272262573242, -19.064640045166016, -18.392005920410156, -17.71937370300293, -17.046741485595703, -16.374109268188477, -15.701475143432617, -15.02884292602539, -14.356208801269531, -13.683576583862305, -13.010943412780762, -12.338310241699219, -11.66567611694336, -10.993042945861816, -10.320409774780273, -9.647777557373047, -8.975143432617188, -8.302511215209961, -7.629878044128418, -6.957244873046875, -6.284611701965332, -5.611978530883789, -4.939345359802246, -4.266712665557861, -3.5940794944763184, -2.9214463233947754, -2.2488136291503906, -1.5761804580688477, -0.9035472869873047, -0.23091423511505127, 0.44171881675720215, 1.114351749420166, 1.786984920501709, 2.459618091583252, 3.1322507858276367, 3.8048839569091797, 4.477517127990723, 5.150150299072266, 5.822783470153809, 6.495416164398193, 7.168049335479736, 7.840682506561279, 8.513315200805664, 9.185948371887207, 9.85858154296875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 18.0, 14.0, 19.0, 23.0, 25.0, 40.0, 53.0, 47.0, 54.0, 64.0, 77.0, 65.0, 80.0, 77.0, 71.0, 53.0, 41.0, 32.0, 39.0, 20.0, 15.0, 22.0, 10.0, 10.0, 10.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.261594772338867, -22.571834564208984, -21.88207244873047, -21.192312240600586, -20.502552032470703, -19.812789916992188, -19.123029708862305, -18.433269500732422, -17.743507385253906, -17.053747177124023, -16.363985061645508, -15.674224853515625, -14.984464645385742, -14.294703483581543, -13.604942321777344, -12.915182113647461, -12.225421905517578, -11.535660743713379, -10.845900535583496, -10.156139373779297, -9.466379165649414, -8.776618003845215, -8.086856842041016, -7.397096157073975, -6.707335472106934, -6.017574787139893, -5.327814102172852, -4.638052940368652, -3.9482922554016113, -3.2585315704345703, -2.568770408630371, -1.87900972366333, -1.1892471313476562, -0.4994863271713257, 0.19027447700500488, 0.880035400390625, 1.569796085357666, 2.259556770324707, 2.9493179321289062, 3.6390786170959473, 4.328839302062988, 5.018599987030029, 5.70836067199707, 6.3981218338012695, 7.0878825187683105, 7.777643203735352, 8.46740436553955, 9.15716552734375, 9.846925735473633, 10.536686897277832, 11.226447105407715, 11.916208267211914, 12.605968475341797, 13.295729637145996, 13.985490798950195, 14.675251007080078, 15.365012168884277, 16.054773330688477, 16.74453353881836, 17.434295654296875, 18.124055862426758, 18.81381607055664, 19.503578186035156, 20.19333839416504, 20.883098602294922]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 18.0, 26.0, 54.0, 93.0, 183.0, 357.0, 6739.0, 4185205.0, 1072.0, 254.0, 117.0, 64.0, 44.0, 14.0, 11.0, 11.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.84375, -13.249267578125, -12.65478515625, -12.060302734375, -11.4658203125, -10.871337890625, -10.27685546875, -9.682373046875, -9.087890625, -8.493408203125, -7.89892578125, -7.304443359375, -6.7099609375, -6.115478515625, -5.52099609375, -4.926513671875, -4.33203125, -3.737548828125, -3.14306640625, -2.548583984375, -1.9541015625, -1.359619140625, -0.76513671875, -0.170654296875, 0.423828125, 1.018310546875, 1.61279296875, 2.207275390625, 2.8017578125, 3.396240234375, 3.99072265625, 4.585205078125, 5.1796875, 5.774169921875, 6.36865234375, 6.963134765625, 7.5576171875, 8.152099609375, 8.74658203125, 9.341064453125, 9.935546875, 10.530029296875, 11.12451171875, 11.718994140625, 12.3134765625, 12.907958984375, 13.50244140625, 14.096923828125, 14.69140625, 15.285888671875, 15.88037109375, 16.474853515625, 17.0693359375, 17.663818359375, 18.25830078125, 18.852783203125, 19.447265625, 20.041748046875, 20.63623046875, 21.230712890625, 21.8251953125, 22.419677734375, 23.01416015625, 23.608642578125, 24.203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 6.0, 16.0, 12.0, 25.0, 26.0, 42.0, 37.0, 44.0, 42.0, 70.0, 62.0, 61.0, 56.0, 60.0, 74.0, 73.0, 48.0, 43.0, 37.0, 33.0, 26.0, 17.0, 15.0, 17.0, 10.0, 12.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.005859375, -0.976837158203125, -0.94781494140625, -0.918792724609375, -0.8897705078125, -0.860748291015625, -0.83172607421875, -0.802703857421875, -0.773681640625, -0.744659423828125, -0.71563720703125, -0.686614990234375, -0.6575927734375, -0.628570556640625, -0.59954833984375, -0.570526123046875, -0.54150390625, -0.512481689453125, -0.48345947265625, -0.454437255859375, -0.4254150390625, -0.396392822265625, -0.36737060546875, -0.338348388671875, -0.309326171875, -0.280303955078125, -0.25128173828125, -0.222259521484375, -0.1932373046875, -0.164215087890625, -0.13519287109375, -0.106170654296875, -0.0771484375, -0.048126220703125, -0.01910400390625, 0.009918212890625, 0.0389404296875, 0.067962646484375, 0.09698486328125, 0.126007080078125, 0.155029296875, 0.184051513671875, 0.21307373046875, 0.242095947265625, 0.2711181640625, 0.300140380859375, 0.32916259765625, 0.358184814453125, 0.38720703125, 0.416229248046875, 0.44525146484375, 0.474273681640625, 0.5032958984375, 0.532318115234375, 0.56134033203125, 0.590362548828125, 0.619384765625, 0.648406982421875, 0.67742919921875, 0.706451416015625, 0.7354736328125, 0.764495849609375, 0.79351806640625, 0.822540283203125, 0.8515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 8.0, 9.0, 15.0, 23.0, 30.0, 38.0, 47.0, 83.0, 106.0, 119.0, 182.0, 233.0, 279.0, 414.0, 519.0, 721.0, 1127.0, 2144.0, 5760.0, 26837.0, 599183.0, 3503246.0, 39152.0, 7214.0, 2511.0, 1236.0, 781.0, 559.0, 454.0, 341.0, 201.0, 189.0, 143.0, 102.0, 76.0, 51.0, 48.0, 39.0, 19.0, 15.0, 7.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.369140625, -2.295318603515625, -2.22149658203125, -2.147674560546875, -2.0738525390625, -2.000030517578125, -1.92620849609375, -1.852386474609375, -1.778564453125, -1.704742431640625, -1.63092041015625, -1.557098388671875, -1.4832763671875, -1.409454345703125, -1.33563232421875, -1.261810302734375, -1.18798828125, -1.114166259765625, -1.04034423828125, -0.966522216796875, -0.8927001953125, -0.818878173828125, -0.74505615234375, -0.671234130859375, -0.597412109375, -0.523590087890625, -0.44976806640625, -0.375946044921875, -0.3021240234375, -0.228302001953125, -0.15447998046875, -0.080657958984375, -0.0068359375, 0.066986083984375, 0.14080810546875, 0.214630126953125, 0.2884521484375, 0.362274169921875, 0.43609619140625, 0.509918212890625, 0.583740234375, 0.657562255859375, 0.73138427734375, 0.805206298828125, 0.8790283203125, 0.952850341796875, 1.02667236328125, 1.100494384765625, 1.17431640625, 1.248138427734375, 1.32196044921875, 1.395782470703125, 1.4696044921875, 1.543426513671875, 1.61724853515625, 1.691070556640625, 1.764892578125, 1.838714599609375, 1.91253662109375, 1.986358642578125, 2.0601806640625, 2.134002685546875, 2.20782470703125, 2.281646728515625, 2.35546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 9.0, 21.0, 41.0, 99.0, 485.0, 3011.0, 259.0, 80.0, 25.0, 15.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9603424072265625, -0.933868408203125, -0.9073944091796875, -0.88092041015625, -0.8544464111328125, -0.827972412109375, -0.8014984130859375, -0.7750244140625, -0.7485504150390625, -0.722076416015625, -0.6956024169921875, -0.66912841796875, -0.6426544189453125, -0.616180419921875, -0.5897064208984375, -0.563232421875, -0.5367584228515625, -0.510284423828125, -0.4838104248046875, -0.45733642578125, -0.4308624267578125, -0.404388427734375, -0.3779144287109375, -0.3514404296875, -0.3249664306640625, -0.298492431640625, -0.2720184326171875, -0.24554443359375, -0.2190704345703125, -0.192596435546875, -0.1661224365234375, -0.1396484375, -0.1131744384765625, -0.086700439453125, -0.0602264404296875, -0.03375244140625, -0.0072784423828125, 0.019195556640625, 0.0456695556640625, 0.0721435546875, 0.0986175537109375, 0.125091552734375, 0.1515655517578125, 0.17803955078125, 0.2045135498046875, 0.230987548828125, 0.2574615478515625, 0.283935546875, 0.3104095458984375, 0.336883544921875, 0.3633575439453125, 0.38983154296875, 0.4163055419921875, 0.442779541015625, 0.4692535400390625, 0.4957275390625, 0.5222015380859375, 0.548675537109375, 0.5751495361328125, 0.60162353515625, 0.6280975341796875, 0.654571533203125, 0.6810455322265625, 0.70751953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 21.0, 20.0, 21.0, 34.0, 64.0, 80.0, 81.0, 111.0, 138.0, 110.0, 101.0, 75.0, 38.0, 39.0, 19.0, 11.0, 11.0, 9.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0537328720092773, -1.9818326234817505, -1.9099323749542236, -1.8380321264266968, -1.76613187789917, -1.6942315101623535, -1.6223312616348267, -1.5504310131072998, -1.478530764579773, -1.406630516052246, -1.3347302675247192, -1.2628300189971924, -1.190929651260376, -1.1190295219421387, -1.0471291542053223, -0.9752289056777954, -0.9033286571502686, -0.8314284086227417, -0.7595281600952148, -0.6876278519630432, -0.6157276034355164, -0.5438273549079895, -0.47192707657814026, -0.400026798248291, -0.32812654972076416, -0.2562263011932373, -0.18432602286338806, -0.11242575943470001, -0.04052549600601196, 0.03137475252151489, 0.10327503085136414, 0.17517530918121338, 0.24707555770874023, 0.3189758062362671, 0.39087608456611633, 0.4627763628959656, 0.5346766114234924, 0.6065768599510193, 0.6784771680831909, 0.7503774166107178, 0.8222776651382446, 0.8941779136657715, 0.9660781621932983, 1.0379784107208252, 1.1098787784576416, 1.181778907775879, 1.2536792755126953, 1.3255795240402222, 1.397479772567749, 1.4693800210952759, 1.5412802696228027, 1.6131805181503296, 1.6850807666778564, 1.7569811344146729, 1.8288813829421997, 1.9007816314697266, 1.9726818799972534, 2.0445821285247803, 2.1164824962615967, 2.188382625579834, 2.2602829933166504, 2.3321831226348877, 2.404083490371704, 2.4759836196899414, 2.547883987426758]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 4.0, 8.0, 15.0, 17.0, 21.0, 15.0, 35.0, 23.0, 30.0, 24.0, 48.0, 42.0, 36.0, 38.0, 51.0, 42.0, 48.0, 42.0, 46.0, 41.0, 54.0, 39.0, 35.0, 29.0, 40.0, 39.0, 33.0, 17.0, 15.0, 15.0, 13.0, 9.0, 10.0, 4.0, 3.0, 7.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796478033065796, -1.7438796758651733, -1.6912813186645508, -1.6386830806732178, -1.5860847234725952, -1.5334863662719727, -1.4808881282806396, -1.428289771080017, -1.3756914138793945, -1.323093056678772, -1.2704946994781494, -1.2178964614868164, -1.1652981042861938, -1.1126997470855713, -1.0601015090942383, -1.0075031518936157, -0.9549047946929932, -0.9023064374923706, -0.8497081398963928, -0.797109842300415, -0.7445114850997925, -0.6919131278991699, -0.6393148303031921, -0.5867165327072144, -0.5341181755065918, -0.4815198481082916, -0.42892152070999146, -0.3763231933116913, -0.3237248659133911, -0.27112653851509094, -0.21852821111679077, -0.1659298837184906, -0.11333167552947998, -0.06073334813117981, -0.008135020732879639, 0.04446330666542053, 0.0970616340637207, 0.14965996146202087, 0.20225828886032104, 0.2548566162586212, 0.3074549436569214, 0.36005327105522156, 0.41265159845352173, 0.4652499258518219, 0.5178482532501221, 0.5704466104507446, 0.6230449080467224, 0.6756432056427002, 0.7282415628433228, 0.7808399200439453, 0.8334382176399231, 0.8860365152359009, 0.9386348724365234, 0.991233229637146, 1.0438315868377686, 1.0964298248291016, 1.1490281820297241, 1.2016265392303467, 1.2542247772216797, 1.3068231344223022, 1.3594214916229248, 1.4120198488235474, 1.46461820602417, 1.517216444015503, 1.5698148012161255]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 8.0, 4.0, 9.0, 10.0, 20.0, 19.0, 22.0, 36.0, 47.0, 76.0, 148.0, 227.0, 446.0, 866.0, 2022.0, 5388.0, 18141.0, 83605.0, 424793.0, 407129.0, 79050.0, 17276.0, 5355.0, 1945.0, 876.0, 395.0, 242.0, 139.0, 80.0, 57.0, 36.0, 17.0, 21.0, 13.0, 11.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.794921875, -2.71502685546875, -2.6351318359375, -2.55523681640625, -2.475341796875, -2.39544677734375, -2.3155517578125, -2.23565673828125, -2.15576171875, -2.07586669921875, -1.9959716796875, -1.91607666015625, -1.836181640625, -1.75628662109375, -1.6763916015625, -1.59649658203125, -1.5166015625, -1.43670654296875, -1.3568115234375, -1.27691650390625, -1.197021484375, -1.11712646484375, -1.0372314453125, -0.95733642578125, -0.87744140625, -0.79754638671875, -0.7176513671875, -0.63775634765625, -0.557861328125, -0.47796630859375, -0.3980712890625, -0.31817626953125, -0.23828125, -0.15838623046875, -0.0784912109375, 0.00140380859375, 0.081298828125, 0.16119384765625, 0.2410888671875, 0.32098388671875, 0.40087890625, 0.48077392578125, 0.5606689453125, 0.64056396484375, 0.720458984375, 0.80035400390625, 0.8802490234375, 0.96014404296875, 1.0400390625, 1.11993408203125, 1.1998291015625, 1.27972412109375, 1.359619140625, 1.43951416015625, 1.5194091796875, 1.59930419921875, 1.67919921875, 1.75909423828125, 1.8389892578125, 1.91888427734375, 1.998779296875, 2.07867431640625, 2.1585693359375, 2.23846435546875, 2.318359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 14.0, 18.0, 21.0, 36.0, 36.0, 40.0, 35.0, 48.0, 48.0, 64.0, 55.0, 79.0, 65.0, 56.0, 54.0, 53.0, 46.0, 38.0, 34.0, 29.0, 21.0, 19.0, 20.0, 10.0, 9.0, 10.0, 1.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9482421875, -0.9201507568359375, -0.892059326171875, -0.8639678955078125, -0.83587646484375, -0.8077850341796875, -0.779693603515625, -0.7516021728515625, -0.7235107421875, -0.6954193115234375, -0.667327880859375, -0.6392364501953125, -0.61114501953125, -0.5830535888671875, -0.554962158203125, -0.5268707275390625, -0.498779296875, -0.4706878662109375, -0.442596435546875, -0.4145050048828125, -0.38641357421875, -0.3583221435546875, -0.330230712890625, -0.3021392822265625, -0.2740478515625, -0.2459564208984375, -0.217864990234375, -0.1897735595703125, -0.16168212890625, -0.1335906982421875, -0.105499267578125, -0.0774078369140625, -0.04931640625, -0.0212249755859375, 0.006866455078125, 0.0349578857421875, 0.06304931640625, 0.0911407470703125, 0.119232177734375, 0.1473236083984375, 0.1754150390625, 0.2035064697265625, 0.231597900390625, 0.2596893310546875, 0.28778076171875, 0.3158721923828125, 0.343963623046875, 0.3720550537109375, 0.400146484375, 0.4282379150390625, 0.456329345703125, 0.4844207763671875, 0.51251220703125, 0.5406036376953125, 0.568695068359375, 0.5967864990234375, 0.6248779296875, 0.6529693603515625, 0.681060791015625, 0.7091522216796875, 0.73724365234375, 0.7653350830078125, 0.793426513671875, 0.8215179443359375, 0.849609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 6.0, 10.0, 11.0, 23.0, 26.0, 44.0, 58.0, 103.0, 149.0, 209.0, 418.0, 802.0, 1600.0, 4743.0, 26392.0, 429842.0, 542450.0, 32604.0, 5259.0, 1830.0, 814.0, 449.0, 253.0, 135.0, 101.0, 78.0, 43.0, 26.0, 12.0, 14.0, 16.0, 11.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.409942626953125, -3.29644775390625, -3.182952880859375, -3.0694580078125, -2.955963134765625, -2.84246826171875, -2.728973388671875, -2.615478515625, -2.501983642578125, -2.38848876953125, -2.274993896484375, -2.1614990234375, -2.048004150390625, -1.93450927734375, -1.821014404296875, -1.70751953125, -1.594024658203125, -1.48052978515625, -1.367034912109375, -1.2535400390625, -1.140045166015625, -1.02655029296875, -0.913055419921875, -0.799560546875, -0.686065673828125, -0.57257080078125, -0.459075927734375, -0.3455810546875, -0.232086181640625, -0.11859130859375, -0.005096435546875, 0.1083984375, 0.221893310546875, 0.33538818359375, 0.448883056640625, 0.5623779296875, 0.675872802734375, 0.78936767578125, 0.902862548828125, 1.016357421875, 1.129852294921875, 1.24334716796875, 1.356842041015625, 1.4703369140625, 1.583831787109375, 1.69732666015625, 1.810821533203125, 1.92431640625, 2.037811279296875, 2.15130615234375, 2.264801025390625, 2.3782958984375, 2.491790771484375, 2.60528564453125, 2.718780517578125, 2.832275390625, 2.945770263671875, 3.05926513671875, 3.172760009765625, 3.2862548828125, 3.399749755859375, 3.51324462890625, 3.626739501953125, 3.740234375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 2.0, 14.0, 7.0, 10.0, 17.0, 20.0, 38.0, 36.0, 50.0, 68.0, 55.0, 67.0, 63.0, 73.0, 73.0, 65.0, 76.0, 63.0, 55.0, 40.0, 31.0, 20.0, 17.0, 13.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8125, -3.6571044921875, -3.501708984375, -3.3463134765625, -3.19091796875, -3.0355224609375, -2.880126953125, -2.7247314453125, -2.5693359375, -2.4139404296875, -2.258544921875, -2.1031494140625, -1.94775390625, -1.7923583984375, -1.636962890625, -1.4815673828125, -1.326171875, -1.1707763671875, -1.015380859375, -0.8599853515625, -0.70458984375, -0.5491943359375, -0.393798828125, -0.2384033203125, -0.0830078125, 0.0723876953125, 0.227783203125, 0.3831787109375, 0.53857421875, 0.6939697265625, 0.849365234375, 1.0047607421875, 1.16015625, 1.3155517578125, 1.470947265625, 1.6263427734375, 1.78173828125, 1.9371337890625, 2.092529296875, 2.2479248046875, 2.4033203125, 2.5587158203125, 2.714111328125, 2.8695068359375, 3.02490234375, 3.1802978515625, 3.335693359375, 3.4910888671875, 3.646484375, 3.8018798828125, 3.957275390625, 4.1126708984375, 4.26806640625, 4.4234619140625, 4.578857421875, 4.7342529296875, 4.8896484375, 5.0450439453125, 5.200439453125, 5.3558349609375, 5.51123046875, 5.6666259765625, 5.822021484375, 5.9774169921875, 6.1328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 10.0, 11.0, 15.0, 42.0, 84.0, 180.0, 968.0, 12392.0, 1022541.0, 11053.0, 893.0, 197.0, 66.0, 34.0, 17.0, 14.0, 11.0, 11.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.857421875, -3.677886962890625, -3.49835205078125, -3.318817138671875, -3.1392822265625, -2.959747314453125, -2.78021240234375, -2.600677490234375, -2.421142578125, -2.241607666015625, -2.06207275390625, -1.882537841796875, -1.7030029296875, -1.523468017578125, -1.34393310546875, -1.164398193359375, -0.98486328125, -0.805328369140625, -0.62579345703125, -0.446258544921875, -0.2667236328125, -0.087188720703125, 0.09234619140625, 0.271881103515625, 0.451416015625, 0.630950927734375, 0.81048583984375, 0.990020751953125, 1.1695556640625, 1.349090576171875, 1.52862548828125, 1.708160400390625, 1.8876953125, 2.067230224609375, 2.24676513671875, 2.426300048828125, 2.6058349609375, 2.785369873046875, 2.96490478515625, 3.144439697265625, 3.323974609375, 3.503509521484375, 3.68304443359375, 3.862579345703125, 4.0421142578125, 4.221649169921875, 4.40118408203125, 4.580718994140625, 4.76025390625, 4.939788818359375, 5.11932373046875, 5.298858642578125, 5.4783935546875, 5.657928466796875, 5.83746337890625, 6.016998291015625, 6.196533203125, 6.376068115234375, 6.55560302734375, 6.735137939453125, 6.9146728515625, 7.094207763671875, 7.27374267578125, 7.453277587890625, 7.6328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 7.0, 9.0, 9.0, 8.0, 17.0, 20.0, 41.0, 37.0, 62.0, 84.0, 104.0, 127.0, 116.0, 92.0, 67.0, 61.0, 47.0, 19.0, 21.0, 14.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025343894958496094, -0.0002459511160850525, -0.00023846328258514404, -0.0002309754490852356, -0.00022348761558532715, -0.0002159997820854187, -0.00020851194858551025, -0.0002010241150856018, -0.00019353628158569336, -0.0001860484480857849, -0.00017856061458587646, -0.00017107278108596802, -0.00016358494758605957, -0.00015609711408615112, -0.00014860928058624268, -0.00014112144708633423, -0.00013363361358642578, -0.00012614578008651733, -0.00011865794658660889, -0.00011117011308670044, -0.00010368227958679199, -9.619444608688354e-05, -8.87066125869751e-05, -8.121877908706665e-05, -7.37309455871582e-05, -6.624311208724976e-05, -5.875527858734131e-05, -5.126744508743286e-05, -4.3779611587524414e-05, -3.629177808761597e-05, -2.880394458770752e-05, -2.1316111087799072e-05, -1.3828277587890625e-05, -6.340444087982178e-06, 1.1473894119262695e-06, 8.635222911834717e-06, 1.6123056411743164e-05, 2.361088991165161e-05, 3.109872341156006e-05, 3.8586556911468506e-05, 4.607439041137695e-05, 5.35622239112854e-05, 6.105005741119385e-05, 6.85378909111023e-05, 7.602572441101074e-05, 8.351355791091919e-05, 9.100139141082764e-05, 9.848922491073608e-05, 0.00010597705841064453, 0.00011346489191055298, 0.00012095272541046143, 0.00012844055891036987, 0.00013592839241027832, 0.00014341622591018677, 0.00015090405941009521, 0.00015839189291000366, 0.0001658797264099121, 0.00017336755990982056, 0.000180855393409729, 0.00018834322690963745, 0.0001958310604095459, 0.00020331889390945435, 0.0002108067274093628, 0.00021829456090927124, 0.0002257823944091797]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 6.0, 10.0, 16.0, 31.0, 66.0, 114.0, 282.0, 1099.0, 7694.0, 964429.0, 71109.0, 2789.0, 540.0, 171.0, 79.0, 42.0, 24.0, 11.0, 15.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.42266845703125, -4.2789306640625, -4.13519287109375, -3.991455078125, -3.84771728515625, -3.7039794921875, -3.56024169921875, -3.41650390625, -3.27276611328125, -3.1290283203125, -2.98529052734375, -2.841552734375, -2.69781494140625, -2.5540771484375, -2.41033935546875, -2.2666015625, -2.12286376953125, -1.9791259765625, -1.83538818359375, -1.691650390625, -1.54791259765625, -1.4041748046875, -1.26043701171875, -1.11669921875, -0.97296142578125, -0.8292236328125, -0.68548583984375, -0.541748046875, -0.39801025390625, -0.2542724609375, -0.11053466796875, 0.033203125, 0.17694091796875, 0.3206787109375, 0.46441650390625, 0.608154296875, 0.75189208984375, 0.8956298828125, 1.03936767578125, 1.18310546875, 1.32684326171875, 1.4705810546875, 1.61431884765625, 1.758056640625, 1.90179443359375, 2.0455322265625, 2.18927001953125, 2.3330078125, 2.47674560546875, 2.6204833984375, 2.76422119140625, 2.907958984375, 3.05169677734375, 3.1954345703125, 3.33917236328125, 3.48291015625, 3.62664794921875, 3.7703857421875, 3.91412353515625, 4.057861328125, 4.20159912109375, 4.3453369140625, 4.48907470703125, 4.6328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 12.0, 16.0, 32.0, 118.0, 281.0, 273.0, 192.0, 41.0, 18.0, 7.0, 2.0, 7.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5859375, -5.4722747802734375, -5.358612060546875, -5.2449493408203125, -5.13128662109375, -5.0176239013671875, -4.903961181640625, -4.7902984619140625, -4.6766357421875, -4.5629730224609375, -4.449310302734375, -4.3356475830078125, -4.22198486328125, -4.1083221435546875, -3.994659423828125, -3.8809967041015625, -3.767333984375, -3.6536712646484375, -3.540008544921875, -3.4263458251953125, -3.31268310546875, -3.1990203857421875, -3.085357666015625, -2.9716949462890625, -2.8580322265625, -2.7443695068359375, -2.630706787109375, -2.5170440673828125, -2.40338134765625, -2.2897186279296875, -2.176055908203125, -2.0623931884765625, -1.94873046875, -1.8350677490234375, -1.721405029296875, -1.6077423095703125, -1.49407958984375, -1.3804168701171875, -1.266754150390625, -1.1530914306640625, -1.0394287109375, -0.9257659912109375, -0.812103271484375, -0.6984405517578125, -0.58477783203125, -0.4711151123046875, -0.357452392578125, -0.2437896728515625, -0.130126953125, -0.0164642333984375, 0.097198486328125, 0.2108612060546875, 0.32452392578125, 0.4381866455078125, 0.551849365234375, 0.6655120849609375, 0.7791748046875, 0.8928375244140625, 1.006500244140625, 1.1201629638671875, 1.23382568359375, 1.3474884033203125, 1.461151123046875, 1.5748138427734375, 1.6884765625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 11.0, 11.0, 17.0, 55.0, 217.0, 437.0, 207.0, 40.0, 9.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.18252182006836, -44.0576171875, -41.93271255493164, -39.80780792236328, -37.68290710449219, -35.55799865722656, -33.43309783935547, -31.30819320678711, -29.18328857421875, -27.05838394165039, -24.93347930908203, -22.808576583862305, -20.683671951293945, -18.558767318725586, -16.43386459350586, -14.3089599609375, -12.18405532836914, -10.059150695800781, -7.934247016906738, -5.809342861175537, -3.684438705444336, -1.5595340728759766, 0.5653696060180664, 2.6902732849121094, 4.815177917480469, 6.94008207321167, 9.064986228942871, 11.189889907836914, 13.314794540405273, 15.439699172973633, 17.56460189819336, 19.68950653076172, 21.814414978027344, 23.939319610595703, 26.064224243164062, 28.18912696838379, 30.31403160095215, 32.438934326171875, 34.563838958740234, 36.688743591308594, 38.81364822387695, 40.93855285644531, 43.06345748901367, 45.18836212158203, 47.313262939453125, 49.43817138671875, 51.563072204589844, 53.6879768371582, 55.81288146972656, 57.93778610229492, 60.06269073486328, 62.18759536743164, 64.3125, 66.4374008178711, 68.56230926513672, 70.68721008300781, 72.81211853027344, 74.93701934814453, 77.06192779541016, 79.18682861328125, 81.31173706054688, 83.43663787841797, 85.5615463256836, 87.68644714355469, 89.81134796142578]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 16.0, 11.0, 13.0, 18.0, 21.0, 23.0, 35.0, 35.0, 51.0, 43.0, 64.0, 63.0, 62.0, 62.0, 61.0, 69.0, 76.0, 50.0, 47.0, 25.0, 21.0, 22.0, 24.0, 21.0, 13.0, 17.0, 12.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.7541446685791, -19.141265869140625, -18.52838897705078, -17.915510177612305, -17.30263328552246, -16.689754486083984, -16.07687759399414, -15.463998794555664, -14.851120948791504, -14.238243103027344, -13.625365257263184, -13.012487411499023, -12.399608612060547, -11.786731719970703, -11.173852920532227, -10.560975074768066, -9.948097229003906, -9.335219383239746, -8.722341537475586, -8.109463691711426, -7.496585369110107, -6.883707523345947, -6.270829200744629, -5.657951354980469, -5.045073509216309, -4.432195663452148, -3.819317579269409, -3.20643949508667, -2.5935616493225098, -1.9806838035583496, -1.3678057193756104, -0.7549276351928711, -0.14204978942871094, 0.47082817554473877, 1.0837061405181885, 1.6965841054916382, 2.309462070465088, 2.922339916229248, 3.5352180004119873, 4.148096084594727, 4.760973930358887, 5.373851776123047, 5.986729621887207, 6.599607944488525, 7.2124857902526855, 7.825363636016846, 8.438241958618164, 9.051119804382324, 9.663997650146484, 10.276875495910645, 10.889753341674805, 11.502631187438965, 12.115509033203125, 12.728387832641602, 13.341265678405762, 13.954143524169922, 14.567021369934082, 15.179899215698242, 15.792777061462402, 16.405654907226562, 17.01853370666504, 17.631410598754883, 18.24428939819336, 18.857166290283203, 19.47004508972168]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 10.0, 6.0, 18.0, 24.0, 55.0, 77.0, 155.0, 252.0, 606.0, 1517.0, 4933.0, 33167.0, 4081102.0, 62549.0, 6551.0, 1840.0, 692.0, 331.0, 165.0, 98.0, 35.0, 33.0, 13.0, 16.0, 5.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.242584228515625, -2.14337158203125, -2.044158935546875, -1.9449462890625, -1.845733642578125, -1.74652099609375, -1.647308349609375, -1.548095703125, -1.448883056640625, -1.34967041015625, -1.250457763671875, -1.1512451171875, -1.052032470703125, -0.95281982421875, -0.853607177734375, -0.75439453125, -0.655181884765625, -0.55596923828125, -0.456756591796875, -0.3575439453125, -0.258331298828125, -0.15911865234375, -0.059906005859375, 0.039306640625, 0.138519287109375, 0.23773193359375, 0.336944580078125, 0.4361572265625, 0.535369873046875, 0.63458251953125, 0.733795166015625, 0.8330078125, 0.932220458984375, 1.03143310546875, 1.130645751953125, 1.2298583984375, 1.329071044921875, 1.42828369140625, 1.527496337890625, 1.626708984375, 1.725921630859375, 1.82513427734375, 1.924346923828125, 2.0235595703125, 2.122772216796875, 2.22198486328125, 2.321197509765625, 2.42041015625, 2.519622802734375, 2.61883544921875, 2.718048095703125, 2.8172607421875, 2.916473388671875, 3.01568603515625, 3.114898681640625, 3.214111328125, 3.313323974609375, 3.41253662109375, 3.511749267578125, 3.6109619140625, 3.710174560546875, 3.80938720703125, 3.908599853515625, 4.0078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 7.0, 10.0, 9.0, 17.0, 36.0, 35.0, 43.0, 68.0, 63.0, 89.0, 96.0, 88.0, 92.0, 68.0, 70.0, 50.0, 42.0, 32.0, 28.0, 15.0, 15.0, 11.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.716796875, -1.6753463745117188, -1.6338958740234375, -1.5924453735351562, -1.550994873046875, -1.5095443725585938, -1.4680938720703125, -1.4266433715820312, -1.38519287109375, -1.3437423706054688, -1.3022918701171875, -1.2608413696289062, -1.219390869140625, -1.1779403686523438, -1.1364898681640625, -1.0950393676757812, -1.0535888671875, -1.0121383666992188, -0.9706878662109375, -0.9292373657226562, -0.887786865234375, -0.8463363647460938, -0.8048858642578125, -0.7634353637695312, -0.72198486328125, -0.6805343627929688, -0.6390838623046875, -0.5976333618164062, -0.556182861328125, -0.5147323608398438, -0.4732818603515625, -0.43183135986328125, -0.390380859375, -0.34893035888671875, -0.3074798583984375, -0.26602935791015625, -0.224578857421875, -0.18312835693359375, -0.1416778564453125, -0.10022735595703125, -0.05877685546875, -0.01732635498046875, 0.0241241455078125, 0.06557464599609375, 0.107025146484375, 0.14847564697265625, 0.1899261474609375, 0.23137664794921875, 0.2728271484375, 0.31427764892578125, 0.3557281494140625, 0.39717864990234375, 0.438629150390625, 0.48007965087890625, 0.5215301513671875, 0.5629806518554688, 0.60443115234375, 0.6458816528320312, 0.6873321533203125, 0.7287826538085938, 0.770233154296875, 0.8116836547851562, 0.8531341552734375, 0.8945846557617188, 0.93603515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 14.0, 16.0, 28.0, 26.0, 29.0, 34.0, 66.0, 71.0, 85.0, 133.0, 181.0, 310.0, 467.0, 894.0, 2135.0, 6651.0, 45182.0, 4016353.0, 105919.0, 10079.0, 2789.0, 1135.0, 569.0, 337.0, 213.0, 125.0, 100.0, 81.0, 56.0, 38.0, 33.0, 38.0, 19.0, 23.0, 13.0, 4.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.830078125, -2.745941162109375, -2.66180419921875, -2.577667236328125, -2.4935302734375, -2.409393310546875, -2.32525634765625, -2.241119384765625, -2.156982421875, -2.072845458984375, -1.98870849609375, -1.904571533203125, -1.8204345703125, -1.736297607421875, -1.65216064453125, -1.568023681640625, -1.48388671875, -1.399749755859375, -1.31561279296875, -1.231475830078125, -1.1473388671875, -1.063201904296875, -0.97906494140625, -0.894927978515625, -0.810791015625, -0.726654052734375, -0.64251708984375, -0.558380126953125, -0.4742431640625, -0.390106201171875, -0.30596923828125, -0.221832275390625, -0.1376953125, -0.053558349609375, 0.03057861328125, 0.114715576171875, 0.1988525390625, 0.282989501953125, 0.36712646484375, 0.451263427734375, 0.535400390625, 0.619537353515625, 0.70367431640625, 0.787811279296875, 0.8719482421875, 0.956085205078125, 1.04022216796875, 1.124359130859375, 1.20849609375, 1.292633056640625, 1.37677001953125, 1.460906982421875, 1.5450439453125, 1.629180908203125, 1.71331787109375, 1.797454833984375, 1.881591796875, 1.965728759765625, 2.04986572265625, 2.134002685546875, 2.2181396484375, 2.302276611328125, 2.38641357421875, 2.470550537109375, 2.5546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 21.0, 63.0, 161.0, 3030.0, 561.0, 121.0, 37.0, 24.0, 10.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69287109375, -0.6717681884765625, -0.650665283203125, -0.6295623779296875, -0.60845947265625, -0.5873565673828125, -0.566253662109375, -0.5451507568359375, -0.5240478515625, -0.5029449462890625, -0.481842041015625, -0.4607391357421875, -0.43963623046875, -0.4185333251953125, -0.397430419921875, -0.3763275146484375, -0.355224609375, -0.3341217041015625, -0.313018798828125, -0.2919158935546875, -0.27081298828125, -0.2497100830078125, -0.228607177734375, -0.2075042724609375, -0.1864013671875, -0.1652984619140625, -0.144195556640625, -0.1230926513671875, -0.10198974609375, -0.0808868408203125, -0.059783935546875, -0.0386810302734375, -0.017578125, 0.0035247802734375, 0.024627685546875, 0.0457305908203125, 0.06683349609375, 0.0879364013671875, 0.109039306640625, 0.1301422119140625, 0.1512451171875, 0.1723480224609375, 0.193450927734375, 0.2145538330078125, 0.23565673828125, 0.2567596435546875, 0.277862548828125, 0.2989654541015625, 0.320068359375, 0.3411712646484375, 0.362274169921875, 0.3833770751953125, 0.40447998046875, 0.4255828857421875, 0.446685791015625, 0.4677886962890625, 0.4888916015625, 0.5099945068359375, 0.531097412109375, 0.5522003173828125, 0.57330322265625, 0.5944061279296875, 0.615509033203125, 0.6366119384765625, 0.65771484375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 17.0, 27.0, 61.0, 81.0, 110.0, 167.0, 160.0, 142.0, 124.0, 41.0, 27.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.570201873779297, -2.4905529022216797, -2.4109039306640625, -2.331254720687866, -2.251605749130249, -2.171956777572632, -2.0923078060150146, -2.0126585960388184, -1.9330096244812012, -1.853360652923584, -1.7737115621566772, -1.69406259059906, -1.6144134998321533, -1.5347645282745361, -1.455115556716919, -1.3754664659500122, -1.295817494392395, -1.2161685228347778, -1.136519432067871, -1.056870460510254, -0.9772213697433472, -0.89757239818573, -0.817923367023468, -0.738274335861206, -0.6586253046989441, -0.5789762735366821, -0.49932724237442017, -0.4196782410144806, -0.34002920985221863, -0.26038017868995667, -0.1807311773300171, -0.10108214616775513, -0.021433115005493164, 0.0582159087061882, 0.13786493241786957, 0.21751394867897034, 0.2971629798412323, 0.37681201100349426, 0.45646101236343384, 0.5361100435256958, 0.6157590746879578, 0.6954081058502197, 0.7750571370124817, 0.8547061681747437, 0.9343551397323608, 1.0140042304992676, 1.0936532020568848, 1.173302173614502, 1.2529512643814087, 1.3326002359390259, 1.4122493267059326, 1.4918982982635498, 1.5715473890304565, 1.6511963605880737, 1.7308454513549805, 1.8104944229125977, 1.8901433944702148, 1.969792366027832, 2.049441337585449, 2.1290905475616455, 2.2087395191192627, 2.28838849067688, 2.368037462234497, 2.4476866722106934, 2.5273356437683105]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 11.0, 14.0, 8.0, 15.0, 19.0, 15.0, 29.0, 34.0, 29.0, 30.0, 29.0, 39.0, 44.0, 37.0, 43.0, 54.0, 50.0, 55.0, 48.0, 43.0, 35.0, 32.0, 34.0, 37.0, 35.0, 29.0, 22.0, 14.0, 17.0, 14.0, 13.0, 10.0, 8.0, 11.0, 7.0, 4.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0114667415618896, -0.9792153835296631, -0.9469640851020813, -0.9147127270698547, -0.882461428642273, -0.8502100706100464, -0.8179587125778198, -0.785707414150238, -0.7534561157226562, -0.7212047576904297, -0.6889534592628479, -0.6567021012306213, -0.6244508028030396, -0.592199444770813, -0.5599480867385864, -0.5276967883110046, -0.4954454302787781, -0.4631941020488739, -0.4309427738189697, -0.39869141578674316, -0.3664401173591614, -0.3341887593269348, -0.30193743109703064, -0.26968610286712646, -0.2374347746372223, -0.20518344640731812, -0.17293211817741394, -0.14068077504634857, -0.1084294468164444, -0.07617811858654022, -0.043926775455474854, -0.011675447225570679, 0.020575881004333496, 0.05282721295952797, 0.08507854491472244, 0.11732988059520721, 0.1495812088251114, 0.18183253705501556, 0.21408388018608093, 0.2463352084159851, 0.2785865366458893, 0.31083786487579346, 0.34308919310569763, 0.3753405213356018, 0.40759187936782837, 0.43984317779541016, 0.4720945358276367, 0.5043458938598633, 0.5365971922874451, 0.5688485503196716, 0.6010998487472534, 0.63335120677948, 0.6656025052070618, 0.6978538632392883, 0.7301051616668701, 0.7623565196990967, 0.7946078777313232, 0.8268592357635498, 0.8591105341911316, 0.8913618922233582, 0.9236131906509399, 0.9558645486831665, 0.9881159067153931, 1.02036714553833, 1.0526185035705566]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 8.0, 5.0, 3.0, 11.0, 11.0, 15.0, 23.0, 51.0, 57.0, 78.0, 148.0, 302.0, 477.0, 994.0, 2208.0, 5939.0, 19987.0, 88387.0, 416098.0, 400469.0, 83986.0, 19174.0, 5695.0, 2242.0, 982.0, 540.0, 242.0, 158.0, 79.0, 55.0, 43.0, 29.0, 15.0, 11.0, 12.0, 12.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.88671875, -1.821624755859375, -1.75653076171875, -1.691436767578125, -1.6263427734375, -1.561248779296875, -1.49615478515625, -1.431060791015625, -1.365966796875, -1.300872802734375, -1.23577880859375, -1.170684814453125, -1.1055908203125, -1.040496826171875, -0.97540283203125, -0.910308837890625, -0.84521484375, -0.780120849609375, -0.71502685546875, -0.649932861328125, -0.5848388671875, -0.519744873046875, -0.45465087890625, -0.389556884765625, -0.324462890625, -0.259368896484375, -0.19427490234375, -0.129180908203125, -0.0640869140625, 0.001007080078125, 0.06610107421875, 0.131195068359375, 0.1962890625, 0.261383056640625, 0.32647705078125, 0.391571044921875, 0.4566650390625, 0.521759033203125, 0.58685302734375, 0.651947021484375, 0.717041015625, 0.782135009765625, 0.84722900390625, 0.912322998046875, 0.9774169921875, 1.042510986328125, 1.10760498046875, 1.172698974609375, 1.23779296875, 1.302886962890625, 1.36798095703125, 1.433074951171875, 1.4981689453125, 1.563262939453125, 1.62835693359375, 1.693450927734375, 1.758544921875, 1.823638916015625, 1.88873291015625, 1.953826904296875, 2.0189208984375, 2.084014892578125, 2.14910888671875, 2.214202880859375, 2.279296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 12.0, 8.0, 18.0, 18.0, 33.0, 51.0, 58.0, 67.0, 61.0, 75.0, 71.0, 93.0, 80.0, 77.0, 57.0, 50.0, 37.0, 33.0, 29.0, 20.0, 11.0, 13.0, 4.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5556640625, -1.5158767700195312, -1.4760894775390625, -1.4363021850585938, -1.396514892578125, -1.3567276000976562, -1.3169403076171875, -1.2771530151367188, -1.23736572265625, -1.1975784301757812, -1.1577911376953125, -1.1180038452148438, -1.078216552734375, -1.0384292602539062, -0.9986419677734375, -0.9588546752929688, -0.9190673828125, -0.8792800903320312, -0.8394927978515625, -0.7997055053710938, -0.759918212890625, -0.7201309204101562, -0.6803436279296875, -0.6405563354492188, -0.60076904296875, -0.5609817504882812, -0.5211944580078125, -0.48140716552734375, -0.441619873046875, -0.40183258056640625, -0.3620452880859375, -0.32225799560546875, -0.282470703125, -0.24268341064453125, -0.2028961181640625, -0.16310882568359375, -0.123321533203125, -0.08353424072265625, -0.0437469482421875, -0.00395965576171875, 0.03582763671875, 0.07561492919921875, 0.1154022216796875, 0.15518951416015625, 0.194976806640625, 0.23476409912109375, 0.2745513916015625, 0.31433868408203125, 0.3541259765625, 0.39391326904296875, 0.4337005615234375, 0.47348785400390625, 0.513275146484375, 0.5530624389648438, 0.5928497314453125, 0.6326370239257812, 0.67242431640625, 0.7122116088867188, 0.7519989013671875, 0.7917861938476562, 0.831573486328125, 0.8713607788085938, 0.9111480712890625, 0.9509353637695312, 0.99072265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 15.0, 31.0, 40.0, 90.0, 161.0, 288.0, 636.0, 1438.0, 5399.0, 134831.0, 878180.0, 22885.0, 2671.0, 927.0, 485.0, 209.0, 115.0, 63.0, 35.0, 17.0, 16.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.03192138671875, -3.8724365234375, -3.71295166015625, -3.553466796875, -3.39398193359375, -3.2344970703125, -3.07501220703125, -2.91552734375, -2.75604248046875, -2.5965576171875, -2.43707275390625, -2.277587890625, -2.11810302734375, -1.9586181640625, -1.79913330078125, -1.6396484375, -1.48016357421875, -1.3206787109375, -1.16119384765625, -1.001708984375, -0.84222412109375, -0.6827392578125, -0.52325439453125, -0.36376953125, -0.20428466796875, -0.0447998046875, 0.11468505859375, 0.274169921875, 0.43365478515625, 0.5931396484375, 0.75262451171875, 0.912109375, 1.07159423828125, 1.2310791015625, 1.39056396484375, 1.550048828125, 1.70953369140625, 1.8690185546875, 2.02850341796875, 2.18798828125, 2.34747314453125, 2.5069580078125, 2.66644287109375, 2.825927734375, 2.98541259765625, 3.1448974609375, 3.30438232421875, 3.4638671875, 3.62335205078125, 3.7828369140625, 3.94232177734375, 4.101806640625, 4.26129150390625, 4.4207763671875, 4.58026123046875, 4.73974609375, 4.89923095703125, 5.0587158203125, 5.21820068359375, 5.377685546875, 5.53717041015625, 5.6966552734375, 5.85614013671875, 6.015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 9.0, 11.0, 6.0, 6.0, 15.0, 13.0, 12.0, 27.0, 29.0, 31.0, 33.0, 39.0, 42.0, 44.0, 52.0, 48.0, 49.0, 62.0, 55.0, 52.0, 41.0, 39.0, 45.0, 30.0, 28.0, 30.0, 25.0, 21.0, 26.0, 15.0, 9.0, 12.0, 8.0, 6.0, 4.0, 3.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.66015625, -3.541351318359375, -3.42254638671875, -3.303741455078125, -3.1849365234375, -3.066131591796875, -2.94732666015625, -2.828521728515625, -2.709716796875, -2.590911865234375, -2.47210693359375, -2.353302001953125, -2.2344970703125, -2.115692138671875, -1.99688720703125, -1.878082275390625, -1.75927734375, -1.640472412109375, -1.52166748046875, -1.402862548828125, -1.2840576171875, -1.165252685546875, -1.04644775390625, -0.927642822265625, -0.808837890625, -0.690032958984375, -0.57122802734375, -0.452423095703125, -0.3336181640625, -0.214813232421875, -0.09600830078125, 0.022796630859375, 0.1416015625, 0.260406494140625, 0.37921142578125, 0.498016357421875, 0.6168212890625, 0.735626220703125, 0.85443115234375, 0.973236083984375, 1.092041015625, 1.210845947265625, 1.32965087890625, 1.448455810546875, 1.5672607421875, 1.686065673828125, 1.80487060546875, 1.923675537109375, 2.04248046875, 2.161285400390625, 2.28009033203125, 2.398895263671875, 2.5177001953125, 2.636505126953125, 2.75531005859375, 2.874114990234375, 2.992919921875, 3.111724853515625, 3.23052978515625, 3.349334716796875, 3.4681396484375, 3.586944580078125, 3.70574951171875, 3.824554443359375, 3.943359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 15.0, 5.0, 16.0, 16.0, 18.0, 13.0, 36.0, 41.0, 56.0, 101.0, 140.0, 302.0, 644.0, 1920.0, 12488.0, 638316.0, 381965.0, 9611.0, 1536.0, 575.0, 255.0, 131.0, 101.0, 68.0, 37.0, 37.0, 19.0, 18.0, 10.0, 10.0, 11.0, 1.0, 9.0, 5.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.19140625, -2.122802734375, -2.05419921875, -1.985595703125, -1.9169921875, -1.848388671875, -1.77978515625, -1.711181640625, -1.642578125, -1.573974609375, -1.50537109375, -1.436767578125, -1.3681640625, -1.299560546875, -1.23095703125, -1.162353515625, -1.09375, -1.025146484375, -0.95654296875, -0.887939453125, -0.8193359375, -0.750732421875, -0.68212890625, -0.613525390625, -0.544921875, -0.476318359375, -0.40771484375, -0.339111328125, -0.2705078125, -0.201904296875, -0.13330078125, -0.064697265625, 0.00390625, 0.072509765625, 0.14111328125, 0.209716796875, 0.2783203125, 0.346923828125, 0.41552734375, 0.484130859375, 0.552734375, 0.621337890625, 0.68994140625, 0.758544921875, 0.8271484375, 0.895751953125, 0.96435546875, 1.032958984375, 1.1015625, 1.170166015625, 1.23876953125, 1.307373046875, 1.3759765625, 1.444580078125, 1.51318359375, 1.581787109375, 1.650390625, 1.718994140625, 1.78759765625, 1.856201171875, 1.9248046875, 1.993408203125, 2.06201171875, 2.130615234375, 2.19921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 8.0, 14.0, 17.0, 22.0, 30.0, 27.0, 40.0, 79.0, 96.0, 128.0, 128.0, 107.0, 67.0, 71.0, 41.0, 23.0, 26.0, 17.0, 7.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002200603485107422, -0.00021378695964813232, -0.00020751357078552246, -0.0002012401819229126, -0.00019496679306030273, -0.00018869340419769287, -0.000182420015335083, -0.00017614662647247314, -0.00016987323760986328, -0.00016359984874725342, -0.00015732645988464355, -0.0001510530710220337, -0.00014477968215942383, -0.00013850629329681396, -0.0001322329044342041, -0.00012595951557159424, -0.00011968612670898438, -0.00011341273784637451, -0.00010713934898376465, -0.00010086596012115479, -9.459257125854492e-05, -8.831918239593506e-05, -8.20457935333252e-05, -7.577240467071533e-05, -6.949901580810547e-05, -6.32256269454956e-05, -5.695223808288574e-05, -5.067884922027588e-05, -4.4405460357666016e-05, -3.813207149505615e-05, -3.185868263244629e-05, -2.5585293769836426e-05, -1.9311904907226562e-05, -1.30385160446167e-05, -6.765127182006836e-06, -4.917383193969727e-07, 5.781650543212891e-06, 1.2055039405822754e-05, 1.8328428268432617e-05, 2.460181713104248e-05, 3.0875205993652344e-05, 3.714859485626221e-05, 4.342198371887207e-05, 4.9695372581481934e-05, 5.59687614440918e-05, 6.224215030670166e-05, 6.851553916931152e-05, 7.478892803192139e-05, 8.106231689453125e-05, 8.733570575714111e-05, 9.360909461975098e-05, 9.988248348236084e-05, 0.0001061558723449707, 0.00011242926120758057, 0.00011870265007019043, 0.0001249760389328003, 0.00013124942779541016, 0.00013752281665802002, 0.00014379620552062988, 0.00015006959438323975, 0.0001563429832458496, 0.00016261637210845947, 0.00016888976097106934, 0.0001751631498336792, 0.00018143653869628906]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 10.0, 9.0, 12.0, 22.0, 31.0, 36.0, 88.0, 104.0, 217.0, 357.0, 868.0, 2664.0, 17312.0, 607270.0, 402075.0, 13623.0, 2265.0, 784.0, 371.0, 168.0, 92.0, 56.0, 37.0, 21.0, 13.0, 18.0, 4.0, 5.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4140625, -1.355010986328125, -1.29595947265625, -1.236907958984375, -1.1778564453125, -1.118804931640625, -1.05975341796875, -1.000701904296875, -0.941650390625, -0.882598876953125, -0.82354736328125, -0.764495849609375, -0.7054443359375, -0.646392822265625, -0.58734130859375, -0.528289794921875, -0.46923828125, -0.410186767578125, -0.35113525390625, -0.292083740234375, -0.2330322265625, -0.173980712890625, -0.11492919921875, -0.055877685546875, 0.003173828125, 0.062225341796875, 0.12127685546875, 0.180328369140625, 0.2393798828125, 0.298431396484375, 0.35748291015625, 0.416534423828125, 0.4755859375, 0.534637451171875, 0.59368896484375, 0.652740478515625, 0.7117919921875, 0.770843505859375, 0.82989501953125, 0.888946533203125, 0.947998046875, 1.007049560546875, 1.06610107421875, 1.125152587890625, 1.1842041015625, 1.243255615234375, 1.30230712890625, 1.361358642578125, 1.42041015625, 1.479461669921875, 1.53851318359375, 1.597564697265625, 1.6566162109375, 1.715667724609375, 1.77471923828125, 1.833770751953125, 1.892822265625, 1.951873779296875, 2.01092529296875, 2.069976806640625, 2.1290283203125, 2.188079833984375, 2.24713134765625, 2.306182861328125, 2.365234375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 7.0, 8.0, 6.0, 7.0, 17.0, 22.0, 47.0, 78.0, 90.0, 130.0, 155.0, 140.0, 94.0, 64.0, 51.0, 20.0, 26.0, 14.0, 10.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.822265625, -1.771026611328125, -1.71978759765625, -1.668548583984375, -1.6173095703125, -1.566070556640625, -1.51483154296875, -1.463592529296875, -1.412353515625, -1.361114501953125, -1.30987548828125, -1.258636474609375, -1.2073974609375, -1.156158447265625, -1.10491943359375, -1.053680419921875, -1.00244140625, -0.951202392578125, -0.89996337890625, -0.848724365234375, -0.7974853515625, -0.746246337890625, -0.69500732421875, -0.643768310546875, -0.592529296875, -0.541290283203125, -0.49005126953125, -0.438812255859375, -0.3875732421875, -0.336334228515625, -0.28509521484375, -0.233856201171875, -0.1826171875, -0.131378173828125, -0.08013916015625, -0.028900146484375, 0.0223388671875, 0.073577880859375, 0.12481689453125, 0.176055908203125, 0.227294921875, 0.278533935546875, 0.32977294921875, 0.381011962890625, 0.4322509765625, 0.483489990234375, 0.53472900390625, 0.585968017578125, 0.63720703125, 0.688446044921875, 0.73968505859375, 0.790924072265625, 0.8421630859375, 0.893402099609375, 0.94464111328125, 0.995880126953125, 1.047119140625, 1.098358154296875, 1.14959716796875, 1.200836181640625, 1.2520751953125, 1.303314208984375, 1.35455322265625, 1.405792236328125, 1.45703125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 12.0, 53.0, 241.0, 486.0, 181.0, 24.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.10023498535156, -46.34389877319336, -44.587562561035156, -42.83123016357422, -41.074893951416016, -39.31855773925781, -37.56222152709961, -35.805885314941406, -34.04955291748047, -32.293216705322266, -30.536882400512695, -28.780546188354492, -27.024211883544922, -25.26787567138672, -23.511539459228516, -21.755203247070312, -19.99886703491211, -18.242530822753906, -16.486196517944336, -14.729860305786133, -12.973525047302246, -11.21718978881836, -9.460853576660156, -7.7045183181762695, -5.948183059692383, -4.191847801208496, -2.435512065887451, -0.6791763305664062, 1.0771589279174805, 2.833494186401367, 4.58983039855957, 6.346165657043457, 8.102500915527344, 9.85883617401123, 11.615171432495117, 13.37150764465332, 15.127842903137207, 16.884178161621094, 18.640514373779297, 20.3968505859375, 22.15318489074707, 23.909521102905273, 25.665855407714844, 27.422191619873047, 29.17852783203125, 30.93486213684082, 32.691200256347656, 34.447532653808594, 36.2038688659668, 37.960205078125, 39.7165412902832, 41.472877502441406, 43.229209899902344, 44.98554611206055, 46.74188232421875, 48.49821853637695, 50.254554748535156, 52.01089096069336, 53.76722717285156, 55.5235595703125, 57.2798957824707, 59.036231994628906, 60.79256820678711, 62.54890441894531, 64.30523681640625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 15.0, 22.0, 15.0, 14.0, 21.0, 14.0, 28.0, 34.0, 34.0, 31.0, 42.0, 45.0, 54.0, 29.0, 47.0, 39.0, 48.0, 50.0, 51.0, 35.0, 39.0, 32.0, 26.0, 20.0, 19.0, 32.0, 27.0, 19.0, 16.0, 15.0, 13.0, 9.0, 3.0, 7.0, 5.0, 5.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0], "bins": [-14.294331550598145, -13.854954719543457, -13.41557788848877, -12.976201057434082, -12.536823272705078, -12.09744644165039, -11.658069610595703, -11.218692779541016, -10.779315948486328, -10.33993911743164, -9.900562286376953, -9.461185455322266, -9.021808624267578, -8.58243179321289, -8.143054008483887, -7.703677177429199, -7.264300346374512, -6.824923515319824, -6.385546684265137, -5.946169376373291, -5.5067925453186035, -5.067415714263916, -4.62803840637207, -4.188661575317383, -3.7492847442626953, -3.309907913208008, -2.870530843734741, -2.4311537742614746, -1.991776943206787, -1.5524001121520996, -1.113023042678833, -0.6736459732055664, -0.2342691421508789, 0.20510780811309814, 0.6444847583770752, 1.0838617086410522, 1.5232386589050293, 1.9626154899597168, 2.4019925594329834, 2.84136962890625, 3.2807464599609375, 3.720123291015625, 4.1595001220703125, 4.598877429962158, 5.038254261016846, 5.477631092071533, 5.917008399963379, 6.356385231018066, 6.795762062072754, 7.235138893127441, 7.674515724182129, 8.113892555236816, 8.55327033996582, 8.992647171020508, 9.432024002075195, 9.871400833129883, 10.31077766418457, 10.750154495239258, 11.189531326293945, 11.628908157348633, 12.06828498840332, 12.507661819458008, 12.947039604187012, 13.3864164352417, 13.825793266296387]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 13.0, 12.0, 23.0, 53.0, 75.0, 111.0, 232.0, 425.0, 913.0, 2765.0, 24107.0, 4126240.0, 34236.0, 3070.0, 1011.0, 442.0, 246.0, 114.0, 75.0, 39.0, 23.0, 9.0, 10.0, 8.0, 9.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.12078857421875, -2.9759521484375, -2.83111572265625, -2.686279296875, -2.54144287109375, -2.3966064453125, -2.25177001953125, -2.10693359375, -1.96209716796875, -1.8172607421875, -1.67242431640625, -1.527587890625, -1.38275146484375, -1.2379150390625, -1.09307861328125, -0.9482421875, -0.80340576171875, -0.6585693359375, -0.51373291015625, -0.368896484375, -0.22406005859375, -0.0792236328125, 0.06561279296875, 0.21044921875, 0.35528564453125, 0.5001220703125, 0.64495849609375, 0.789794921875, 0.93463134765625, 1.0794677734375, 1.22430419921875, 1.369140625, 1.51397705078125, 1.6588134765625, 1.80364990234375, 1.948486328125, 2.09332275390625, 2.2381591796875, 2.38299560546875, 2.52783203125, 2.67266845703125, 2.8175048828125, 2.96234130859375, 3.107177734375, 3.25201416015625, 3.3968505859375, 3.54168701171875, 3.6865234375, 3.83135986328125, 3.9761962890625, 4.12103271484375, 4.265869140625, 4.41070556640625, 4.5555419921875, 4.70037841796875, 4.84521484375, 4.99005126953125, 5.1348876953125, 5.27972412109375, 5.424560546875, 5.56939697265625, 5.7142333984375, 5.85906982421875, 6.00390625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 6.0, 16.0, 15.0, 30.0, 29.0, 39.0, 56.0, 77.0, 72.0, 71.0, 101.0, 69.0, 82.0, 70.0, 60.0, 44.0, 45.0, 22.0, 26.0, 13.0, 20.0, 10.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.02886962890625, -0.9893798828125, -0.94989013671875, -0.910400390625, -0.87091064453125, -0.8314208984375, -0.79193115234375, -0.75244140625, -0.71295166015625, -0.6734619140625, -0.63397216796875, -0.594482421875, -0.55499267578125, -0.5155029296875, -0.47601318359375, -0.4365234375, -0.39703369140625, -0.3575439453125, -0.31805419921875, -0.278564453125, -0.23907470703125, -0.1995849609375, -0.16009521484375, -0.12060546875, -0.08111572265625, -0.0416259765625, -0.00213623046875, 0.037353515625, 0.07684326171875, 0.1163330078125, 0.15582275390625, 0.1953125, 0.23480224609375, 0.2742919921875, 0.31378173828125, 0.353271484375, 0.39276123046875, 0.4322509765625, 0.47174072265625, 0.51123046875, 0.55072021484375, 0.5902099609375, 0.62969970703125, 0.669189453125, 0.70867919921875, 0.7481689453125, 0.78765869140625, 0.8271484375, 0.86663818359375, 0.9061279296875, 0.94561767578125, 0.985107421875, 1.02459716796875, 1.0640869140625, 1.10357666015625, 1.14306640625, 1.18255615234375, 1.2220458984375, 1.26153564453125, 1.301025390625, 1.34051513671875, 1.3800048828125, 1.41949462890625, 1.458984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 3.0, 9.0, 19.0, 12.0, 19.0, 42.0, 37.0, 29.0, 52.0, 60.0, 94.0, 125.0, 213.0, 345.0, 728.0, 2014.0, 11538.0, 4043797.0, 127707.0, 4819.0, 1175.0, 550.0, 271.0, 166.0, 91.0, 85.0, 65.0, 33.0, 48.0, 34.0, 13.0, 14.0, 16.0, 9.0, 4.0, 5.0, 6.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.6270751953125, -4.476806640625, -4.3265380859375, -4.17626953125, -4.0260009765625, -3.875732421875, -3.7254638671875, -3.5751953125, -3.4249267578125, -3.274658203125, -3.1243896484375, -2.97412109375, -2.8238525390625, -2.673583984375, -2.5233154296875, -2.373046875, -2.2227783203125, -2.072509765625, -1.9222412109375, -1.77197265625, -1.6217041015625, -1.471435546875, -1.3211669921875, -1.1708984375, -1.0206298828125, -0.870361328125, -0.7200927734375, -0.56982421875, -0.4195556640625, -0.269287109375, -0.1190185546875, 0.03125, 0.1815185546875, 0.331787109375, 0.4820556640625, 0.63232421875, 0.7825927734375, 0.932861328125, 1.0831298828125, 1.2333984375, 1.3836669921875, 1.533935546875, 1.6842041015625, 1.83447265625, 1.9847412109375, 2.135009765625, 2.2852783203125, 2.435546875, 2.5858154296875, 2.736083984375, 2.8863525390625, 3.03662109375, 3.1868896484375, 3.337158203125, 3.4874267578125, 3.6376953125, 3.7879638671875, 3.938232421875, 4.0885009765625, 4.23876953125, 4.3890380859375, 4.539306640625, 4.6895751953125, 4.83984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 18.0, 65.0, 656.0, 3172.0, 110.0, 28.0, 13.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.0078125, -3.929473876953125, -3.85113525390625, -3.772796630859375, -3.6944580078125, -3.616119384765625, -3.53778076171875, -3.459442138671875, -3.381103515625, -3.302764892578125, -3.22442626953125, -3.146087646484375, -3.0677490234375, -2.989410400390625, -2.91107177734375, -2.832733154296875, -2.75439453125, -2.676055908203125, -2.59771728515625, -2.519378662109375, -2.4410400390625, -2.362701416015625, -2.28436279296875, -2.206024169921875, -2.127685546875, -2.049346923828125, -1.97100830078125, -1.892669677734375, -1.8143310546875, -1.735992431640625, -1.65765380859375, -1.579315185546875, -1.5009765625, -1.422637939453125, -1.34429931640625, -1.265960693359375, -1.1876220703125, -1.109283447265625, -1.03094482421875, -0.952606201171875, -0.874267578125, -0.795928955078125, -0.71759033203125, -0.639251708984375, -0.5609130859375, -0.482574462890625, -0.40423583984375, -0.325897216796875, -0.24755859375, -0.169219970703125, -0.09088134765625, -0.012542724609375, 0.0657958984375, 0.144134521484375, 0.22247314453125, 0.300811767578125, 0.379150390625, 0.457489013671875, 0.53582763671875, 0.614166259765625, 0.6925048828125, 0.770843505859375, 0.84918212890625, 0.927520751953125, 1.005859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 26.0, 82.0, 229.0, 317.0, 195.0, 68.0, 43.0, 14.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.72571086883545, -12.409829139709473, -12.093947410583496, -11.778066635131836, -11.46218490600586, -11.146303176879883, -10.830421447753906, -10.51453971862793, -10.19865894317627, -9.882777214050293, -9.566895484924316, -9.251014709472656, -8.93513298034668, -8.619251251220703, -8.303369522094727, -7.987488269805908, -7.671606540679932, -7.355724811553955, -7.039843559265137, -6.72396183013916, -6.408080577850342, -6.092198848724365, -5.776317596435547, -5.46043586730957, -5.144554138183594, -4.828672409057617, -4.512791156768799, -4.196909427642822, -3.881028175354004, -3.5651464462280273, -3.24926495552063, -2.9333834648132324, -2.6175026893615723, -2.301621198654175, -1.9857397079467773, -1.6698580980300903, -1.3539766073226929, -1.0380951166152954, -0.7222135066986084, -0.40633201599121094, -0.09045052528381348, 0.22543099522590637, 0.5413125157356262, 0.8571940660476685, 1.173075556755066, 1.4889570474624634, 1.8048386573791504, 2.120720148086548, 2.4366016387939453, 2.7524831295013428, 3.0683646202087402, 3.384246349334717, 3.700127601623535, 4.016009330749512, 4.331891059875488, 4.647772312164307, 4.963653564453125, 5.279535293579102, 5.59541654586792, 5.9112982749938965, 6.227179527282715, 6.543061256408691, 6.858942985534668, 7.174824237823486, 7.490705966949463]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 14.0, 14.0, 7.0, 16.0, 15.0, 24.0, 21.0, 34.0, 63.0, 46.0, 64.0, 60.0, 59.0, 65.0, 66.0, 60.0, 49.0, 51.0, 47.0, 42.0, 38.0, 44.0, 23.0, 26.0, 10.0, 12.0, 7.0, 7.0, 8.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.124757766723633, -5.965134620666504, -5.805510997772217, -5.645887851715088, -5.486264228820801, -5.326641082763672, -5.167017936706543, -5.007394790649414, -4.847771167755127, -4.688148021697998, -4.528524398803711, -4.368901252746582, -4.209278106689453, -4.049654483795166, -3.890031337738037, -3.730407953262329, -3.570784568786621, -3.411161184310913, -3.251537799835205, -3.091914653778076, -2.932291269302368, -2.77266788482666, -2.6130447387695312, -2.4534213542938232, -2.2937979698181152, -2.1341745853424072, -1.9745513200759888, -1.8149280548095703, -1.6553046703338623, -1.4956812858581543, -1.3360580205917358, -1.1764347553253174, -1.0168113708496094, -0.8571880459785461, -0.6975647211074829, -0.5379413962364197, -0.37831807136535645, -0.2186947464942932, -0.05907142162322998, 0.10055184364318848, 0.2601752281188965, 0.4197985529899597, 0.579421877861023, 0.7390452027320862, 0.8986685276031494, 1.0582919120788574, 1.2179151773452759, 1.3775384426116943, 1.5371618270874023, 1.6967852115631104, 1.8564084768295288, 2.0160317420959473, 2.1756551265716553, 2.3352785110473633, 2.494901657104492, 2.6545250415802, 2.814148426055908, 2.973771810531616, 3.133395195007324, 3.293018341064453, 3.452641725540161, 3.612265110015869, 3.771888256072998, 3.931511640548706, 4.091135025024414]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 21.0, 25.0, 46.0, 73.0, 137.0, 264.0, 555.0, 1444.0, 4905.0, 26790.0, 257524.0, 660762.0, 80762.0, 10829.0, 2633.0, 973.0, 367.0, 183.0, 95.0, 59.0, 33.0, 20.0, 11.0, 12.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30078125, -3.187957763671875, -3.07513427734375, -2.962310791015625, -2.8494873046875, -2.736663818359375, -2.62384033203125, -2.511016845703125, -2.398193359375, -2.285369873046875, -2.17254638671875, -2.059722900390625, -1.9468994140625, -1.834075927734375, -1.72125244140625, -1.608428955078125, -1.49560546875, -1.382781982421875, -1.26995849609375, -1.157135009765625, -1.0443115234375, -0.931488037109375, -0.81866455078125, -0.705841064453125, -0.593017578125, -0.480194091796875, -0.36737060546875, -0.254547119140625, -0.1417236328125, -0.028900146484375, 0.08392333984375, 0.196746826171875, 0.3095703125, 0.422393798828125, 0.53521728515625, 0.648040771484375, 0.7608642578125, 0.873687744140625, 0.98651123046875, 1.099334716796875, 1.212158203125, 1.324981689453125, 1.43780517578125, 1.550628662109375, 1.6634521484375, 1.776275634765625, 1.88909912109375, 2.001922607421875, 2.11474609375, 2.227569580078125, 2.34039306640625, 2.453216552734375, 2.5660400390625, 2.678863525390625, 2.79168701171875, 2.904510498046875, 3.017333984375, 3.130157470703125, 3.24298095703125, 3.355804443359375, 3.4686279296875, 3.581451416015625, 3.69427490234375, 3.807098388671875, 3.919921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 10.0, 6.0, 7.0, 6.0, 15.0, 15.0, 23.0, 22.0, 35.0, 41.0, 44.0, 56.0, 63.0, 72.0, 68.0, 56.0, 62.0, 68.0, 52.0, 48.0, 45.0, 35.0, 37.0, 26.0, 22.0, 19.0, 12.0, 12.0, 14.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.058074951171875, -1.02337646484375, -0.988677978515625, -0.9539794921875, -0.919281005859375, -0.88458251953125, -0.849884033203125, -0.815185546875, -0.780487060546875, -0.74578857421875, -0.711090087890625, -0.6763916015625, -0.641693115234375, -0.60699462890625, -0.572296142578125, -0.53759765625, -0.502899169921875, -0.46820068359375, -0.433502197265625, -0.3988037109375, -0.364105224609375, -0.32940673828125, -0.294708251953125, -0.260009765625, -0.225311279296875, -0.19061279296875, -0.155914306640625, -0.1212158203125, -0.086517333984375, -0.05181884765625, -0.017120361328125, 0.017578125, 0.052276611328125, 0.08697509765625, 0.121673583984375, 0.1563720703125, 0.191070556640625, 0.22576904296875, 0.260467529296875, 0.295166015625, 0.329864501953125, 0.36456298828125, 0.399261474609375, 0.4339599609375, 0.468658447265625, 0.50335693359375, 0.538055419921875, 0.57275390625, 0.607452392578125, 0.64215087890625, 0.676849365234375, 0.7115478515625, 0.746246337890625, 0.78094482421875, 0.815643310546875, 0.850341796875, 0.885040283203125, 0.91973876953125, 0.954437255859375, 0.9891357421875, 1.023834228515625, 1.05853271484375, 1.093231201171875, 1.1279296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 3.0, 4.0, 7.0, 5.0, 9.0, 18.0, 30.0, 38.0, 70.0, 93.0, 170.0, 323.0, 798.0, 1668.0, 6907.0, 133496.0, 873908.0, 25408.0, 3333.0, 1188.0, 462.0, 253.0, 123.0, 74.0, 52.0, 37.0, 20.0, 18.0, 5.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.28515625, -5.110595703125, -4.93603515625, -4.761474609375, -4.5869140625, -4.412353515625, -4.23779296875, -4.063232421875, -3.888671875, -3.714111328125, -3.53955078125, -3.364990234375, -3.1904296875, -3.015869140625, -2.84130859375, -2.666748046875, -2.4921875, -2.317626953125, -2.14306640625, -1.968505859375, -1.7939453125, -1.619384765625, -1.44482421875, -1.270263671875, -1.095703125, -0.921142578125, -0.74658203125, -0.572021484375, -0.3974609375, -0.222900390625, -0.04833984375, 0.126220703125, 0.30078125, 0.475341796875, 0.64990234375, 0.824462890625, 0.9990234375, 1.173583984375, 1.34814453125, 1.522705078125, 1.697265625, 1.871826171875, 2.04638671875, 2.220947265625, 2.3955078125, 2.570068359375, 2.74462890625, 2.919189453125, 3.09375, 3.268310546875, 3.44287109375, 3.617431640625, 3.7919921875, 3.966552734375, 4.14111328125, 4.315673828125, 4.490234375, 4.664794921875, 4.83935546875, 5.013916015625, 5.1884765625, 5.363037109375, 5.53759765625, 5.712158203125, 5.88671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 1.0, 4.0, 8.0, 10.0, 15.0, 43.0, 39.0, 52.0, 62.0, 82.0, 100.0, 83.0, 82.0, 93.0, 88.0, 65.0, 51.0, 34.0, 24.0, 14.0, 21.0, 13.0, 8.0, 6.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.718994140625, -6.52001953125, -6.321044921875, -6.1220703125, -5.923095703125, -5.72412109375, -5.525146484375, -5.326171875, -5.127197265625, -4.92822265625, -4.729248046875, -4.5302734375, -4.331298828125, -4.13232421875, -3.933349609375, -3.734375, -3.535400390625, -3.33642578125, -3.137451171875, -2.9384765625, -2.739501953125, -2.54052734375, -2.341552734375, -2.142578125, -1.943603515625, -1.74462890625, -1.545654296875, -1.3466796875, -1.147705078125, -0.94873046875, -0.749755859375, -0.55078125, -0.351806640625, -0.15283203125, 0.046142578125, 0.2451171875, 0.444091796875, 0.64306640625, 0.842041015625, 1.041015625, 1.239990234375, 1.43896484375, 1.637939453125, 1.8369140625, 2.035888671875, 2.23486328125, 2.433837890625, 2.6328125, 2.831787109375, 3.03076171875, 3.229736328125, 3.4287109375, 3.627685546875, 3.82666015625, 4.025634765625, 4.224609375, 4.423583984375, 4.62255859375, 4.821533203125, 5.0205078125, 5.219482421875, 5.41845703125, 5.617431640625, 5.81640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 2.0, 5.0, 8.0, 5.0, 17.0, 19.0, 41.0, 48.0, 79.0, 109.0, 191.0, 318.0, 650.0, 1562.0, 5063.0, 22197.0, 168527.0, 736332.0, 92754.0, 14415.0, 3653.0, 1249.0, 552.0, 292.0, 155.0, 101.0, 71.0, 37.0, 24.0, 18.0, 9.0, 7.0, 11.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.1181640625, -1.0836181640625, -1.049072265625, -1.0145263671875, -0.97998046875, -0.9454345703125, -0.910888671875, -0.8763427734375, -0.841796875, -0.8072509765625, -0.772705078125, -0.7381591796875, -0.70361328125, -0.6690673828125, -0.634521484375, -0.5999755859375, -0.5654296875, -0.5308837890625, -0.496337890625, -0.4617919921875, -0.42724609375, -0.3927001953125, -0.358154296875, -0.3236083984375, -0.2890625, -0.2545166015625, -0.219970703125, -0.1854248046875, -0.15087890625, -0.1163330078125, -0.081787109375, -0.0472412109375, -0.0126953125, 0.0218505859375, 0.056396484375, 0.0909423828125, 0.12548828125, 0.1600341796875, 0.194580078125, 0.2291259765625, 0.263671875, 0.2982177734375, 0.332763671875, 0.3673095703125, 0.40185546875, 0.4364013671875, 0.470947265625, 0.5054931640625, 0.5400390625, 0.5745849609375, 0.609130859375, 0.6436767578125, 0.67822265625, 0.7127685546875, 0.747314453125, 0.7818603515625, 0.81640625, 0.8509521484375, 0.885498046875, 0.9200439453125, 0.95458984375, 0.9891357421875, 1.023681640625, 1.0582275390625, 1.0927734375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 12.0, 13.0, 15.0, 16.0, 25.0, 37.0, 41.0, 56.0, 85.0, 153.0, 171.0, 94.0, 67.0, 43.0, 34.0, 26.0, 28.0, 14.0, 10.0, 12.0, 13.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003161430358886719, -0.00030786171555519104, -0.0002995803952217102, -0.00029129907488822937, -0.00028301775455474854, -0.0002747364342212677, -0.00026645511388778687, -0.00025817379355430603, -0.0002498924732208252, -0.00024161115288734436, -0.00023332983255386353, -0.0002250485122203827, -0.00021676719188690186, -0.00020848587155342102, -0.00020020455121994019, -0.00019192323088645935, -0.00018364191055297852, -0.00017536059021949768, -0.00016707926988601685, -0.000158797949552536, -0.00015051662921905518, -0.00014223530888557434, -0.0001339539885520935, -0.00012567266821861267, -0.00011739134788513184, -0.000109110027551651, -0.00010082870721817017, -9.254738688468933e-05, -8.42660665512085e-05, -7.598474621772766e-05, -6.770342588424683e-05, -5.942210555076599e-05, -5.1140785217285156e-05, -4.285946488380432e-05, -3.4578144550323486e-05, -2.629682421684265e-05, -1.8015503883361816e-05, -9.734183549880981e-06, -1.4528632164001465e-06, 6.8284571170806885e-06, 1.5109777450561523e-05, 2.339109778404236e-05, 3.167241811752319e-05, 3.995373845100403e-05, 4.823505878448486e-05, 5.65163791179657e-05, 6.479769945144653e-05, 7.307901978492737e-05, 8.13603401184082e-05, 8.964166045188904e-05, 9.792298078536987e-05, 0.00010620430111885071, 0.00011448562145233154, 0.00012276694178581238, 0.0001310482621192932, 0.00013932958245277405, 0.00014761090278625488, 0.00015589222311973572, 0.00016417354345321655, 0.0001724548637866974, 0.00018073618412017822, 0.00018901750445365906, 0.0001972988247871399, 0.00020558014512062073, 0.00021386146545410156]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 13.0, 7.0, 19.0, 14.0, 37.0, 33.0, 76.0, 107.0, 190.0, 328.0, 485.0, 1085.0, 2765.0, 9987.0, 59542.0, 706190.0, 235176.0, 23622.0, 5323.0, 1772.0, 747.0, 400.0, 219.0, 129.0, 97.0, 65.0, 39.0, 16.0, 27.0, 12.0, 7.0, 11.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9755859375, -0.9377288818359375, -0.899871826171875, -0.8620147705078125, -0.82415771484375, -0.7863006591796875, -0.748443603515625, -0.7105865478515625, -0.6727294921875, -0.6348724365234375, -0.597015380859375, -0.5591583251953125, -0.52130126953125, -0.4834442138671875, -0.445587158203125, -0.4077301025390625, -0.369873046875, -0.3320159912109375, -0.294158935546875, -0.2563018798828125, -0.21844482421875, -0.1805877685546875, -0.142730712890625, -0.1048736572265625, -0.0670166015625, -0.0291595458984375, 0.008697509765625, 0.0465545654296875, 0.08441162109375, 0.1222686767578125, 0.160125732421875, 0.1979827880859375, 0.23583984375, 0.2736968994140625, 0.311553955078125, 0.3494110107421875, 0.38726806640625, 0.4251251220703125, 0.462982177734375, 0.5008392333984375, 0.5386962890625, 0.5765533447265625, 0.614410400390625, 0.6522674560546875, 0.69012451171875, 0.7279815673828125, 0.765838623046875, 0.8036956787109375, 0.841552734375, 0.8794097900390625, 0.917266845703125, 0.9551239013671875, 0.99298095703125, 1.0308380126953125, 1.068695068359375, 1.1065521240234375, 1.1444091796875, 1.1822662353515625, 1.220123291015625, 1.2579803466796875, 1.29583740234375, 1.3336944580078125, 1.371551513671875, 1.4094085693359375, 1.447265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 10.0, 16.0, 26.0, 16.0, 23.0, 27.0, 41.0, 61.0, 87.0, 96.0, 100.0, 93.0, 93.0, 52.0, 56.0, 40.0, 33.0, 25.0, 17.0, 21.0, 13.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9970703125, -0.9666748046875, -0.936279296875, -0.9058837890625, -0.87548828125, -0.8450927734375, -0.814697265625, -0.7843017578125, -0.75390625, -0.7235107421875, -0.693115234375, -0.6627197265625, -0.63232421875, -0.6019287109375, -0.571533203125, -0.5411376953125, -0.5107421875, -0.4803466796875, -0.449951171875, -0.4195556640625, -0.38916015625, -0.3587646484375, -0.328369140625, -0.2979736328125, -0.267578125, -0.2371826171875, -0.206787109375, -0.1763916015625, -0.14599609375, -0.1156005859375, -0.085205078125, -0.0548095703125, -0.0244140625, 0.0059814453125, 0.036376953125, 0.0667724609375, 0.09716796875, 0.1275634765625, 0.157958984375, 0.1883544921875, 0.21875, 0.2491455078125, 0.279541015625, 0.3099365234375, 0.34033203125, 0.3707275390625, 0.401123046875, 0.4315185546875, 0.4619140625, 0.4923095703125, 0.522705078125, 0.5531005859375, 0.58349609375, 0.6138916015625, 0.644287109375, 0.6746826171875, 0.705078125, 0.7354736328125, 0.765869140625, 0.7962646484375, 0.82666015625, 0.8570556640625, 0.887451171875, 0.9178466796875, 0.9482421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 24.0, 93.0, 167.0, 297.0, 245.0, 103.0, 36.0, 16.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.54161834716797, -49.354942321777344, -48.16826248168945, -46.98158645629883, -45.79490661621094, -44.60823059082031, -43.42155456542969, -42.23487854003906, -41.04819869995117, -39.86152267456055, -38.674842834472656, -37.48816680908203, -36.301490783691406, -35.114810943603516, -33.92813491821289, -32.741455078125, -31.554779052734375, -30.368101119995117, -29.18142318725586, -27.994747161865234, -26.808069229125977, -25.62139129638672, -24.434715270996094, -23.248037338256836, -22.061359405517578, -20.87468147277832, -19.688003540039062, -18.501327514648438, -17.31464958190918, -16.127971649169922, -14.94129467010498, -13.754617691040039, -12.567939758300781, -11.381261825561523, -10.194584846496582, -9.00790786743164, -7.821229934692383, -6.634552478790283, -5.447875022888184, -4.261198043823242, -3.0745201110839844, -1.8878426551818848, -0.7011651992797852, 0.48551225662231445, 1.672189712524414, 2.8588671684265137, 4.045544624328613, 5.232221603393555, 6.4188995361328125, 7.605576992034912, 8.792254447937012, 9.978931427001953, 11.165609359741211, 12.352287292480469, 13.53896427154541, 14.725641250610352, 15.91231918334961, 17.098997116088867, 18.285675048828125, 19.47235107421875, 20.659029006958008, 21.845706939697266, 23.03238296508789, 24.21906089782715, 25.405738830566406]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 13.0, 3.0, 10.0, 11.0, 5.0, 12.0, 8.0, 16.0, 20.0, 28.0, 21.0, 23.0, 25.0, 38.0, 36.0, 47.0, 45.0, 44.0, 47.0, 52.0, 45.0, 44.0, 52.0, 46.0, 32.0, 32.0, 25.0, 36.0, 30.0, 20.0, 23.0, 18.0, 18.0, 12.0, 9.0, 11.0, 9.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-13.95029067993164, -13.510836601257324, -13.071383476257324, -12.631929397583008, -12.192475318908691, -11.753021240234375, -11.313568115234375, -10.874114036560059, -10.434659957885742, -9.995205879211426, -9.555752754211426, -9.11629867553711, -8.676844596862793, -8.237390518188477, -7.797937393188477, -7.35848331451416, -6.91903018951416, -6.479576587677002, -6.0401225090026855, -5.600668907165527, -5.161214828491211, -4.721761226654053, -4.2823076248168945, -3.8428537845611572, -3.40339994430542, -2.9639461040496826, -2.5244922637939453, -2.085038661956787, -1.6455848217010498, -1.2061309814453125, -0.7666773796081543, -0.327223539352417, 0.11223030090332031, 0.5516840815544128, 0.9911378622055054, 1.4305915832519531, 1.8700454235076904, 2.3094992637634277, 2.748952865600586, 3.1884067058563232, 3.6278605461120605, 4.067314147949219, 4.506768226623535, 4.946221828460693, 5.385675430297852, 5.825129508972168, 6.264583110809326, 6.704036712646484, 7.143490791320801, 7.582944393157959, 8.022397994995117, 8.461852073669434, 8.90130615234375, 9.34075927734375, 9.780213356018066, 10.219667434692383, 10.659120559692383, 11.0985746383667, 11.5380277633667, 11.977481842041016, 12.416935920715332, 12.856389999389648, 13.295843124389648, 13.735297203063965, 14.174751281738281]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 8.0, 3.0, 2.0, 7.0, 6.0, 31.0, 33.0, 56.0, 103.0, 195.0, 355.0, 818.0, 1950.0, 5724.0, 27201.0, 987052.0, 3111235.0, 46887.0, 8000.0, 2548.0, 1011.0, 427.0, 254.0, 117.0, 61.0, 62.0, 36.0, 23.0, 16.0, 12.0, 10.0, 6.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.736328125, -1.657867431640625, -1.57940673828125, -1.500946044921875, -1.4224853515625, -1.344024658203125, -1.26556396484375, -1.187103271484375, -1.108642578125, -1.030181884765625, -0.95172119140625, -0.873260498046875, -0.7947998046875, -0.716339111328125, -0.63787841796875, -0.559417724609375, -0.48095703125, -0.402496337890625, -0.32403564453125, -0.245574951171875, -0.1671142578125, -0.088653564453125, -0.01019287109375, 0.068267822265625, 0.146728515625, 0.225189208984375, 0.30364990234375, 0.382110595703125, 0.4605712890625, 0.539031982421875, 0.61749267578125, 0.695953369140625, 0.7744140625, 0.852874755859375, 0.93133544921875, 1.009796142578125, 1.0882568359375, 1.166717529296875, 1.24517822265625, 1.323638916015625, 1.402099609375, 1.480560302734375, 1.55902099609375, 1.637481689453125, 1.7159423828125, 1.794403076171875, 1.87286376953125, 1.951324462890625, 2.02978515625, 2.108245849609375, 2.18670654296875, 2.265167236328125, 2.3436279296875, 2.422088623046875, 2.50054931640625, 2.579010009765625, 2.657470703125, 2.735931396484375, 2.81439208984375, 2.892852783203125, 2.9713134765625, 3.049774169921875, 3.12823486328125, 3.206695556640625, 3.28515625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 12.0, 17.0, 29.0, 36.0, 44.0, 52.0, 43.0, 65.0, 76.0, 78.0, 70.0, 72.0, 69.0, 55.0, 62.0, 43.0, 41.0, 28.0, 19.0, 20.0, 18.0, 12.0, 12.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.07177734375, -1.0341796875, -0.99658203125, -0.958984375, -0.92138671875, -0.8837890625, -0.84619140625, -0.80859375, -0.77099609375, -0.7333984375, -0.69580078125, -0.658203125, -0.62060546875, -0.5830078125, -0.54541015625, -0.5078125, -0.47021484375, -0.4326171875, -0.39501953125, -0.357421875, -0.31982421875, -0.2822265625, -0.24462890625, -0.20703125, -0.16943359375, -0.1318359375, -0.09423828125, -0.056640625, -0.01904296875, 0.0185546875, 0.05615234375, 0.09375, 0.13134765625, 0.1689453125, 0.20654296875, 0.244140625, 0.28173828125, 0.3193359375, 0.35693359375, 0.39453125, 0.43212890625, 0.4697265625, 0.50732421875, 0.544921875, 0.58251953125, 0.6201171875, 0.65771484375, 0.6953125, 0.73291015625, 0.7705078125, 0.80810546875, 0.845703125, 0.88330078125, 0.9208984375, 0.95849609375, 0.99609375, 1.03369140625, 1.0712890625, 1.10888671875, 1.146484375, 1.18408203125, 1.2216796875, 1.25927734375, 1.296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 6.0, 16.0, 23.0, 38.0, 82.0, 262.0, 1252.0, 8280.0, 119302.0, 3980353.0, 76592.0, 6545.0, 1089.0, 290.0, 85.0, 32.0, 12.0, 5.0, 8.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.902313232421875, -3.78900146484375, -3.675689697265625, -3.5623779296875, -3.449066162109375, -3.33575439453125, -3.222442626953125, -3.109130859375, -2.995819091796875, -2.88250732421875, -2.769195556640625, -2.6558837890625, -2.542572021484375, -2.42926025390625, -2.315948486328125, -2.20263671875, -2.089324951171875, -1.97601318359375, -1.862701416015625, -1.7493896484375, -1.636077880859375, -1.52276611328125, -1.409454345703125, -1.296142578125, -1.182830810546875, -1.06951904296875, -0.956207275390625, -0.8428955078125, -0.729583740234375, -0.61627197265625, -0.502960205078125, -0.3896484375, -0.276336669921875, -0.16302490234375, -0.049713134765625, 0.0635986328125, 0.176910400390625, 0.29022216796875, 0.403533935546875, 0.516845703125, 0.630157470703125, 0.74346923828125, 0.856781005859375, 0.9700927734375, 1.083404541015625, 1.19671630859375, 1.310028076171875, 1.42333984375, 1.536651611328125, 1.64996337890625, 1.763275146484375, 1.8765869140625, 1.989898681640625, 2.10321044921875, 2.216522216796875, 2.329833984375, 2.443145751953125, 2.55645751953125, 2.669769287109375, 2.7830810546875, 2.896392822265625, 3.00970458984375, 3.123016357421875, 3.236328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 7.0, 8.0, 12.0, 19.0, 21.0, 28.0, 55.0, 85.0, 154.0, 360.0, 960.0, 1212.0, 605.0, 244.0, 107.0, 58.0, 41.0, 25.0, 19.0, 10.0, 7.0, 4.0, 7.0, 5.0, 2.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.703125, -1.632843017578125, -1.56256103515625, -1.492279052734375, -1.4219970703125, -1.351715087890625, -1.28143310546875, -1.211151123046875, -1.140869140625, -1.070587158203125, -1.00030517578125, -0.930023193359375, -0.8597412109375, -0.789459228515625, -0.71917724609375, -0.648895263671875, -0.57861328125, -0.508331298828125, -0.43804931640625, -0.367767333984375, -0.2974853515625, -0.227203369140625, -0.15692138671875, -0.086639404296875, -0.016357421875, 0.053924560546875, 0.12420654296875, 0.194488525390625, 0.2647705078125, 0.335052490234375, 0.40533447265625, 0.475616455078125, 0.5458984375, 0.616180419921875, 0.68646240234375, 0.756744384765625, 0.8270263671875, 0.897308349609375, 0.96759033203125, 1.037872314453125, 1.108154296875, 1.178436279296875, 1.24871826171875, 1.319000244140625, 1.3892822265625, 1.459564208984375, 1.52984619140625, 1.600128173828125, 1.67041015625, 1.740692138671875, 1.81097412109375, 1.881256103515625, 1.9515380859375, 2.021820068359375, 2.09210205078125, 2.162384033203125, 2.232666015625, 2.302947998046875, 2.37322998046875, 2.443511962890625, 2.5137939453125, 2.584075927734375, 2.65435791015625, 2.724639892578125, 2.794921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 8.0, 14.0, 44.0, 83.0, 154.0, 195.0, 196.0, 126.0, 74.0, 45.0, 16.0, 16.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.387663841247559, -13.848751068115234, -13.30983829498291, -12.770925521850586, -12.232012748718262, -11.693099975585938, -11.154186248779297, -10.615274429321289, -10.076360702514648, -9.537447929382324, -8.99853515625, -8.459622383117676, -7.920709609985352, -7.381796836853027, -6.842883586883545, -6.303970813751221, -5.765058517456055, -5.2261457443237305, -4.687232971191406, -4.148320198059082, -3.6094071865081787, -3.0704944133758545, -2.531581401824951, -1.992668628692627, -1.4537558555603027, -0.9148430228233337, -0.37593019008636475, 0.16298270225524902, 0.7018954753875732, 1.2408082485198975, 1.7797212600708008, 2.318634033203125, 2.8575477600097656, 3.39646053314209, 3.935373306274414, 4.474286079406738, 5.0131988525390625, 5.552111625671387, 6.091024875640869, 6.629937648773193, 7.168850421905518, 7.707763195037842, 8.246676445007324, 8.785589218139648, 9.324501991271973, 9.863414764404297, 10.402327537536621, 10.941240310668945, 11.48015308380127, 12.019065856933594, 12.557978630065918, 13.096891403198242, 13.635804176330566, 14.17471694946289, 14.713630676269531, 15.252542495727539, 15.79145622253418, 16.33036994934082, 16.869281768798828, 17.40819549560547, 17.947107315063477, 18.486021041870117, 19.024932861328125, 19.563846588134766, 20.102758407592773]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 11.0, 17.0, 15.0, 19.0, 18.0, 22.0, 23.0, 27.0, 27.0, 50.0, 33.0, 51.0, 56.0, 35.0, 33.0, 47.0, 48.0, 41.0, 53.0, 39.0, 32.0, 41.0, 26.0, 26.0, 41.0, 20.0, 28.0, 10.0, 9.0, 7.0, 12.0, 11.0, 5.0, 7.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.431278228759766, -7.219869136810303, -7.008459568023682, -6.797050476074219, -6.585641384124756, -6.374232292175293, -6.162822723388672, -5.951413631439209, -5.740004539489746, -5.528595447540283, -5.317185878753662, -5.105776786804199, -4.894367694854736, -4.682958602905273, -4.471549034118652, -4.2601399421691895, -4.048730373382568, -3.8373210430145264, -3.6259119510650635, -3.4145026206970215, -3.2030935287475586, -2.9916841983795166, -2.7802748680114746, -2.5688657760620117, -2.3574564456939697, -2.1460471153259277, -1.9346380233764648, -1.7232286930084229, -1.5118194818496704, -1.300410270690918, -1.089000940322876, -0.8775917291641235, -0.6661825180053711, -0.45477327704429626, -0.24336403608322144, -0.03195476531982422, 0.17945444583892822, 0.39086365699768066, 0.6022729873657227, 0.8136821985244751, 1.0250914096832275, 1.23650062084198, 1.4479098320007324, 1.6593191623687744, 1.8707283735275269, 2.0821375846862793, 2.2935469150543213, 2.5049562454223633, 2.716365337371826, 2.927774667739868, 3.139183759689331, 3.350593090057373, 3.562002182006836, 3.773411512374878, 3.98482084274292, 4.196229934692383, 4.407639503479004, 4.619048595428467, 4.830458164215088, 5.041867256164551, 5.253276348114014, 5.464685440063477, 5.676095008850098, 5.8875041007995605, 6.098913192749023]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 2.0, 7.0, 12.0, 14.0, 14.0, 20.0, 46.0, 71.0, 171.0, 332.0, 916.0, 2620.0, 9705.0, 57378.0, 571653.0, 357902.0, 37340.0, 7043.0, 1994.0, 711.0, 307.0, 135.0, 64.0, 32.0, 31.0, 15.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.769378662109375, -2.67352294921875, -2.577667236328125, -2.4818115234375, -2.385955810546875, -2.29010009765625, -2.194244384765625, -2.098388671875, -2.002532958984375, -1.90667724609375, -1.810821533203125, -1.7149658203125, -1.619110107421875, -1.52325439453125, -1.427398681640625, -1.33154296875, -1.235687255859375, -1.13983154296875, -1.043975830078125, -0.9481201171875, -0.852264404296875, -0.75640869140625, -0.660552978515625, -0.564697265625, -0.468841552734375, -0.37298583984375, -0.277130126953125, -0.1812744140625, -0.085418701171875, 0.01043701171875, 0.106292724609375, 0.2021484375, 0.298004150390625, 0.39385986328125, 0.489715576171875, 0.5855712890625, 0.681427001953125, 0.77728271484375, 0.873138427734375, 0.968994140625, 1.064849853515625, 1.16070556640625, 1.256561279296875, 1.3524169921875, 1.448272705078125, 1.54412841796875, 1.639984130859375, 1.73583984375, 1.831695556640625, 1.92755126953125, 2.023406982421875, 2.1192626953125, 2.215118408203125, 2.31097412109375, 2.406829833984375, 2.502685546875, 2.598541259765625, 2.69439697265625, 2.790252685546875, 2.8861083984375, 2.981964111328125, 3.07781982421875, 3.173675537109375, 3.26953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 8.0, 13.0, 22.0, 23.0, 24.0, 35.0, 39.0, 52.0, 44.0, 49.0, 58.0, 59.0, 60.0, 51.0, 66.0, 55.0, 58.0, 47.0, 42.0, 31.0, 24.0, 25.0, 19.0, 20.0, 7.0, 14.0, 9.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.115234375, -1.0856170654296875, -1.055999755859375, -1.0263824462890625, -0.99676513671875, -0.9671478271484375, -0.937530517578125, -0.9079132080078125, -0.8782958984375, -0.8486785888671875, -0.819061279296875, -0.7894439697265625, -0.75982666015625, -0.7302093505859375, -0.700592041015625, -0.6709747314453125, -0.641357421875, -0.6117401123046875, -0.582122802734375, -0.5525054931640625, -0.52288818359375, -0.4932708740234375, -0.463653564453125, -0.4340362548828125, -0.4044189453125, -0.3748016357421875, -0.345184326171875, -0.3155670166015625, -0.28594970703125, -0.2563323974609375, -0.226715087890625, -0.1970977783203125, -0.16748046875, -0.1378631591796875, -0.108245849609375, -0.0786285400390625, -0.04901123046875, -0.0193939208984375, 0.010223388671875, 0.0398406982421875, 0.0694580078125, 0.0990753173828125, 0.128692626953125, 0.1583099365234375, 0.18792724609375, 0.2175445556640625, 0.247161865234375, 0.2767791748046875, 0.306396484375, 0.3360137939453125, 0.365631103515625, 0.3952484130859375, 0.42486572265625, 0.4544830322265625, 0.484100341796875, 0.5137176513671875, 0.5433349609375, 0.5729522705078125, 0.602569580078125, 0.6321868896484375, 0.66180419921875, 0.6914215087890625, 0.721038818359375, 0.7506561279296875, 0.7802734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 13.0, 7.0, 9.0, 16.0, 44.0, 48.0, 72.0, 119.0, 225.0, 343.0, 870.0, 2404.0, 10256.0, 169535.0, 827253.0, 30392.0, 4263.0, 1359.0, 570.0, 299.0, 152.0, 110.0, 57.0, 30.0, 19.0, 18.0, 17.0, 6.0, 5.0, 8.0, 2.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.046875, -4.89947509765625, -4.7520751953125, -4.60467529296875, -4.457275390625, -4.30987548828125, -4.1624755859375, -4.01507568359375, -3.86767578125, -3.72027587890625, -3.5728759765625, -3.42547607421875, -3.278076171875, -3.13067626953125, -2.9832763671875, -2.83587646484375, -2.6884765625, -2.54107666015625, -2.3936767578125, -2.24627685546875, -2.098876953125, -1.95147705078125, -1.8040771484375, -1.65667724609375, -1.50927734375, -1.36187744140625, -1.2144775390625, -1.06707763671875, -0.919677734375, -0.77227783203125, -0.6248779296875, -0.47747802734375, -0.330078125, -0.18267822265625, -0.0352783203125, 0.11212158203125, 0.259521484375, 0.40692138671875, 0.5543212890625, 0.70172119140625, 0.84912109375, 0.99652099609375, 1.1439208984375, 1.29132080078125, 1.438720703125, 1.58612060546875, 1.7335205078125, 1.88092041015625, 2.0283203125, 2.17572021484375, 2.3231201171875, 2.47052001953125, 2.617919921875, 2.76531982421875, 2.9127197265625, 3.06011962890625, 3.20751953125, 3.35491943359375, 3.5023193359375, 3.64971923828125, 3.797119140625, 3.94451904296875, 4.0919189453125, 4.23931884765625, 4.38671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 8.0, 19.0, 21.0, 26.0, 24.0, 25.0, 34.0, 58.0, 56.0, 66.0, 66.0, 79.0, 77.0, 58.0, 55.0, 71.0, 48.0, 41.0, 42.0, 26.0, 27.0, 17.0, 9.0, 7.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58203125, -4.41961669921875, -4.2572021484375, -4.09478759765625, -3.932373046875, -3.76995849609375, -3.6075439453125, -3.44512939453125, -3.28271484375, -3.12030029296875, -2.9578857421875, -2.79547119140625, -2.633056640625, -2.47064208984375, -2.3082275390625, -2.14581298828125, -1.9833984375, -1.82098388671875, -1.6585693359375, -1.49615478515625, -1.333740234375, -1.17132568359375, -1.0089111328125, -0.84649658203125, -0.68408203125, -0.52166748046875, -0.3592529296875, -0.19683837890625, -0.034423828125, 0.12799072265625, 0.2904052734375, 0.45281982421875, 0.615234375, 0.77764892578125, 0.9400634765625, 1.10247802734375, 1.264892578125, 1.42730712890625, 1.5897216796875, 1.75213623046875, 1.91455078125, 2.07696533203125, 2.2393798828125, 2.40179443359375, 2.564208984375, 2.72662353515625, 2.8890380859375, 3.05145263671875, 3.2138671875, 3.37628173828125, 3.5386962890625, 3.70111083984375, 3.863525390625, 4.02593994140625, 4.1883544921875, 4.35076904296875, 4.51318359375, 4.67559814453125, 4.8380126953125, 5.00042724609375, 5.162841796875, 5.32525634765625, 5.4876708984375, 5.65008544921875, 5.8125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 5.0, 10.0, 16.0, 18.0, 36.0, 44.0, 108.0, 179.0, 368.0, 993.0, 3739.0, 30815.0, 879605.0, 120987.0, 8704.0, 1717.0, 599.0, 271.0, 129.0, 76.0, 45.0, 31.0, 12.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7158203125, -1.6491241455078125, -1.582427978515625, -1.5157318115234375, -1.44903564453125, -1.3823394775390625, -1.315643310546875, -1.2489471435546875, -1.1822509765625, -1.1155548095703125, -1.048858642578125, -0.9821624755859375, -0.91546630859375, -0.8487701416015625, -0.782073974609375, -0.7153778076171875, -0.648681640625, -0.5819854736328125, -0.515289306640625, -0.4485931396484375, -0.38189697265625, -0.3152008056640625, -0.248504638671875, -0.1818084716796875, -0.1151123046875, -0.0484161376953125, 0.018280029296875, 0.0849761962890625, 0.15167236328125, 0.2183685302734375, 0.285064697265625, 0.3517608642578125, 0.41845703125, 0.4851531982421875, 0.551849365234375, 0.6185455322265625, 0.68524169921875, 0.7519378662109375, 0.818634033203125, 0.8853302001953125, 0.9520263671875, 1.0187225341796875, 1.085418701171875, 1.1521148681640625, 1.21881103515625, 1.2855072021484375, 1.352203369140625, 1.4188995361328125, 1.485595703125, 1.5522918701171875, 1.618988037109375, 1.6856842041015625, 1.75238037109375, 1.8190765380859375, 1.885772705078125, 1.9524688720703125, 2.0191650390625, 2.0858612060546875, 2.152557373046875, 2.2192535400390625, 2.28594970703125, 2.3526458740234375, 2.419342041015625, 2.4860382080078125, 2.552734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 5.0, 2.0, 8.0, 6.0, 14.0, 17.0, 10.0, 17.0, 13.0, 30.0, 34.0, 53.0, 72.0, 144.0, 175.0, 133.0, 68.0, 37.0, 35.0, 13.0, 22.0, 11.0, 11.0, 8.0, 8.0, 6.0, 8.0, 10.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00022077560424804688, -0.00021348148584365845, -0.00020618736743927002, -0.0001988932490348816, -0.00019159913063049316, -0.00018430501222610474, -0.0001770108938217163, -0.00016971677541732788, -0.00016242265701293945, -0.00015512853860855103, -0.0001478344202041626, -0.00014054030179977417, -0.00013324618339538574, -0.00012595206499099731, -0.00011865794658660889, -0.00011136382818222046, -0.00010406970977783203, -9.67755913734436e-05, -8.948147296905518e-05, -8.218735456466675e-05, -7.489323616027832e-05, -6.759911775588989e-05, -6.0304999351501465e-05, -5.301088094711304e-05, -4.571676254272461e-05, -3.842264413833618e-05, -3.1128525733947754e-05, -2.3834407329559326e-05, -1.65402889251709e-05, -9.24617052078247e-06, -1.952052116394043e-06, 5.342066287994385e-06, 1.2636184692382812e-05, 1.993030309677124e-05, 2.7224421501159668e-05, 3.4518539905548096e-05, 4.1812658309936523e-05, 4.910677671432495e-05, 5.640089511871338e-05, 6.36950135231018e-05, 7.098913192749023e-05, 7.828325033187866e-05, 8.557736873626709e-05, 9.287148714065552e-05, 0.00010016560554504395, 0.00010745972394943237, 0.0001147538423538208, 0.00012204796075820923, 0.00012934207916259766, 0.00013663619756698608, 0.0001439303159713745, 0.00015122443437576294, 0.00015851855278015137, 0.0001658126711845398, 0.00017310678958892822, 0.00018040090799331665, 0.00018769502639770508, 0.0001949891448020935, 0.00020228326320648193, 0.00020957738161087036, 0.0002168715000152588, 0.00022416561841964722, 0.00023145973682403564, 0.00023875385522842407, 0.0002460479736328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 8.0, 16.0, 29.0, 30.0, 52.0, 71.0, 87.0, 107.0, 180.0, 277.0, 442.0, 675.0, 1220.0, 2434.0, 5528.0, 15005.0, 55119.0, 596784.0, 309410.0, 39692.0, 11783.0, 4585.0, 2092.0, 1099.0, 592.0, 360.0, 242.0, 158.0, 101.0, 106.0, 50.0, 47.0, 31.0, 30.0, 20.0, 24.0, 19.0, 8.0, 7.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.169921875, -1.13323974609375, -1.0965576171875, -1.05987548828125, -1.023193359375, -0.98651123046875, -0.9498291015625, -0.91314697265625, -0.87646484375, -0.83978271484375, -0.8031005859375, -0.76641845703125, -0.729736328125, -0.69305419921875, -0.6563720703125, -0.61968994140625, -0.5830078125, -0.54632568359375, -0.5096435546875, -0.47296142578125, -0.436279296875, -0.39959716796875, -0.3629150390625, -0.32623291015625, -0.28955078125, -0.25286865234375, -0.2161865234375, -0.17950439453125, -0.142822265625, -0.10614013671875, -0.0694580078125, -0.03277587890625, 0.00390625, 0.04058837890625, 0.0772705078125, 0.11395263671875, 0.150634765625, 0.18731689453125, 0.2239990234375, 0.26068115234375, 0.29736328125, 0.33404541015625, 0.3707275390625, 0.40740966796875, 0.444091796875, 0.48077392578125, 0.5174560546875, 0.55413818359375, 0.5908203125, 0.62750244140625, 0.6641845703125, 0.70086669921875, 0.737548828125, 0.77423095703125, 0.8109130859375, 0.84759521484375, 0.88427734375, 0.92095947265625, 0.9576416015625, 0.99432373046875, 1.031005859375, 1.06768798828125, 1.1043701171875, 1.14105224609375, 1.177734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 11.0, 14.0, 19.0, 26.0, 29.0, 37.0, 52.0, 83.0, 113.0, 112.0, 112.0, 84.0, 75.0, 50.0, 28.0, 34.0, 18.0, 17.0, 8.0, 9.0, 7.0, 6.0, 5.0, 6.0, 2.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.392608642578125, -1.35357666015625, -1.314544677734375, -1.2755126953125, -1.236480712890625, -1.19744873046875, -1.158416748046875, -1.119384765625, -1.080352783203125, -1.04132080078125, -1.002288818359375, -0.9632568359375, -0.924224853515625, -0.88519287109375, -0.846160888671875, -0.80712890625, -0.768096923828125, -0.72906494140625, -0.690032958984375, -0.6510009765625, -0.611968994140625, -0.57293701171875, -0.533905029296875, -0.494873046875, -0.455841064453125, -0.41680908203125, -0.377777099609375, -0.3387451171875, -0.299713134765625, -0.26068115234375, -0.221649169921875, -0.1826171875, -0.143585205078125, -0.10455322265625, -0.065521240234375, -0.0264892578125, 0.012542724609375, 0.05157470703125, 0.090606689453125, 0.129638671875, 0.168670654296875, 0.20770263671875, 0.246734619140625, 0.2857666015625, 0.324798583984375, 0.36383056640625, 0.402862548828125, 0.44189453125, 0.480926513671875, 0.51995849609375, 0.558990478515625, 0.5980224609375, 0.637054443359375, 0.67608642578125, 0.715118408203125, 0.754150390625, 0.793182373046875, 0.83221435546875, 0.871246337890625, 0.9102783203125, 0.949310302734375, 0.98834228515625, 1.027374267578125, 1.06640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 12.0, 11.0, 25.0, 71.0, 96.0, 139.0, 209.0, 161.0, 111.0, 62.0, 41.0, 16.0, 11.0, 9.0, 5.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.048908233642578, -17.47550392150879, -16.902101516723633, -16.328697204589844, -15.755294799804688, -15.181891441345215, -14.608488082885742, -14.035083770751953, -13.461681365966797, -12.888278007507324, -12.314874649047852, -11.741471290588379, -11.168067932128906, -10.594664573669434, -10.021261215209961, -9.447856903076172, -8.8744535446167, -8.301050186157227, -7.727646827697754, -7.154243469238281, -6.580840110778809, -6.007436752319336, -5.434032917022705, -4.860629558563232, -4.28722620010376, -3.713822841644287, -3.1404194831848145, -2.5670158863067627, -1.99361252784729, -1.4202091693878174, -0.8468055725097656, -0.27340221405029297, 0.3000011444091797, 0.8734045624732971, 1.4468079805374146, 2.0202114582061768, 2.5936148166656494, 3.167018175125122, 3.740421772003174, 4.3138251304626465, 4.887228488922119, 5.460631847381592, 6.0340352058410645, 6.607439041137695, 7.180842399597168, 7.754245758056641, 8.327649116516113, 8.901052474975586, 9.474455833435059, 10.047859191894531, 10.621262550354004, 11.194665908813477, 11.76806926727295, 12.341472625732422, 12.914876937866211, 13.488279342651367, 14.061683654785156, 14.635087013244629, 15.208490371704102, 15.781893730163574, 16.355297088623047, 16.928701400756836, 17.502103805541992, 18.07550811767578, 18.648910522460938]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 12.0, 11.0, 10.0, 17.0, 20.0, 24.0, 25.0, 25.0, 23.0, 38.0, 46.0, 47.0, 52.0, 56.0, 65.0, 61.0, 50.0, 54.0, 51.0, 46.0, 53.0, 42.0, 32.0, 21.0, 24.0, 20.0, 25.0, 14.0, 16.0, 6.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.131839752197266, -16.66941261291504, -16.206985473632812, -15.744560241699219, -15.282133102416992, -14.819705963134766, -14.357279777526855, -13.894853591918945, -13.432426452636719, -12.969999313354492, -12.507573127746582, -12.045146942138672, -11.582719802856445, -11.120292663574219, -10.657866477966309, -10.195440292358398, -9.733013153076172, -9.270586013793945, -8.808159828186035, -8.345733642578125, -7.883306503295898, -7.42087984085083, -6.958453178405762, -6.496026515960693, -6.033599853515625, -5.571173191070557, -5.108746528625488, -4.64631986618042, -4.183893203735352, -3.721466541290283, -3.259039878845215, -2.7966132164001465, -2.334186553955078, -1.8717598915100098, -1.4093332290649414, -0.946906566619873, -0.4844799041748047, -0.022053241729736328, 0.44037342071533203, 0.9028000831604004, 1.3652267456054688, 1.827653408050537, 2.2900800704956055, 2.752506732940674, 3.214933395385742, 3.6773600578308105, 4.139786720275879, 4.602213382720947, 5.064640045166016, 5.527066707611084, 5.989493370056152, 6.451920032501221, 6.914346694946289, 7.376773357391357, 7.839200019836426, 8.301626205444336, 8.764053344726562, 9.226480484008789, 9.6889066696167, 10.15133285522461, 10.613759994506836, 11.076187133789062, 11.538613319396973, 12.001039505004883, 12.46346664428711]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 9.0, 13.0, 22.0, 20.0, 25.0, 48.0, 73.0, 118.0, 206.0, 356.0, 599.0, 1275.0, 2915.0, 7943.0, 31434.0, 414439.0, 3494688.0, 204999.0, 24206.0, 6440.0, 2327.0, 986.0, 481.0, 263.0, 145.0, 75.0, 45.0, 33.0, 16.0, 23.0, 11.0, 10.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3876953125, -1.3351287841796875, -1.282562255859375, -1.2299957275390625, -1.17742919921875, -1.1248626708984375, -1.072296142578125, -1.0197296142578125, -0.9671630859375, -0.9145965576171875, -0.862030029296875, -0.8094635009765625, -0.75689697265625, -0.7043304443359375, -0.651763916015625, -0.5991973876953125, -0.546630859375, -0.4940643310546875, -0.441497802734375, -0.3889312744140625, -0.33636474609375, -0.2837982177734375, -0.231231689453125, -0.1786651611328125, -0.1260986328125, -0.0735321044921875, -0.020965576171875, 0.0316009521484375, 0.08416748046875, 0.1367340087890625, 0.189300537109375, 0.2418670654296875, 0.29443359375, 0.3470001220703125, 0.399566650390625, 0.4521331787109375, 0.50469970703125, 0.5572662353515625, 0.609832763671875, 0.6623992919921875, 0.7149658203125, 0.7675323486328125, 0.820098876953125, 0.8726654052734375, 0.92523193359375, 0.9777984619140625, 1.030364990234375, 1.0829315185546875, 1.135498046875, 1.1880645751953125, 1.240631103515625, 1.2931976318359375, 1.34576416015625, 1.3983306884765625, 1.450897216796875, 1.5034637451171875, 1.5560302734375, 1.6085968017578125, 1.661163330078125, 1.7137298583984375, 1.76629638671875, 1.8188629150390625, 1.871429443359375, 1.9239959716796875, 1.9765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 12.0, 11.0, 9.0, 15.0, 29.0, 29.0, 21.0, 32.0, 41.0, 52.0, 61.0, 62.0, 72.0, 52.0, 66.0, 57.0, 45.0, 58.0, 48.0, 41.0, 23.0, 31.0, 25.0, 23.0, 14.0, 14.0, 11.0, 6.0, 7.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.271484375, -1.240966796875, -1.21044921875, -1.179931640625, -1.1494140625, -1.118896484375, -1.08837890625, -1.057861328125, -1.02734375, -0.996826171875, -0.96630859375, -0.935791015625, -0.9052734375, -0.874755859375, -0.84423828125, -0.813720703125, -0.783203125, -0.752685546875, -0.72216796875, -0.691650390625, -0.6611328125, -0.630615234375, -0.60009765625, -0.569580078125, -0.5390625, -0.508544921875, -0.47802734375, -0.447509765625, -0.4169921875, -0.386474609375, -0.35595703125, -0.325439453125, -0.294921875, -0.264404296875, -0.23388671875, -0.203369140625, -0.1728515625, -0.142333984375, -0.11181640625, -0.081298828125, -0.05078125, -0.020263671875, 0.01025390625, 0.040771484375, 0.0712890625, 0.101806640625, 0.13232421875, 0.162841796875, 0.193359375, 0.223876953125, 0.25439453125, 0.284912109375, 0.3154296875, 0.345947265625, 0.37646484375, 0.406982421875, 0.4375, 0.468017578125, 0.49853515625, 0.529052734375, 0.5595703125, 0.590087890625, 0.62060546875, 0.651123046875, 0.681640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 13.0, 19.0, 28.0, 38.0, 63.0, 111.0, 169.0, 254.0, 398.0, 711.0, 1289.0, 2493.0, 4820.0, 10870.0, 30161.0, 126522.0, 1500399.0, 2275549.0, 177196.0, 38106.0, 13190.0, 5772.0, 2748.0, 1446.0, 733.0, 455.0, 259.0, 169.0, 97.0, 61.0, 46.0, 23.0, 22.0, 11.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.130096435546875, -1.09124755859375, -1.052398681640625, -1.0135498046875, -0.974700927734375, -0.93585205078125, -0.897003173828125, -0.858154296875, -0.819305419921875, -0.78045654296875, -0.741607666015625, -0.7027587890625, -0.663909912109375, -0.62506103515625, -0.586212158203125, -0.54736328125, -0.508514404296875, -0.46966552734375, -0.430816650390625, -0.3919677734375, -0.353118896484375, -0.31427001953125, -0.275421142578125, -0.236572265625, -0.197723388671875, -0.15887451171875, -0.120025634765625, -0.0811767578125, -0.042327880859375, -0.00347900390625, 0.035369873046875, 0.07421875, 0.113067626953125, 0.15191650390625, 0.190765380859375, 0.2296142578125, 0.268463134765625, 0.30731201171875, 0.346160888671875, 0.385009765625, 0.423858642578125, 0.46270751953125, 0.501556396484375, 0.5404052734375, 0.579254150390625, 0.61810302734375, 0.656951904296875, 0.69580078125, 0.734649658203125, 0.77349853515625, 0.812347412109375, 0.8511962890625, 0.890045166015625, 0.92889404296875, 0.967742919921875, 1.006591796875, 1.045440673828125, 1.08428955078125, 1.123138427734375, 1.1619873046875, 1.200836181640625, 1.23968505859375, 1.278533935546875, 1.3173828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 15.0, 7.0, 16.0, 29.0, 33.0, 53.0, 74.0, 146.0, 268.0, 516.0, 772.0, 862.0, 568.0, 277.0, 151.0, 89.0, 42.0, 33.0, 28.0, 14.0, 14.0, 9.0, 6.0, 9.0, 3.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.8720703125, -1.8215484619140625, -1.771026611328125, -1.7205047607421875, -1.66998291015625, -1.6194610595703125, -1.568939208984375, -1.5184173583984375, -1.4678955078125, -1.4173736572265625, -1.366851806640625, -1.3163299560546875, -1.26580810546875, -1.2152862548828125, -1.164764404296875, -1.1142425537109375, -1.063720703125, -1.0131988525390625, -0.962677001953125, -0.9121551513671875, -0.86163330078125, -0.8111114501953125, -0.760589599609375, -0.7100677490234375, -0.6595458984375, -0.6090240478515625, -0.558502197265625, -0.5079803466796875, -0.45745849609375, -0.4069366455078125, -0.356414794921875, -0.3058929443359375, -0.25537109375, -0.2048492431640625, -0.154327392578125, -0.1038055419921875, -0.05328369140625, -0.0027618408203125, 0.047760009765625, 0.0982818603515625, 0.1488037109375, 0.1993255615234375, 0.249847412109375, 0.3003692626953125, 0.35089111328125, 0.4014129638671875, 0.451934814453125, 0.5024566650390625, 0.552978515625, 0.6035003662109375, 0.654022216796875, 0.7045440673828125, 0.75506591796875, 0.8055877685546875, 0.856109619140625, 0.9066314697265625, 0.9571533203125, 1.0076751708984375, 1.058197021484375, 1.1087188720703125, 1.15924072265625, 1.2097625732421875, 1.260284423828125, 1.3108062744140625, 1.361328125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 10.0, 26.0, 61.0, 160.0, 237.0, 277.0, 133.0, 45.0, 24.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.537506103515625, -15.904003143310547, -15.270500183105469, -14.63699722290039, -14.003494262695312, -13.369991302490234, -12.736489295959473, -12.102986335754395, -11.469483375549316, -10.835980415344238, -10.20247745513916, -9.568974494934082, -8.93547248840332, -8.301969528198242, -7.668466567993164, -7.034963607788086, -6.401460647583008, -5.76795768737793, -5.134454727172852, -4.500952243804932, -3.8674492835998535, -3.2339463233947754, -2.6004436016082764, -1.9669408798217773, -1.3334379196166992, -0.6999350786209106, -0.06643223762512207, 0.5670706033706665, 1.200573444366455, 1.8340764045715332, 2.4675791263580322, 3.1010818481445312, 3.7345829010009766, 4.368085861206055, 5.001588821411133, 5.635091304779053, 6.268594264984131, 6.902097225189209, 7.535599708557129, 8.169102668762207, 8.802605628967285, 9.436108589172363, 10.069611549377441, 10.70311450958252, 11.336616516113281, 11.97011947631836, 12.603622436523438, 13.237125396728516, 13.870628356933594, 14.504131317138672, 15.13763427734375, 15.771137237548828, 16.404640197753906, 17.038143157958984, 17.671646118164062, 18.30514907836914, 18.93865203857422, 19.572154998779297, 20.205657958984375, 20.839160919189453, 21.47266387939453, 22.10616683959961, 22.739669799804688, 23.373172760009766, 24.00667381286621]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 12.0, 12.0, 15.0, 16.0, 20.0, 21.0, 36.0, 24.0, 48.0, 47.0, 56.0, 74.0, 59.0, 80.0, 73.0, 69.0, 54.0, 54.0, 61.0, 43.0, 31.0, 18.0, 22.0, 23.0, 8.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875286102294922, -8.577290534973145, -8.279294967651367, -7.981299877166748, -7.683304786682129, -7.385309219360352, -7.087313652038574, -6.789318561553955, -6.491323471069336, -6.193327903747559, -5.8953328132629395, -5.597337245941162, -5.299342155456543, -5.001346588134766, -4.703351020812988, -4.405355930328369, -4.107360363006592, -3.8093650341033936, -3.5113697052001953, -3.213374137878418, -2.915379047393799, -2.6173834800720215, -2.3193881511688232, -2.021392822265625, -1.7233974933624268, -1.4254021644592285, -1.1274068355560303, -0.8294113874435425, -0.5314160585403442, -0.233420729637146, 0.0645747184753418, 0.36257004737854004, 0.6605653762817383, 0.9585607051849365, 1.2565560340881348, 1.5545514822006226, 1.8525468111038208, 2.1505422592163086, 2.448537588119507, 2.746532917022705, 3.0445282459259033, 3.3425235748291016, 3.6405189037323, 3.938514232635498, 4.236509799957275, 4.5345048904418945, 4.832500457763672, 5.130496025085449, 5.428491115570068, 5.726486682891846, 6.024481773376465, 6.322477340698242, 6.620472431182861, 6.918467998504639, 7.216463088989258, 7.514458656311035, 7.8124542236328125, 8.11044979095459, 8.408445358276367, 8.706439971923828, 9.004435539245605, 9.302431106567383, 9.60042667388916, 9.898422241210938, 10.196416854858398]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 3.0, 2.0, 12.0, 9.0, 16.0, 26.0, 25.0, 40.0, 51.0, 70.0, 93.0, 144.0, 246.0, 335.0, 536.0, 866.0, 1638.0, 2948.0, 6012.0, 13236.0, 32538.0, 90933.0, 304612.0, 395443.0, 124279.0, 42075.0, 16594.0, 7313.0, 3606.0, 1912.0, 1062.0, 616.0, 410.0, 247.0, 188.0, 103.0, 71.0, 57.0, 51.0, 33.0, 19.0, 19.0, 15.0, 10.0, 11.0, 8.0, 9.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0], "bins": [-1.3974609375, -1.3565216064453125, -1.315582275390625, -1.2746429443359375, -1.23370361328125, -1.1927642822265625, -1.151824951171875, -1.1108856201171875, -1.0699462890625, -1.0290069580078125, -0.988067626953125, -0.9471282958984375, -0.90618896484375, -0.8652496337890625, -0.824310302734375, -0.7833709716796875, -0.742431640625, -0.7014923095703125, -0.660552978515625, -0.6196136474609375, -0.57867431640625, -0.5377349853515625, -0.496795654296875, -0.4558563232421875, -0.4149169921875, -0.3739776611328125, -0.333038330078125, -0.2920989990234375, -0.25115966796875, -0.2102203369140625, -0.169281005859375, -0.1283416748046875, -0.08740234375, -0.0464630126953125, -0.005523681640625, 0.0354156494140625, 0.07635498046875, 0.1172943115234375, 0.158233642578125, 0.1991729736328125, 0.2401123046875, 0.2810516357421875, 0.321990966796875, 0.3629302978515625, 0.40386962890625, 0.4448089599609375, 0.485748291015625, 0.5266876220703125, 0.567626953125, 0.6085662841796875, 0.649505615234375, 0.6904449462890625, 0.73138427734375, 0.7723236083984375, 0.813262939453125, 0.8542022705078125, 0.8951416015625, 0.9360809326171875, 0.977020263671875, 1.0179595947265625, 1.05889892578125, 1.0998382568359375, 1.140777587890625, 1.1817169189453125, 1.22265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 3.0, 12.0, 12.0, 19.0, 16.0, 31.0, 30.0, 31.0, 41.0, 36.0, 65.0, 70.0, 43.0, 59.0, 67.0, 62.0, 57.0, 59.0, 53.0, 38.0, 33.0, 35.0, 24.0, 27.0, 20.0, 13.0, 12.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-1.373046875, -1.341217041015625, -1.30938720703125, -1.277557373046875, -1.2457275390625, -1.213897705078125, -1.18206787109375, -1.150238037109375, -1.118408203125, -1.086578369140625, -1.05474853515625, -1.022918701171875, -0.9910888671875, -0.959259033203125, -0.92742919921875, -0.895599365234375, -0.86376953125, -0.831939697265625, -0.80010986328125, -0.768280029296875, -0.7364501953125, -0.704620361328125, -0.67279052734375, -0.640960693359375, -0.609130859375, -0.577301025390625, -0.54547119140625, -0.513641357421875, -0.4818115234375, -0.449981689453125, -0.41815185546875, -0.386322021484375, -0.3544921875, -0.322662353515625, -0.29083251953125, -0.259002685546875, -0.2271728515625, -0.195343017578125, -0.16351318359375, -0.131683349609375, -0.099853515625, -0.068023681640625, -0.03619384765625, -0.004364013671875, 0.0274658203125, 0.059295654296875, 0.09112548828125, 0.122955322265625, 0.15478515625, 0.186614990234375, 0.21844482421875, 0.250274658203125, 0.2821044921875, 0.313934326171875, 0.34576416015625, 0.377593994140625, 0.409423828125, 0.441253662109375, 0.47308349609375, 0.504913330078125, 0.5367431640625, 0.568572998046875, 0.60040283203125, 0.632232666015625, 0.6640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 12.0, 8.0, 9.0, 13.0, 22.0, 24.0, 33.0, 46.0, 75.0, 100.0, 149.0, 238.0, 421.0, 646.0, 1349.0, 3120.0, 9788.0, 41501.0, 267117.0, 616258.0, 81822.0, 16833.0, 4827.0, 1895.0, 885.0, 466.0, 291.0, 192.0, 122.0, 85.0, 59.0, 34.0, 27.0, 21.0, 21.0, 6.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.3583984375, -2.28515625, -2.2119140625, -2.138671875, -2.0654296875, -1.9921875, -1.9189453125, -1.845703125, -1.7724609375, -1.69921875, -1.6259765625, -1.552734375, -1.4794921875, -1.40625, -1.3330078125, -1.259765625, -1.1865234375, -1.11328125, -1.0400390625, -0.966796875, -0.8935546875, -0.8203125, -0.7470703125, -0.673828125, -0.6005859375, -0.52734375, -0.4541015625, -0.380859375, -0.3076171875, -0.234375, -0.1611328125, -0.087890625, -0.0146484375, 0.05859375, 0.1318359375, 0.205078125, 0.2783203125, 0.3515625, 0.4248046875, 0.498046875, 0.5712890625, 0.64453125, 0.7177734375, 0.791015625, 0.8642578125, 0.9375, 1.0107421875, 1.083984375, 1.1572265625, 1.23046875, 1.3037109375, 1.376953125, 1.4501953125, 1.5234375, 1.5966796875, 1.669921875, 1.7431640625, 1.81640625, 1.8896484375, 1.962890625, 2.0361328125, 2.109375, 2.1826171875, 2.255859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 10.0, 12.0, 17.0, 18.0, 21.0, 24.0, 32.0, 30.0, 43.0, 47.0, 43.0, 54.0, 57.0, 54.0, 59.0, 56.0, 43.0, 47.0, 50.0, 38.0, 39.0, 27.0, 45.0, 21.0, 26.0, 16.0, 7.0, 10.0, 8.0, 7.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.275390625, -3.158843994140625, -3.04229736328125, -2.925750732421875, -2.8092041015625, -2.692657470703125, -2.57611083984375, -2.459564208984375, -2.343017578125, -2.226470947265625, -2.10992431640625, -1.993377685546875, -1.8768310546875, -1.760284423828125, -1.64373779296875, -1.527191162109375, -1.41064453125, -1.294097900390625, -1.17755126953125, -1.061004638671875, -0.9444580078125, -0.827911376953125, -0.71136474609375, -0.594818115234375, -0.478271484375, -0.361724853515625, -0.24517822265625, -0.128631591796875, -0.0120849609375, 0.104461669921875, 0.22100830078125, 0.337554931640625, 0.4541015625, 0.570648193359375, 0.68719482421875, 0.803741455078125, 0.9202880859375, 1.036834716796875, 1.15338134765625, 1.269927978515625, 1.386474609375, 1.503021240234375, 1.61956787109375, 1.736114501953125, 1.8526611328125, 1.969207763671875, 2.08575439453125, 2.202301025390625, 2.31884765625, 2.435394287109375, 2.55194091796875, 2.668487548828125, 2.7850341796875, 2.901580810546875, 3.01812744140625, 3.134674072265625, 3.251220703125, 3.367767333984375, 3.48431396484375, 3.600860595703125, 3.7174072265625, 3.833953857421875, 3.95050048828125, 4.067047119140625, 4.18359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 13.0, 32.0, 44.0, 69.0, 147.0, 339.0, 1285.0, 10963.0, 886479.0, 143118.0, 4720.0, 784.0, 244.0, 121.0, 78.0, 47.0, 23.0, 12.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.833984375, -2.738983154296875, -2.64398193359375, -2.548980712890625, -2.4539794921875, -2.358978271484375, -2.26397705078125, -2.168975830078125, -2.073974609375, -1.978973388671875, -1.88397216796875, -1.788970947265625, -1.6939697265625, -1.598968505859375, -1.50396728515625, -1.408966064453125, -1.31396484375, -1.218963623046875, -1.12396240234375, -1.028961181640625, -0.9339599609375, -0.838958740234375, -0.74395751953125, -0.648956298828125, -0.553955078125, -0.458953857421875, -0.36395263671875, -0.268951416015625, -0.1739501953125, -0.078948974609375, 0.01605224609375, 0.111053466796875, 0.2060546875, 0.301055908203125, 0.39605712890625, 0.491058349609375, 0.5860595703125, 0.681060791015625, 0.77606201171875, 0.871063232421875, 0.966064453125, 1.061065673828125, 1.15606689453125, 1.251068115234375, 1.3460693359375, 1.441070556640625, 1.53607177734375, 1.631072998046875, 1.72607421875, 1.821075439453125, 1.91607666015625, 2.011077880859375, 2.1060791015625, 2.201080322265625, 2.29608154296875, 2.391082763671875, 2.486083984375, 2.581085205078125, 2.67608642578125, 2.771087646484375, 2.8660888671875, 2.961090087890625, 3.05609130859375, 3.151092529296875, 3.24609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 6.0, 9.0, 12.0, 11.0, 11.0, 17.0, 23.0, 38.0, 90.0, 129.0, 187.0, 171.0, 102.0, 47.0, 29.0, 33.0, 17.0, 17.0, 15.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002875328063964844, -0.0002784356474876404, -0.0002693384885787964, -0.0002602413296699524, -0.0002511441707611084, -0.0002420470118522644, -0.0002329498529434204, -0.00022385269403457642, -0.00021475553512573242, -0.00020565837621688843, -0.00019656121730804443, -0.00018746405839920044, -0.00017836689949035645, -0.00016926974058151245, -0.00016017258167266846, -0.00015107542276382446, -0.00014197826385498047, -0.00013288110494613647, -0.00012378394603729248, -0.00011468678712844849, -0.00010558962821960449, -9.64924693107605e-05, -8.73953104019165e-05, -7.829815149307251e-05, -6.920099258422852e-05, -6.010383367538452e-05, -5.100667476654053e-05, -4.190951585769653e-05, -3.281235694885254e-05, -2.3715198040008545e-05, -1.461803913116455e-05, -5.520880222320557e-06, 3.5762786865234375e-06, 1.2673437595367432e-05, 2.1770596504211426e-05, 3.086775541305542e-05, 3.9964914321899414e-05, 4.906207323074341e-05, 5.81592321395874e-05, 6.72563910484314e-05, 7.635354995727539e-05, 8.545070886611938e-05, 9.454786777496338e-05, 0.00010364502668380737, 0.00011274218559265137, 0.00012183934450149536, 0.00013093650341033936, 0.00014003366231918335, 0.00014913082122802734, 0.00015822798013687134, 0.00016732513904571533, 0.00017642229795455933, 0.00018551945686340332, 0.00019461661577224731, 0.0002037137746810913, 0.0002128109335899353, 0.0002219080924987793, 0.0002310052514076233, 0.00024010241031646729, 0.0002491995692253113, 0.0002582967281341553, 0.00026739388704299927, 0.00027649104595184326, 0.00028558820486068726, 0.00029468536376953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 5.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 13.0, 17.0, 27.0, 30.0, 41.0, 51.0, 88.0, 121.0, 170.0, 288.0, 484.0, 736.0, 1262.0, 2295.0, 4154.0, 9432.0, 28688.0, 232729.0, 682584.0, 58218.0, 14310.0, 5939.0, 2808.0, 1560.0, 918.0, 501.0, 318.0, 232.0, 132.0, 98.0, 70.0, 51.0, 40.0, 32.0, 32.0, 19.0, 8.0, 8.0, 7.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9827423095703125, -0.947906494140625, -0.9130706787109375, -0.87823486328125, -0.8433990478515625, -0.808563232421875, -0.7737274169921875, -0.7388916015625, -0.7040557861328125, -0.669219970703125, -0.6343841552734375, -0.59954833984375, -0.5647125244140625, -0.529876708984375, -0.4950408935546875, -0.460205078125, -0.4253692626953125, -0.390533447265625, -0.3556976318359375, -0.32086181640625, -0.2860260009765625, -0.251190185546875, -0.2163543701171875, -0.1815185546875, -0.1466827392578125, -0.111846923828125, -0.0770111083984375, -0.04217529296875, -0.0073394775390625, 0.027496337890625, 0.0623321533203125, 0.09716796875, 0.1320037841796875, 0.166839599609375, 0.2016754150390625, 0.23651123046875, 0.2713470458984375, 0.306182861328125, 0.3410186767578125, 0.3758544921875, 0.4106903076171875, 0.445526123046875, 0.4803619384765625, 0.51519775390625, 0.5500335693359375, 0.584869384765625, 0.6197052001953125, 0.654541015625, 0.6893768310546875, 0.724212646484375, 0.7590484619140625, 0.79388427734375, 0.8287200927734375, 0.863555908203125, 0.8983917236328125, 0.9332275390625, 0.9680633544921875, 1.002899169921875, 1.0377349853515625, 1.07257080078125, 1.1074066162109375, 1.142242431640625, 1.1770782470703125, 1.2119140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 11.0, 12.0, 13.0, 25.0, 55.0, 74.0, 126.0, 167.0, 163.0, 114.0, 74.0, 45.0, 27.0, 17.0, 12.0, 10.0, 10.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5107421875, -1.467620849609375, -1.42449951171875, -1.381378173828125, -1.3382568359375, -1.295135498046875, -1.25201416015625, -1.208892822265625, -1.165771484375, -1.122650146484375, -1.07952880859375, -1.036407470703125, -0.9932861328125, -0.950164794921875, -0.90704345703125, -0.863922119140625, -0.82080078125, -0.777679443359375, -0.73455810546875, -0.691436767578125, -0.6483154296875, -0.605194091796875, -0.56207275390625, -0.518951416015625, -0.475830078125, -0.432708740234375, -0.38958740234375, -0.346466064453125, -0.3033447265625, -0.260223388671875, -0.21710205078125, -0.173980712890625, -0.130859375, -0.087738037109375, -0.04461669921875, -0.001495361328125, 0.0416259765625, 0.084747314453125, 0.12786865234375, 0.170989990234375, 0.214111328125, 0.257232666015625, 0.30035400390625, 0.343475341796875, 0.3865966796875, 0.429718017578125, 0.47283935546875, 0.515960693359375, 0.55908203125, 0.602203369140625, 0.64532470703125, 0.688446044921875, 0.7315673828125, 0.774688720703125, 0.81781005859375, 0.860931396484375, 0.904052734375, 0.947174072265625, 0.99029541015625, 1.033416748046875, 1.0765380859375, 1.119659423828125, 1.16278076171875, 1.205902099609375, 1.2490234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 1.0, 6.0, 3.0, 5.0, 14.0, 15.0, 37.0, 99.0, 207.0, 293.0, 174.0, 81.0, 29.0, 13.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.14150619506836, -23.37288475036621, -22.604263305664062, -21.835641860961914, -21.067020416259766, -20.298398971557617, -19.52977752685547, -18.761154174804688, -17.992534637451172, -17.223913192749023, -16.455291748046875, -15.686670303344727, -14.918048858642578, -14.14942741394043, -13.380805015563965, -12.612183570861816, -11.843561172485352, -11.074939727783203, -10.306318283081055, -9.537696838378906, -8.769075393676758, -8.00045394897461, -7.2318315505981445, -6.463210105895996, -5.694588661193848, -4.925967216491699, -4.157345771789551, -3.388723850250244, -2.6201024055480957, -1.8514809608459473, -1.0828590393066406, -0.3142375946044922, 0.45438385009765625, 1.2230054140090942, 1.9916269779205322, 2.7602486610412598, 3.528870105743408, 4.297491550445557, 5.066113471984863, 5.834734916687012, 6.60335636138916, 7.371977806091309, 8.140599250793457, 8.909221649169922, 9.67784309387207, 10.446464538574219, 11.215085983276367, 11.983707427978516, 12.752328872680664, 13.520950317382812, 14.289571762084961, 15.05819320678711, 15.826814651489258, 16.595436096191406, 17.364059448242188, 18.132678985595703, 18.901302337646484, 19.669923782348633, 20.43854522705078, 21.20716667175293, 21.975788116455078, 22.744409561157227, 23.513031005859375, 24.281654357910156, 25.050273895263672]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 8.0, 12.0, 13.0, 18.0, 26.0, 18.0, 16.0, 33.0, 29.0, 22.0, 37.0, 39.0, 57.0, 54.0, 52.0, 65.0, 69.0, 55.0, 50.0, 36.0, 36.0, 40.0, 29.0, 20.0, 26.0, 29.0, 16.0, 15.0, 12.0, 15.0, 11.0, 5.0, 2.0, 5.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.717267990112305, -13.298589706420898, -12.879911422729492, -12.461234092712402, -12.042555809020996, -11.62387752532959, -11.205199241638184, -10.786521911621094, -10.367843627929688, -9.949165344238281, -9.530487060546875, -9.111809730529785, -8.693131446838379, -8.274453163146973, -7.855774879455566, -7.437097072601318, -7.018418788909912, -6.599740505218506, -6.181062698364258, -5.762384414672852, -5.3437066078186035, -4.925028324127197, -4.506350517272949, -4.087672233581543, -3.668994188308716, -3.2503161430358887, -2.8316380977630615, -2.4129600524902344, -1.9942818880081177, -1.575603723526001, -1.1569256782531738, -0.7382476329803467, -0.31956958770751953, 0.09910848736763, 0.5177865624427795, 0.9364646673202515, 1.3551427125930786, 1.7738208770751953, 2.1924989223480225, 2.6111769676208496, 3.0298550128936768, 3.448533058166504, 3.867211103439331, 4.285889148712158, 4.7045674324035645, 5.1232452392578125, 5.541923522949219, 5.960601806640625, 6.379279613494873, 6.797957897186279, 7.216635704040527, 7.635313987731934, 8.05399227142334, 8.47266960144043, 8.891347885131836, 9.310026168823242, 9.728704452514648, 10.147382736206055, 10.566061019897461, 10.98473834991455, 11.403416633605957, 11.822094917297363, 12.24077320098877, 12.65945053100586, 13.078128814697266]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 7.0, 12.0, 17.0, 11.0, 30.0, 36.0, 57.0, 63.0, 125.0, 225.0, 387.0, 834.0, 2007.0, 5599.0, 19134.0, 120366.0, 2096736.0, 1821296.0, 100898.0, 17658.0, 4923.0, 1838.0, 840.0, 424.0, 239.0, 148.0, 101.0, 65.0, 49.0, 43.0, 30.0, 17.0, 14.0, 11.0, 6.0, 5.0, 7.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4990234375, -1.4521331787109375, -1.405242919921875, -1.3583526611328125, -1.31146240234375, -1.2645721435546875, -1.217681884765625, -1.1707916259765625, -1.1239013671875, -1.0770111083984375, -1.030120849609375, -0.9832305908203125, -0.93634033203125, -0.8894500732421875, -0.842559814453125, -0.7956695556640625, -0.748779296875, -0.7018890380859375, -0.654998779296875, -0.6081085205078125, -0.56121826171875, -0.5143280029296875, -0.467437744140625, -0.4205474853515625, -0.3736572265625, -0.3267669677734375, -0.279876708984375, -0.2329864501953125, -0.18609619140625, -0.1392059326171875, -0.092315673828125, -0.0454254150390625, 0.00146484375, 0.0483551025390625, 0.095245361328125, 0.1421356201171875, 0.18902587890625, 0.2359161376953125, 0.282806396484375, 0.3296966552734375, 0.3765869140625, 0.4234771728515625, 0.470367431640625, 0.5172576904296875, 0.56414794921875, 0.6110382080078125, 0.657928466796875, 0.7048187255859375, 0.751708984375, 0.7985992431640625, 0.845489501953125, 0.8923797607421875, 0.93927001953125, 0.9861602783203125, 1.033050537109375, 1.0799407958984375, 1.1268310546875, 1.1737213134765625, 1.220611572265625, 1.2675018310546875, 1.31439208984375, 1.3612823486328125, 1.408172607421875, 1.4550628662109375, 1.501953125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 10.0, 10.0, 13.0, 20.0, 30.0, 33.0, 44.0, 54.0, 63.0, 55.0, 65.0, 76.0, 72.0, 68.0, 63.0, 74.0, 52.0, 44.0, 26.0, 41.0, 17.0, 11.0, 15.0, 12.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.556640625, -1.5214080810546875, -1.486175537109375, -1.4509429931640625, -1.41571044921875, -1.3804779052734375, -1.345245361328125, -1.3100128173828125, -1.2747802734375, -1.2395477294921875, -1.204315185546875, -1.1690826416015625, -1.13385009765625, -1.0986175537109375, -1.063385009765625, -1.0281524658203125, -0.992919921875, -0.9576873779296875, -0.922454833984375, -0.8872222900390625, -0.85198974609375, -0.8167572021484375, -0.781524658203125, -0.7462921142578125, -0.7110595703125, -0.6758270263671875, -0.640594482421875, -0.6053619384765625, -0.57012939453125, -0.5348968505859375, -0.499664306640625, -0.4644317626953125, -0.42919921875, -0.3939666748046875, -0.358734130859375, -0.3235015869140625, -0.28826904296875, -0.2530364990234375, -0.217803955078125, -0.1825714111328125, -0.1473388671875, -0.1121063232421875, -0.076873779296875, -0.0416412353515625, -0.00640869140625, 0.0288238525390625, 0.064056396484375, 0.0992889404296875, 0.134521484375, 0.1697540283203125, 0.204986572265625, 0.2402191162109375, 0.27545166015625, 0.3106842041015625, 0.345916748046875, 0.3811492919921875, 0.4163818359375, 0.4516143798828125, 0.486846923828125, 0.5220794677734375, 0.55731201171875, 0.5925445556640625, 0.627777099609375, 0.6630096435546875, 0.6982421875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 14.0, 12.0, 23.0, 41.0, 44.0, 83.0, 163.0, 260.0, 464.0, 1056.0, 2782.0, 9897.0, 56960.0, 1173884.0, 2816408.0, 109803.0, 15472.0, 3770.0, 1435.0, 674.0, 386.0, 225.0, 148.0, 77.0, 53.0, 49.0, 25.0, 19.0, 6.0, 10.0, 11.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.560546875, -1.495880126953125, -1.43121337890625, -1.366546630859375, -1.3018798828125, -1.237213134765625, -1.17254638671875, -1.107879638671875, -1.043212890625, -0.978546142578125, -0.91387939453125, -0.849212646484375, -0.7845458984375, -0.719879150390625, -0.65521240234375, -0.590545654296875, -0.52587890625, -0.461212158203125, -0.39654541015625, -0.331878662109375, -0.2672119140625, -0.202545166015625, -0.13787841796875, -0.073211669921875, -0.008544921875, 0.056121826171875, 0.12078857421875, 0.185455322265625, 0.2501220703125, 0.314788818359375, 0.37945556640625, 0.444122314453125, 0.5087890625, 0.573455810546875, 0.63812255859375, 0.702789306640625, 0.7674560546875, 0.832122802734375, 0.89678955078125, 0.961456298828125, 1.026123046875, 1.090789794921875, 1.15545654296875, 1.220123291015625, 1.2847900390625, 1.349456787109375, 1.41412353515625, 1.478790283203125, 1.54345703125, 1.608123779296875, 1.67279052734375, 1.737457275390625, 1.8021240234375, 1.866790771484375, 1.93145751953125, 1.996124267578125, 2.060791015625, 2.125457763671875, 2.19012451171875, 2.254791259765625, 2.3194580078125, 2.384124755859375, 2.44879150390625, 2.513458251953125, 2.578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 6.0, 12.0, 19.0, 16.0, 23.0, 41.0, 78.0, 121.0, 239.0, 498.0, 845.0, 926.0, 579.0, 256.0, 165.0, 73.0, 59.0, 33.0, 27.0, 15.0, 15.0, 9.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8031158447265625, -1.728302001953125, -1.6534881591796875, -1.57867431640625, -1.5038604736328125, -1.429046630859375, -1.3542327880859375, -1.2794189453125, -1.2046051025390625, -1.129791259765625, -1.0549774169921875, -0.98016357421875, -0.9053497314453125, -0.830535888671875, -0.7557220458984375, -0.680908203125, -0.6060943603515625, -0.531280517578125, -0.4564666748046875, -0.38165283203125, -0.3068389892578125, -0.232025146484375, -0.1572113037109375, -0.0823974609375, -0.0075836181640625, 0.067230224609375, 0.1420440673828125, 0.21685791015625, 0.2916717529296875, 0.366485595703125, 0.4412994384765625, 0.51611328125, 0.5909271240234375, 0.665740966796875, 0.7405548095703125, 0.81536865234375, 0.8901824951171875, 0.964996337890625, 1.0398101806640625, 1.1146240234375, 1.1894378662109375, 1.264251708984375, 1.3390655517578125, 1.41387939453125, 1.4886932373046875, 1.563507080078125, 1.6383209228515625, 1.713134765625, 1.7879486083984375, 1.862762451171875, 1.9375762939453125, 2.01239013671875, 2.0872039794921875, 2.162017822265625, 2.2368316650390625, 2.3116455078125, 2.3864593505859375, 2.461273193359375, 2.5360870361328125, 2.61090087890625, 2.6857147216796875, 2.760528564453125, 2.8353424072265625, 2.91015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 5.0, 5.0, 19.0, 46.0, 113.0, 244.0, 282.0, 171.0, 67.0, 26.0, 15.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.295491218566895, -7.4835896492004395, -6.671687602996826, -5.859786033630371, -5.047883987426758, -4.235982418060303, -3.4240808486938477, -2.6121788024902344, -1.8002772331237793, -0.9883754849433899, -0.1764737367630005, 0.6354279518127441, 1.4473297595977783, 2.2592315673828125, 3.0711331367492676, 3.883035182952881, 4.694936752319336, 5.506838321685791, 6.318740367889404, 7.130641937255859, 7.942543983459473, 8.754446029663086, 9.566347122192383, 10.378249168395996, 11.19015121459961, 12.002053260803223, 12.81395435333252, 13.625856399536133, 14.437758445739746, 15.24966049194336, 16.061561584472656, 16.873462677001953, 17.685365676879883, 18.49726676940918, 19.30916976928711, 20.121070861816406, 20.932971954345703, 21.744874954223633, 22.55677604675293, 23.36867904663086, 24.180580139160156, 24.992481231689453, 25.804384231567383, 26.61628532409668, 27.428186416625977, 28.240089416503906, 29.051990509033203, 29.8638916015625, 30.675792694091797, 31.487693786621094, 32.29959487915039, 33.11149597167969, 33.92340087890625, 34.73530197143555, 35.547203063964844, 36.35910415649414, 37.1710090637207, 37.98291015625, 38.7948112487793, 39.606712341308594, 40.418617248535156, 41.23051834106445, 42.04241943359375, 42.85432052612305, 43.666221618652344]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 19.0, 19.0, 13.0, 29.0, 19.0, 31.0, 45.0, 40.0, 43.0, 70.0, 50.0, 69.0, 69.0, 72.0, 64.0, 62.0, 37.0, 47.0, 30.0, 36.0, 31.0, 21.0, 21.0, 15.0, 12.0, 11.0, 2.0, 3.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203764915466309, -9.852551460266113, -9.501338005065918, -9.150124549865723, -8.798912048339844, -8.447698593139648, -8.096485137939453, -7.745271682739258, -7.3940582275390625, -7.042844772338867, -6.691631317138672, -6.340418338775635, -5.9892048835754395, -5.637991428375244, -5.286778450012207, -4.935564994812012, -4.584351539611816, -4.233138084411621, -3.881924867630005, -3.5307116508483887, -3.1794981956481934, -2.828284740447998, -2.477071523666382, -2.1258583068847656, -1.7746448516845703, -1.4234315156936646, -1.0722181797027588, -0.721004843711853, -0.36979150772094727, -0.018578171730041504, 0.33263516426086426, 0.6838483810424805, 1.0350608825683594, 1.3862742185592651, 1.737487554550171, 2.088700771331787, 2.4399142265319824, 2.7911276817321777, 3.142340898513794, 3.49355411529541, 3.8447675704956055, 4.195981025695801, 4.547194480895996, 4.898407459259033, 5.2496209144592285, 5.600834369659424, 5.952047348022461, 6.303260803222656, 6.654474258422852, 7.005687713623047, 7.356901168823242, 7.708114147186279, 8.059328079223633, 8.410540580749512, 8.761754035949707, 9.112967491149902, 9.464180946350098, 9.815394401550293, 10.166607856750488, 10.517821311950684, 10.869033813476562, 11.220247268676758, 11.571460723876953, 11.922674179077148, 12.273887634277344]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 9.0, 4.0, 6.0, 7.0, 13.0, 18.0, 27.0, 39.0, 65.0, 63.0, 140.0, 215.0, 376.0, 674.0, 1224.0, 2870.0, 7422.0, 23827.0, 87005.0, 351805.0, 420873.0, 107770.0, 28908.0, 8825.0, 3217.0, 1387.0, 707.0, 375.0, 242.0, 167.0, 96.0, 69.0, 43.0, 18.0, 13.0, 8.0, 7.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.7265625, -1.6710052490234375, -1.615447998046875, -1.5598907470703125, -1.50433349609375, -1.4487762451171875, -1.393218994140625, -1.3376617431640625, -1.2821044921875, -1.2265472412109375, -1.170989990234375, -1.1154327392578125, -1.05987548828125, -1.0043182373046875, -0.948760986328125, -0.8932037353515625, -0.837646484375, -0.7820892333984375, -0.726531982421875, -0.6709747314453125, -0.61541748046875, -0.5598602294921875, -0.504302978515625, -0.4487457275390625, -0.3931884765625, -0.3376312255859375, -0.282073974609375, -0.2265167236328125, -0.17095947265625, -0.1154022216796875, -0.059844970703125, -0.0042877197265625, 0.05126953125, 0.1068267822265625, 0.162384033203125, 0.2179412841796875, 0.27349853515625, 0.3290557861328125, 0.384613037109375, 0.4401702880859375, 0.4957275390625, 0.5512847900390625, 0.606842041015625, 0.6623992919921875, 0.71795654296875, 0.7735137939453125, 0.829071044921875, 0.8846282958984375, 0.940185546875, 0.9957427978515625, 1.051300048828125, 1.1068572998046875, 1.16241455078125, 1.2179718017578125, 1.273529052734375, 1.3290863037109375, 1.3846435546875, 1.4402008056640625, 1.495758056640625, 1.5513153076171875, 1.60687255859375, 1.6624298095703125, 1.717987060546875, 1.7735443115234375, 1.8291015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 7.0, 5.0, 15.0, 10.0, 14.0, 26.0, 27.0, 25.0, 34.0, 36.0, 41.0, 44.0, 48.0, 44.0, 52.0, 52.0, 53.0, 50.0, 48.0, 48.0, 50.0, 49.0, 40.0, 32.0, 20.0, 21.0, 22.0, 12.0, 21.0, 5.0, 10.0, 6.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71240234375, -0.687042236328125, -0.66168212890625, -0.636322021484375, -0.6109619140625, -0.585601806640625, -0.56024169921875, -0.534881591796875, -0.509521484375, -0.484161376953125, -0.45880126953125, -0.433441162109375, -0.4080810546875, -0.382720947265625, -0.35736083984375, -0.332000732421875, -0.306640625, -0.281280517578125, -0.25592041015625, -0.230560302734375, -0.2052001953125, -0.179840087890625, -0.15447998046875, -0.129119873046875, -0.103759765625, -0.078399658203125, -0.05303955078125, -0.027679443359375, -0.0023193359375, 0.023040771484375, 0.04840087890625, 0.073760986328125, 0.09912109375, 0.124481201171875, 0.14984130859375, 0.175201416015625, 0.2005615234375, 0.225921630859375, 0.25128173828125, 0.276641845703125, 0.302001953125, 0.327362060546875, 0.35272216796875, 0.378082275390625, 0.4034423828125, 0.428802490234375, 0.45416259765625, 0.479522705078125, 0.5048828125, 0.530242919921875, 0.55560302734375, 0.580963134765625, 0.6063232421875, 0.631683349609375, 0.65704345703125, 0.682403564453125, 0.707763671875, 0.733123779296875, 0.75848388671875, 0.783843994140625, 0.8092041015625, 0.834564208984375, 0.85992431640625, 0.885284423828125, 0.91064453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 0.0, 2.0, 3.0, 2.0, 9.0, 14.0, 7.0, 35.0, 54.0, 58.0, 107.0, 166.0, 261.0, 480.0, 813.0, 1736.0, 4637.0, 21949.0, 316219.0, 659795.0, 32019.0, 5925.0, 2015.0, 943.0, 544.0, 286.0, 157.0, 111.0, 67.0, 41.0, 29.0, 26.0, 15.0, 9.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4921875, -4.364166259765625, -4.23614501953125, -4.108123779296875, -3.9801025390625, -3.852081298828125, -3.72406005859375, -3.596038818359375, -3.468017578125, -3.339996337890625, -3.21197509765625, -3.083953857421875, -2.9559326171875, -2.827911376953125, -2.69989013671875, -2.571868896484375, -2.44384765625, -2.315826416015625, -2.18780517578125, -2.059783935546875, -1.9317626953125, -1.803741455078125, -1.67572021484375, -1.547698974609375, -1.419677734375, -1.291656494140625, -1.16363525390625, -1.035614013671875, -0.9075927734375, -0.779571533203125, -0.65155029296875, -0.523529052734375, -0.3955078125, -0.267486572265625, -0.13946533203125, -0.011444091796875, 0.1165771484375, 0.244598388671875, 0.37261962890625, 0.500640869140625, 0.628662109375, 0.756683349609375, 0.88470458984375, 1.012725830078125, 1.1407470703125, 1.268768310546875, 1.39678955078125, 1.524810791015625, 1.65283203125, 1.780853271484375, 1.90887451171875, 2.036895751953125, 2.1649169921875, 2.292938232421875, 2.42095947265625, 2.548980712890625, 2.677001953125, 2.805023193359375, 2.93304443359375, 3.061065673828125, 3.1890869140625, 3.317108154296875, 3.44512939453125, 3.573150634765625, 3.701171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 13.0, 13.0, 15.0, 15.0, 15.0, 27.0, 36.0, 33.0, 35.0, 36.0, 53.0, 47.0, 51.0, 51.0, 49.0, 53.0, 62.0, 41.0, 37.0, 40.0, 37.0, 25.0, 30.0, 28.0, 25.0, 15.0, 19.0, 16.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.576171875, -3.455352783203125, -3.33453369140625, -3.213714599609375, -3.0928955078125, -2.972076416015625, -2.85125732421875, -2.730438232421875, -2.609619140625, -2.488800048828125, -2.36798095703125, -2.247161865234375, -2.1263427734375, -2.005523681640625, -1.88470458984375, -1.763885498046875, -1.64306640625, -1.522247314453125, -1.40142822265625, -1.280609130859375, -1.1597900390625, -1.038970947265625, -0.91815185546875, -0.797332763671875, -0.676513671875, -0.555694580078125, -0.43487548828125, -0.314056396484375, -0.1932373046875, -0.072418212890625, 0.04840087890625, 0.169219970703125, 0.2900390625, 0.410858154296875, 0.53167724609375, 0.652496337890625, 0.7733154296875, 0.894134521484375, 1.01495361328125, 1.135772705078125, 1.256591796875, 1.377410888671875, 1.49822998046875, 1.619049072265625, 1.7398681640625, 1.860687255859375, 1.98150634765625, 2.102325439453125, 2.22314453125, 2.343963623046875, 2.46478271484375, 2.585601806640625, 2.7064208984375, 2.827239990234375, 2.94805908203125, 3.068878173828125, 3.189697265625, 3.310516357421875, 3.43133544921875, 3.552154541015625, 3.6729736328125, 3.793792724609375, 3.91461181640625, 4.035430908203125, 4.15625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 10.0, 9.0, 7.0, 18.0, 22.0, 32.0, 50.0, 72.0, 128.0, 199.0, 348.0, 716.0, 1661.0, 5185.0, 23808.0, 384578.0, 597005.0, 25741.0, 5523.0, 1699.0, 746.0, 400.0, 201.0, 121.0, 86.0, 49.0, 41.0, 36.0, 18.0, 14.0, 6.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5419921875, -1.488861083984375, -1.43572998046875, -1.382598876953125, -1.3294677734375, -1.276336669921875, -1.22320556640625, -1.170074462890625, -1.116943359375, -1.063812255859375, -1.01068115234375, -0.957550048828125, -0.9044189453125, -0.851287841796875, -0.79815673828125, -0.745025634765625, -0.69189453125, -0.638763427734375, -0.58563232421875, -0.532501220703125, -0.4793701171875, -0.426239013671875, -0.37310791015625, -0.319976806640625, -0.266845703125, -0.213714599609375, -0.16058349609375, -0.107452392578125, -0.0543212890625, -0.001190185546875, 0.05194091796875, 0.105072021484375, 0.158203125, 0.211334228515625, 0.26446533203125, 0.317596435546875, 0.3707275390625, 0.423858642578125, 0.47698974609375, 0.530120849609375, 0.583251953125, 0.636383056640625, 0.68951416015625, 0.742645263671875, 0.7957763671875, 0.848907470703125, 0.90203857421875, 0.955169677734375, 1.00830078125, 1.061431884765625, 1.11456298828125, 1.167694091796875, 1.2208251953125, 1.273956298828125, 1.32708740234375, 1.380218505859375, 1.433349609375, 1.486480712890625, 1.53961181640625, 1.592742919921875, 1.6458740234375, 1.699005126953125, 1.75213623046875, 1.805267333984375, 1.8583984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 6.0, 11.0, 3.0, 18.0, 21.0, 21.0, 32.0, 30.0, 36.0, 71.0, 103.0, 207.0, 145.0, 84.0, 43.0, 32.0, 25.0, 23.0, 19.0, 16.0, 14.0, 10.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0003323554992675781, -0.00032153353095054626, -0.0003107115626335144, -0.00029988959431648254, -0.0002890676259994507, -0.0002782456576824188, -0.00026742368936538696, -0.0002566017210483551, -0.00024577975273132324, -0.00023495778441429138, -0.00022413581609725952, -0.00021331384778022766, -0.0002024918794631958, -0.00019166991114616394, -0.00018084794282913208, -0.00017002597451210022, -0.00015920400619506836, -0.0001483820378780365, -0.00013756006956100464, -0.00012673810124397278, -0.00011591613292694092, -0.00010509416460990906, -9.42721962928772e-05, -8.345022797584534e-05, -7.262825965881348e-05, -6.180629134178162e-05, -5.0984323024749756e-05, -4.0162354707717896e-05, -2.9340386390686035e-05, -1.8518418073654175e-05, -7.696449756622314e-06, 3.125518560409546e-06, 1.3947486877441406e-05, 2.4769455194473267e-05, 3.559142351150513e-05, 4.641339182853699e-05, 5.723536014556885e-05, 6.805732846260071e-05, 7.887929677963257e-05, 8.970126509666443e-05, 0.00010052323341369629, 0.00011134520173072815, 0.00012216717004776, 0.00013298913836479187, 0.00014381110668182373, 0.0001546330749988556, 0.00016545504331588745, 0.0001762770116329193, 0.00018709897994995117, 0.00019792094826698303, 0.0002087429165840149, 0.00021956488490104675, 0.0002303868532180786, 0.00024120882153511047, 0.00025203078985214233, 0.0002628527581691742, 0.00027367472648620605, 0.0002844966948032379, 0.0002953186631202698, 0.00030614063143730164, 0.0003169625997543335, 0.00032778456807136536, 0.0003386065363883972, 0.0003494285047054291, 0.00036025047302246094]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 1.0, 5.0, 14.0, 5.0, 8.0, 15.0, 17.0, 23.0, 47.0, 48.0, 53.0, 106.0, 114.0, 179.0, 301.0, 516.0, 972.0, 1751.0, 4061.0, 10835.0, 42017.0, 713710.0, 232642.0, 26282.0, 8121.0, 3172.0, 1485.0, 793.0, 458.0, 242.0, 172.0, 112.0, 79.0, 58.0, 41.0, 31.0, 27.0, 13.0, 6.0, 6.0, 10.0, 5.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.346343994140625, -1.29620361328125, -1.246063232421875, -1.1959228515625, -1.145782470703125, -1.09564208984375, -1.045501708984375, -0.995361328125, -0.945220947265625, -0.89508056640625, -0.844940185546875, -0.7947998046875, -0.744659423828125, -0.69451904296875, -0.644378662109375, -0.59423828125, -0.544097900390625, -0.49395751953125, -0.443817138671875, -0.3936767578125, -0.343536376953125, -0.29339599609375, -0.243255615234375, -0.193115234375, -0.142974853515625, -0.09283447265625, -0.042694091796875, 0.0074462890625, 0.057586669921875, 0.10772705078125, 0.157867431640625, 0.2080078125, 0.258148193359375, 0.30828857421875, 0.358428955078125, 0.4085693359375, 0.458709716796875, 0.50885009765625, 0.558990478515625, 0.609130859375, 0.659271240234375, 0.70941162109375, 0.759552001953125, 0.8096923828125, 0.859832763671875, 0.90997314453125, 0.960113525390625, 1.01025390625, 1.060394287109375, 1.11053466796875, 1.160675048828125, 1.2108154296875, 1.260955810546875, 1.31109619140625, 1.361236572265625, 1.411376953125, 1.461517333984375, 1.51165771484375, 1.561798095703125, 1.6119384765625, 1.662078857421875, 1.71221923828125, 1.762359619140625, 1.8125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 3.0, 12.0, 14.0, 16.0, 19.0, 37.0, 59.0, 81.0, 119.0, 199.0, 151.0, 77.0, 42.0, 44.0, 35.0, 16.0, 12.0, 14.0, 4.0, 7.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6181640625, -1.5615997314453125, -1.505035400390625, -1.4484710693359375, -1.39190673828125, -1.3353424072265625, -1.278778076171875, -1.2222137451171875, -1.1656494140625, -1.1090850830078125, -1.052520751953125, -0.9959564208984375, -0.93939208984375, -0.8828277587890625, -0.826263427734375, -0.7696990966796875, -0.713134765625, -0.6565704345703125, -0.600006103515625, -0.5434417724609375, -0.48687744140625, -0.4303131103515625, -0.373748779296875, -0.3171844482421875, -0.2606201171875, -0.2040557861328125, -0.147491455078125, -0.0909271240234375, -0.03436279296875, 0.0222015380859375, 0.078765869140625, 0.1353302001953125, 0.19189453125, 0.2484588623046875, 0.305023193359375, 0.3615875244140625, 0.41815185546875, 0.4747161865234375, 0.531280517578125, 0.5878448486328125, 0.6444091796875, 0.7009735107421875, 0.757537841796875, 0.8141021728515625, 0.87066650390625, 0.9272308349609375, 0.983795166015625, 1.0403594970703125, 1.096923828125, 1.1534881591796875, 1.210052490234375, 1.2666168212890625, 1.32318115234375, 1.3797454833984375, 1.436309814453125, 1.4928741455078125, 1.5494384765625, 1.6060028076171875, 1.662567138671875, 1.7191314697265625, 1.77569580078125, 1.8322601318359375, 1.888824462890625, 1.9453887939453125, 2.001953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 12.0, 10.0, 31.0, 102.0, 238.0, 374.0, 147.0, 43.0, 16.0, 10.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.743255615234375, -37.613624572753906, -36.48399353027344, -35.3543586730957, -34.224727630615234, -33.095096588134766, -31.965463638305664, -30.835830688476562, -29.706199645996094, -28.576568603515625, -27.446935653686523, -26.317302703857422, -25.187671661376953, -24.058040618896484, -22.928407669067383, -21.79877471923828, -20.669143676757812, -19.539512634277344, -18.409879684448242, -17.28024673461914, -16.150615692138672, -15.020983695983887, -13.891351699829102, -12.761719703674316, -11.632087707519531, -10.502455711364746, -9.372823715209961, -8.243191719055176, -7.113559722900391, -5.9839277267456055, -4.85429573059082, -3.724663734436035, -2.5950279235839844, -1.4653959274291992, -0.33576393127441406, 0.7938680648803711, 1.9235000610351562, 3.0531320571899414, 4.182764053344727, 5.312396049499512, 6.442028045654297, 7.571660041809082, 8.701292037963867, 9.830924034118652, 10.960556030273438, 12.090188026428223, 13.219820022583008, 14.349452018737793, 15.479084014892578, 16.608715057373047, 17.73834800720215, 18.86798095703125, 19.99761199951172, 21.127243041992188, 22.25687599182129, 23.38650894165039, 24.51613998413086, 25.645771026611328, 26.77540397644043, 27.90503692626953, 29.03466796875, 30.16429901123047, 31.29393196105957, 32.42356491088867, 33.55319595336914]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 9.0, 12.0, 12.0, 9.0, 19.0, 12.0, 24.0, 17.0, 24.0, 28.0, 28.0, 43.0, 44.0, 55.0, 67.0, 68.0, 56.0, 67.0, 52.0, 49.0, 43.0, 43.0, 36.0, 35.0, 27.0, 14.0, 14.0, 9.0, 27.0, 9.0, 8.0, 9.0, 7.0, 9.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.664671897888184, -13.19759464263916, -12.730517387390137, -12.263440132141113, -11.796363830566406, -11.329286575317383, -10.86220932006836, -10.395132064819336, -9.928054809570312, -9.460977554321289, -8.993900299072266, -8.526823043823242, -8.059745788574219, -7.5926690101623535, -7.125592231750488, -6.658514976501465, -6.191437721252441, -5.724360466003418, -5.2572832107543945, -4.790206432342529, -4.323129177093506, -3.8560519218444824, -3.388974905014038, -2.9218978881835938, -2.4548206329345703, -1.9877434968948364, -1.5206663608551025, -1.0535892248153687, -0.5865120887756348, -0.11943483352661133, 0.347642183303833, 0.8147192001342773, 1.2817955017089844, 1.7488726377487183, 2.215949773788452, 2.6830267906188965, 3.15010404586792, 3.6171813011169434, 4.084258079528809, 4.551335334777832, 5.0184125900268555, 5.485489845275879, 5.952567100524902, 6.419643878936768, 6.886721134185791, 7.3537983894348145, 7.82087516784668, 8.287952423095703, 8.755029678344727, 9.22210693359375, 9.689184188842773, 10.156261444091797, 10.62333869934082, 11.090415954589844, 11.55749225616455, 12.024569511413574, 12.491646766662598, 12.958724021911621, 13.425801277160645, 13.892878532409668, 14.359954833984375, 14.827032089233398, 15.294109344482422, 15.761186599731445, 16.22826385498047]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 20.0, 9.0, 17.0, 22.0, 21.0, 31.0, 45.0, 75.0, 106.0, 157.0, 229.0, 410.0, 785.0, 1627.0, 4104.0, 13560.0, 80675.0, 2372923.0, 1642268.0, 59678.0, 10842.0, 3479.0, 1461.0, 642.0, 401.0, 229.0, 152.0, 84.0, 60.0, 50.0, 30.0, 25.0, 18.0, 15.0, 5.0, 11.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.123046875, -2.0655670166015625, -2.008087158203125, -1.9506072998046875, -1.89312744140625, -1.8356475830078125, -1.778167724609375, -1.7206878662109375, -1.6632080078125, -1.6057281494140625, -1.548248291015625, -1.4907684326171875, -1.43328857421875, -1.3758087158203125, -1.318328857421875, -1.2608489990234375, -1.203369140625, -1.1458892822265625, -1.088409423828125, -1.0309295654296875, -0.97344970703125, -0.9159698486328125, -0.858489990234375, -0.8010101318359375, -0.7435302734375, -0.6860504150390625, -0.628570556640625, -0.5710906982421875, -0.51361083984375, -0.4561309814453125, -0.398651123046875, -0.3411712646484375, -0.28369140625, -0.2262115478515625, -0.168731689453125, -0.1112518310546875, -0.05377197265625, 0.0037078857421875, 0.061187744140625, 0.1186676025390625, 0.1761474609375, 0.2336273193359375, 0.291107177734375, 0.3485870361328125, 0.40606689453125, 0.4635467529296875, 0.521026611328125, 0.5785064697265625, 0.635986328125, 0.6934661865234375, 0.750946044921875, 0.8084259033203125, 0.86590576171875, 0.9233856201171875, 0.980865478515625, 1.0383453369140625, 1.0958251953125, 1.1533050537109375, 1.210784912109375, 1.2682647705078125, 1.32574462890625, 1.3832244873046875, 1.440704345703125, 1.4981842041015625, 1.5556640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 8.0, 6.0, 12.0, 19.0, 23.0, 23.0, 25.0, 44.0, 40.0, 44.0, 59.0, 55.0, 55.0, 60.0, 66.0, 69.0, 55.0, 52.0, 46.0, 47.0, 38.0, 30.0, 32.0, 17.0, 17.0, 13.0, 8.0, 14.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.24609375, -1.2142868041992188, -1.1824798583984375, -1.1506729125976562, -1.118865966796875, -1.0870590209960938, -1.0552520751953125, -1.0234451293945312, -0.99163818359375, -0.9598312377929688, -0.9280242919921875, -0.8962173461914062, -0.864410400390625, -0.8326034545898438, -0.8007965087890625, -0.7689895629882812, -0.7371826171875, -0.7053756713867188, -0.6735687255859375, -0.6417617797851562, -0.609954833984375, -0.5781478881835938, -0.5463409423828125, -0.5145339965820312, -0.48272705078125, -0.45092010498046875, -0.4191131591796875, -0.38730621337890625, -0.355499267578125, -0.32369232177734375, -0.2918853759765625, -0.26007843017578125, -0.228271484375, -0.19646453857421875, -0.1646575927734375, -0.13285064697265625, -0.101043701171875, -0.06923675537109375, -0.0374298095703125, -0.00562286376953125, 0.02618408203125, 0.05799102783203125, 0.0897979736328125, 0.12160491943359375, 0.153411865234375, 0.18521881103515625, 0.2170257568359375, 0.24883270263671875, 0.2806396484375, 0.31244659423828125, 0.3442535400390625, 0.37606048583984375, 0.407867431640625, 0.43967437744140625, 0.4714813232421875, 0.5032882690429688, 0.53509521484375, 0.5669021606445312, 0.5987091064453125, 0.6305160522460938, 0.662322998046875, 0.6941299438476562, 0.7259368896484375, 0.7577438354492188, 0.78955078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 23.0, 39.0, 46.0, 69.0, 120.0, 182.0, 313.0, 546.0, 1091.0, 2641.0, 8765.0, 62946.0, 2846079.0, 1222434.0, 38811.0, 6291.0, 1938.0, 789.0, 438.0, 258.0, 151.0, 85.0, 66.0, 60.0, 29.0, 12.0, 18.0, 9.0, 4.0, 0.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.43914794921875, -2.3626708984375, -2.28619384765625, -2.209716796875, -2.13323974609375, -2.0567626953125, -1.98028564453125, -1.90380859375, -1.82733154296875, -1.7508544921875, -1.67437744140625, -1.597900390625, -1.52142333984375, -1.4449462890625, -1.36846923828125, -1.2919921875, -1.21551513671875, -1.1390380859375, -1.06256103515625, -0.986083984375, -0.90960693359375, -0.8331298828125, -0.75665283203125, -0.68017578125, -0.60369873046875, -0.5272216796875, -0.45074462890625, -0.374267578125, -0.29779052734375, -0.2213134765625, -0.14483642578125, -0.068359375, 0.00811767578125, 0.0845947265625, 0.16107177734375, 0.237548828125, 0.31402587890625, 0.3905029296875, 0.46697998046875, 0.54345703125, 0.61993408203125, 0.6964111328125, 0.77288818359375, 0.849365234375, 0.92584228515625, 1.0023193359375, 1.07879638671875, 1.1552734375, 1.23175048828125, 1.3082275390625, 1.38470458984375, 1.461181640625, 1.53765869140625, 1.6141357421875, 1.69061279296875, 1.76708984375, 1.84356689453125, 1.9200439453125, 1.99652099609375, 2.072998046875, 2.14947509765625, 2.2259521484375, 2.30242919921875, 2.37890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 12.0, 7.0, 33.0, 69.0, 142.0, 579.0, 1379.0, 1201.0, 388.0, 118.0, 73.0, 32.0, 16.0, 11.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.4962158203125, -3.375244140625, -3.2542724609375, -3.13330078125, -3.0123291015625, -2.891357421875, -2.7703857421875, -2.6494140625, -2.5284423828125, -2.407470703125, -2.2864990234375, -2.16552734375, -2.0445556640625, -1.923583984375, -1.8026123046875, -1.681640625, -1.5606689453125, -1.439697265625, -1.3187255859375, -1.19775390625, -1.0767822265625, -0.955810546875, -0.8348388671875, -0.7138671875, -0.5928955078125, -0.471923828125, -0.3509521484375, -0.22998046875, -0.1090087890625, 0.011962890625, 0.1329345703125, 0.25390625, 0.3748779296875, 0.495849609375, 0.6168212890625, 0.73779296875, 0.8587646484375, 0.979736328125, 1.1007080078125, 1.2216796875, 1.3426513671875, 1.463623046875, 1.5845947265625, 1.70556640625, 1.8265380859375, 1.947509765625, 2.0684814453125, 2.189453125, 2.3104248046875, 2.431396484375, 2.5523681640625, 2.67333984375, 2.7943115234375, 2.915283203125, 3.0362548828125, 3.1572265625, 3.2781982421875, 3.399169921875, 3.5201416015625, 3.64111328125, 3.7620849609375, 3.883056640625, 4.0040283203125, 4.125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 16.0, 27.0, 61.0, 175.0, 303.0, 239.0, 114.0, 32.0, 9.0, 7.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.57048797607422, -31.726947784423828, -30.883407592773438, -30.039867401123047, -29.196327209472656, -28.352787017822266, -27.509246826171875, -26.665706634521484, -25.822166442871094, -24.978626251220703, -24.135086059570312, -23.291545867919922, -22.44800567626953, -21.60446548461914, -20.76092529296875, -19.91738510131836, -19.07384490966797, -18.230304718017578, -17.386764526367188, -16.543224334716797, -15.699684143066406, -14.856143951416016, -14.012603759765625, -13.169063568115234, -12.325523376464844, -11.481983184814453, -10.638442993164062, -9.794902801513672, -8.951362609863281, -8.10782241821289, -7.2642822265625, -6.420742034912109, -5.577201843261719, -4.733661651611328, -3.8901214599609375, -3.046581268310547, -2.2030410766601562, -1.3595008850097656, -0.515960693359375, 0.3275794982910156, 1.1711196899414062, 2.014659881591797, 2.8582000732421875, 3.701740264892578, 4.545280456542969, 5.388820648193359, 6.23236083984375, 7.075901031494141, 7.919441223144531, 8.762981414794922, 9.606521606445312, 10.450061798095703, 11.293601989746094, 12.137142181396484, 12.980682373046875, 13.824222564697266, 14.667762756347656, 15.511302947998047, 16.354843139648438, 17.198383331298828, 18.04192352294922, 18.88546371459961, 19.72900390625, 20.57254409790039, 21.41608428955078]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 19.0, 24.0, 19.0, 39.0, 54.0, 59.0, 88.0, 114.0, 124.0, 115.0, 99.0, 79.0, 63.0, 42.0, 24.0, 9.0, 12.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.962499618530273, -21.369991302490234, -20.777481079101562, -20.184972763061523, -19.592464447021484, -18.999956130981445, -18.407447814941406, -17.814937591552734, -17.222429275512695, -16.629920959472656, -16.037410736083984, -15.444902420043945, -14.852394104003906, -14.259885787963867, -13.667376518249512, -13.074867248535156, -12.482358932495117, -11.889850616455078, -11.297341346740723, -10.704832077026367, -10.112323760986328, -9.519815444946289, -8.927306175231934, -8.334796905517578, -7.742288589477539, -7.149779796600342, -6.5572710037231445, -5.964762210845947, -5.37225341796875, -4.779744625091553, -4.1872358322143555, -3.594727039337158, -3.0022201538085938, -2.4097113609313965, -1.8172025680541992, -1.224693775177002, -0.6321849822998047, -0.03967618942260742, 0.5528326034545898, 1.145341396331787, 1.7378501892089844, 2.3303589820861816, 2.922867774963379, 3.515376567840576, 4.107885360717773, 4.700394153594971, 5.292902946472168, 5.885411739349365, 6.4779205322265625, 7.07042932510376, 7.662938117980957, 8.255447387695312, 8.847955703735352, 9.44046401977539, 10.032973289489746, 10.625482559204102, 11.21799087524414, 11.81049919128418, 12.403008460998535, 12.99551773071289, 13.58802604675293, 14.180534362792969, 14.773043632507324, 15.36555290222168, 15.958061218261719]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 12.0, 9.0, 13.0, 23.0, 29.0, 38.0, 57.0, 71.0, 84.0, 128.0, 240.0, 371.0, 635.0, 1230.0, 2664.0, 7036.0, 22328.0, 99135.0, 513193.0, 318948.0, 58282.0, 14793.0, 4810.0, 2025.0, 933.0, 506.0, 307.0, 178.0, 125.0, 88.0, 59.0, 40.0, 36.0, 27.0, 29.0, 19.0, 5.0, 12.0, 7.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.08203125, -2.0204925537109375, -1.958953857421875, -1.8974151611328125, -1.83587646484375, -1.7743377685546875, -1.712799072265625, -1.6512603759765625, -1.5897216796875, -1.5281829833984375, -1.466644287109375, -1.4051055908203125, -1.34356689453125, -1.2820281982421875, -1.220489501953125, -1.1589508056640625, -1.097412109375, -1.0358734130859375, -0.974334716796875, -0.9127960205078125, -0.85125732421875, -0.7897186279296875, -0.728179931640625, -0.6666412353515625, -0.6051025390625, -0.5435638427734375, -0.482025146484375, -0.4204864501953125, -0.35894775390625, -0.2974090576171875, -0.235870361328125, -0.1743316650390625, -0.11279296875, -0.0512542724609375, 0.010284423828125, 0.0718231201171875, 0.13336181640625, 0.1949005126953125, 0.256439208984375, 0.3179779052734375, 0.3795166015625, 0.4410552978515625, 0.502593994140625, 0.5641326904296875, 0.62567138671875, 0.6872100830078125, 0.748748779296875, 0.8102874755859375, 0.871826171875, 0.9333648681640625, 0.994903564453125, 1.0564422607421875, 1.11798095703125, 1.1795196533203125, 1.241058349609375, 1.3025970458984375, 1.3641357421875, 1.4256744384765625, 1.487213134765625, 1.5487518310546875, 1.61029052734375, 1.6718292236328125, 1.733367919921875, 1.7949066162109375, 1.8564453125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 10.0, 6.0, 4.0, 2.0, 9.0, 14.0, 17.0, 29.0, 35.0, 35.0, 47.0, 49.0, 51.0, 71.0, 65.0, 73.0, 64.0, 80.0, 71.0, 55.0, 51.0, 45.0, 19.0, 22.0, 33.0, 17.0, 20.0, 4.0, 7.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7373046875, -0.701751708984375, -0.66619873046875, -0.630645751953125, -0.5950927734375, -0.559539794921875, -0.52398681640625, -0.488433837890625, -0.452880859375, -0.417327880859375, -0.38177490234375, -0.346221923828125, -0.3106689453125, -0.275115966796875, -0.23956298828125, -0.204010009765625, -0.16845703125, -0.132904052734375, -0.09735107421875, -0.061798095703125, -0.0262451171875, 0.009307861328125, 0.04486083984375, 0.080413818359375, 0.115966796875, 0.151519775390625, 0.18707275390625, 0.222625732421875, 0.2581787109375, 0.293731689453125, 0.32928466796875, 0.364837646484375, 0.400390625, 0.435943603515625, 0.47149658203125, 0.507049560546875, 0.5426025390625, 0.578155517578125, 0.61370849609375, 0.649261474609375, 0.684814453125, 0.720367431640625, 0.75592041015625, 0.791473388671875, 0.8270263671875, 0.862579345703125, 0.89813232421875, 0.933685302734375, 0.96923828125, 1.004791259765625, 1.04034423828125, 1.075897216796875, 1.1114501953125, 1.147003173828125, 1.18255615234375, 1.218109130859375, 1.253662109375, 1.289215087890625, 1.32476806640625, 1.360321044921875, 1.3958740234375, 1.431427001953125, 1.46697998046875, 1.502532958984375, 1.5380859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 9.0, 8.0, 22.0, 27.0, 40.0, 62.0, 84.0, 180.0, 287.0, 558.0, 1154.0, 3088.0, 12705.0, 150014.0, 831051.0, 39467.0, 6078.0, 1943.0, 791.0, 379.0, 221.0, 113.0, 71.0, 53.0, 31.0, 28.0, 16.0, 14.0, 9.0, 4.0, 8.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4892578125, -4.345703125, -4.2021484375, -4.05859375, -3.9150390625, -3.771484375, -3.6279296875, -3.484375, -3.3408203125, -3.197265625, -3.0537109375, -2.91015625, -2.7666015625, -2.623046875, -2.4794921875, -2.3359375, -2.1923828125, -2.048828125, -1.9052734375, -1.76171875, -1.6181640625, -1.474609375, -1.3310546875, -1.1875, -1.0439453125, -0.900390625, -0.7568359375, -0.61328125, -0.4697265625, -0.326171875, -0.1826171875, -0.0390625, 0.1044921875, 0.248046875, 0.3916015625, 0.53515625, 0.6787109375, 0.822265625, 0.9658203125, 1.109375, 1.2529296875, 1.396484375, 1.5400390625, 1.68359375, 1.8271484375, 1.970703125, 2.1142578125, 2.2578125, 2.4013671875, 2.544921875, 2.6884765625, 2.83203125, 2.9755859375, 3.119140625, 3.2626953125, 3.40625, 3.5498046875, 3.693359375, 3.8369140625, 3.98046875, 4.1240234375, 4.267578125, 4.4111328125, 4.5546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 15.0, 24.0, 17.0, 31.0, 29.0, 40.0, 37.0, 69.0, 80.0, 69.0, 60.0, 81.0, 82.0, 72.0, 66.0, 43.0, 37.0, 21.0, 20.0, 19.0, 16.0, 13.0, 7.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.73516845703125, -4.5718994140625, -4.40863037109375, -4.245361328125, -4.08209228515625, -3.9188232421875, -3.75555419921875, -3.59228515625, -3.42901611328125, -3.2657470703125, -3.10247802734375, -2.939208984375, -2.77593994140625, -2.6126708984375, -2.44940185546875, -2.2861328125, -2.12286376953125, -1.9595947265625, -1.79632568359375, -1.633056640625, -1.46978759765625, -1.3065185546875, -1.14324951171875, -0.97998046875, -0.81671142578125, -0.6534423828125, -0.49017333984375, -0.326904296875, -0.16363525390625, -0.0003662109375, 0.16290283203125, 0.326171875, 0.48944091796875, 0.6527099609375, 0.81597900390625, 0.979248046875, 1.14251708984375, 1.3057861328125, 1.46905517578125, 1.63232421875, 1.79559326171875, 1.9588623046875, 2.12213134765625, 2.285400390625, 2.44866943359375, 2.6119384765625, 2.77520751953125, 2.9384765625, 3.10174560546875, 3.2650146484375, 3.42828369140625, 3.591552734375, 3.75482177734375, 3.9180908203125, 4.08135986328125, 4.24462890625, 4.40789794921875, 4.5711669921875, 4.73443603515625, 4.897705078125, 5.06097412109375, 5.2242431640625, 5.38751220703125, 5.55078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 9.0, 14.0, 24.0, 29.0, 26.0, 73.0, 97.0, 137.0, 267.0, 559.0, 1226.0, 3257.0, 12807.0, 110832.0, 872083.0, 36653.0, 6561.0, 2070.0, 829.0, 380.0, 202.0, 128.0, 82.0, 54.0, 32.0, 21.0, 19.0, 14.0, 8.0, 11.0, 4.0, 8.0, 6.0, 2.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.115234375, -2.049713134765625, -1.98419189453125, -1.918670654296875, -1.8531494140625, -1.787628173828125, -1.72210693359375, -1.656585693359375, -1.591064453125, -1.525543212890625, -1.46002197265625, -1.394500732421875, -1.3289794921875, -1.263458251953125, -1.19793701171875, -1.132415771484375, -1.06689453125, -1.001373291015625, -0.93585205078125, -0.870330810546875, -0.8048095703125, -0.739288330078125, -0.67376708984375, -0.608245849609375, -0.542724609375, -0.477203369140625, -0.41168212890625, -0.346160888671875, -0.2806396484375, -0.215118408203125, -0.14959716796875, -0.084075927734375, -0.0185546875, 0.046966552734375, 0.11248779296875, 0.178009033203125, 0.2435302734375, 0.309051513671875, 0.37457275390625, 0.440093994140625, 0.505615234375, 0.571136474609375, 0.63665771484375, 0.702178955078125, 0.7677001953125, 0.833221435546875, 0.89874267578125, 0.964263916015625, 1.02978515625, 1.095306396484375, 1.16082763671875, 1.226348876953125, 1.2918701171875, 1.357391357421875, 1.42291259765625, 1.488433837890625, 1.553955078125, 1.619476318359375, 1.68499755859375, 1.750518798828125, 1.8160400390625, 1.881561279296875, 1.94708251953125, 2.012603759765625, 2.078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 8.0, 12.0, 7.0, 8.0, 16.0, 14.0, 12.0, 13.0, 29.0, 33.0, 70.0, 105.0, 160.0, 168.0, 102.0, 50.0, 33.0, 25.0, 17.0, 13.0, 13.0, 17.0, 10.0, 4.0, 5.0, 9.0, 3.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00030231475830078125, -0.0002931058406829834, -0.00028389692306518555, -0.0002746880054473877, -0.00026547908782958984, -0.000256270170211792, -0.00024706125259399414, -0.0002378523349761963, -0.00022864341735839844, -0.00021943449974060059, -0.00021022558212280273, -0.00020101666450500488, -0.00019180774688720703, -0.00018259882926940918, -0.00017338991165161133, -0.00016418099403381348, -0.00015497207641601562, -0.00014576315879821777, -0.00013655424118041992, -0.00012734532356262207, -0.00011813640594482422, -0.00010892748832702637, -9.971857070922852e-05, -9.050965309143066e-05, -8.130073547363281e-05, -7.209181785583496e-05, -6.288290023803711e-05, -5.367398262023926e-05, -4.4465065002441406e-05, -3.5256147384643555e-05, -2.6047229766845703e-05, -1.683831214904785e-05, -7.62939453125e-06, 1.5795230865478516e-06, 1.0788440704345703e-05, 1.9997358322143555e-05, 2.9206275939941406e-05, 3.841519355773926e-05, 4.762411117553711e-05, 5.683302879333496e-05, 6.604194641113281e-05, 7.525086402893066e-05, 8.445978164672852e-05, 9.366869926452637e-05, 0.00010287761688232422, 0.00011208653450012207, 0.00012129545211791992, 0.00013050436973571777, 0.00013971328735351562, 0.00014892220497131348, 0.00015813112258911133, 0.00016734004020690918, 0.00017654895782470703, 0.00018575787544250488, 0.00019496679306030273, 0.00020417571067810059, 0.00021338462829589844, 0.0002225935459136963, 0.00023180246353149414, 0.000241011381149292, 0.00025022029876708984, 0.0002594292163848877, 0.00026863813400268555, 0.0002778470516204834, 0.00028705596923828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 3.0, 8.0, 4.0, 8.0, 18.0, 23.0, 28.0, 45.0, 47.0, 68.0, 95.0, 131.0, 203.0, 233.0, 357.0, 633.0, 1050.0, 2071.0, 4715.0, 11965.0, 36370.0, 279697.0, 638041.0, 46886.0, 14432.0, 5764.0, 2429.0, 1200.0, 696.0, 450.0, 258.0, 164.0, 126.0, 82.0, 46.0, 55.0, 35.0, 37.0, 15.0, 19.0, 11.0, 12.0, 4.0, 5.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.2705078125, -1.23211669921875, -1.1937255859375, -1.15533447265625, -1.116943359375, -1.07855224609375, -1.0401611328125, -1.00177001953125, -0.96337890625, -0.92498779296875, -0.8865966796875, -0.84820556640625, -0.809814453125, -0.77142333984375, -0.7330322265625, -0.69464111328125, -0.65625, -0.61785888671875, -0.5794677734375, -0.54107666015625, -0.502685546875, -0.46429443359375, -0.4259033203125, -0.38751220703125, -0.34912109375, -0.31072998046875, -0.2723388671875, -0.23394775390625, -0.195556640625, -0.15716552734375, -0.1187744140625, -0.08038330078125, -0.0419921875, -0.00360107421875, 0.0347900390625, 0.07318115234375, 0.111572265625, 0.14996337890625, 0.1883544921875, 0.22674560546875, 0.26513671875, 0.30352783203125, 0.3419189453125, 0.38031005859375, 0.418701171875, 0.45709228515625, 0.4954833984375, 0.53387451171875, 0.572265625, 0.61065673828125, 0.6490478515625, 0.68743896484375, 0.725830078125, 0.76422119140625, 0.8026123046875, 0.84100341796875, 0.87939453125, 0.91778564453125, 0.9561767578125, 0.99456787109375, 1.032958984375, 1.07135009765625, 1.1097412109375, 1.14813232421875, 1.1865234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 3.0, 4.0, 6.0, 7.0, 13.0, 11.0, 24.0, 29.0, 47.0, 76.0, 111.0, 160.0, 144.0, 108.0, 68.0, 43.0, 30.0, 24.0, 13.0, 10.0, 9.0, 7.0, 6.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.244140625, -1.2050323486328125, -1.165924072265625, -1.1268157958984375, -1.08770751953125, -1.0485992431640625, -1.009490966796875, -0.9703826904296875, -0.9312744140625, -0.8921661376953125, -0.853057861328125, -0.8139495849609375, -0.77484130859375, -0.7357330322265625, -0.696624755859375, -0.6575164794921875, -0.618408203125, -0.5792999267578125, -0.540191650390625, -0.5010833740234375, -0.46197509765625, -0.4228668212890625, -0.383758544921875, -0.3446502685546875, -0.3055419921875, -0.2664337158203125, -0.227325439453125, -0.1882171630859375, -0.14910888671875, -0.1100006103515625, -0.070892333984375, -0.0317840576171875, 0.00732421875, 0.0464324951171875, 0.085540771484375, 0.1246490478515625, 0.16375732421875, 0.2028656005859375, 0.241973876953125, 0.2810821533203125, 0.3201904296875, 0.3592987060546875, 0.398406982421875, 0.4375152587890625, 0.47662353515625, 0.5157318115234375, 0.554840087890625, 0.5939483642578125, 0.633056640625, 0.6721649169921875, 0.711273193359375, 0.7503814697265625, 0.78948974609375, 0.8285980224609375, 0.867706298828125, 0.9068145751953125, 0.9459228515625, 0.9850311279296875, 1.024139404296875, 1.0632476806640625, 1.10235595703125, 1.1414642333984375, 1.180572509765625, 1.2196807861328125, 1.2587890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 12.0, 18.0, 38.0, 155.0, 369.0, 276.0, 67.0, 31.0, 6.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.00312805175781, -36.84510803222656, -35.68709182739258, -34.52907180786133, -33.37105178833008, -32.213035583496094, -31.055015563964844, -29.896995544433594, -28.738977432250977, -27.58095932006836, -26.42293930053711, -25.264921188354492, -24.106903076171875, -22.948883056640625, -21.790864944458008, -20.63284683227539, -19.47482681274414, -18.316808700561523, -17.158788681030273, -16.000770568847656, -14.842751502990723, -13.684732437133789, -12.526714324951172, -11.368695259094238, -10.210676193237305, -9.052657127380371, -7.894638538360596, -6.73661994934082, -5.578600883483887, -4.420581817626953, -3.2625632286071777, -2.1045446395874023, -0.9465217590332031, 0.21149706840515137, 1.3695158958435059, 2.5275347232818604, 3.685553550720215, 4.843572616577148, 6.001591205596924, 7.159609794616699, 8.317628860473633, 9.475647926330566, 10.6336669921875, 11.791685104370117, 12.94970417022705, 14.107723236083984, 15.265741348266602, 16.42375946044922, 17.58177947998047, 18.739797592163086, 19.897817611694336, 21.055835723876953, 22.213855743408203, 23.37187385559082, 24.529891967773438, 25.687911987304688, 26.845930099487305, 28.003948211669922, 29.161968231201172, 30.31998634338379, 31.478004455566406, 32.636024475097656, 33.794044494628906, 34.95206069946289, 36.11008071899414]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 4.0, 4.0, 8.0, 10.0, 13.0, 14.0, 15.0, 18.0, 19.0, 26.0, 24.0, 46.0, 43.0, 51.0, 57.0, 66.0, 85.0, 70.0, 65.0, 55.0, 40.0, 44.0, 44.0, 32.0, 19.0, 14.0, 21.0, 16.0, 18.0, 11.0, 15.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0589599609375, -16.572635650634766, -16.08631134033203, -15.59998607635498, -15.113661766052246, -14.627336502075195, -14.141012191772461, -13.654687881469727, -13.168363571166992, -12.682039260864258, -12.195713996887207, -11.709389686584473, -11.223065376281738, -10.736740112304688, -10.250415802001953, -9.764091491699219, -9.277767181396484, -8.79144287109375, -8.3051176071167, -7.818793296813965, -7.3324689865112305, -6.846144199371338, -6.359819412231445, -5.873495101928711, -5.38716983795166, -4.900845050811768, -4.414520740509033, -3.9281959533691406, -3.4418716430664062, -2.9555468559265137, -2.4692223072052, -1.9828977584838867, -1.4965734481811523, -1.0102488994598389, -0.5239242911338806, -0.03759968280792236, 0.4487248659133911, 0.9350495338439941, 1.4213740825653076, 1.907698631286621, 2.3940231800079346, 2.880347728729248, 3.3666722774505615, 3.852996826171875, 4.339321613311768, 4.82564640045166, 5.3119707107543945, 5.798295021057129, 6.2846198081970215, 6.770944595336914, 7.257268905639648, 7.743593692779541, 8.229918479919434, 8.716242790222168, 9.202567100524902, 9.688892364501953, 10.175216674804688, 10.661540985107422, 11.147866249084473, 11.634190559387207, 12.120514869689941, 12.606840133666992, 13.093164443969727, 13.579488754272461, 14.065813064575195]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 10.0, 17.0, 20.0, 24.0, 35.0, 51.0, 78.0, 131.0, 255.0, 436.0, 921.0, 2413.0, 8023.0, 58271.0, 3413676.0, 680727.0, 21096.0, 4642.0, 1762.0, 757.0, 374.0, 218.0, 123.0, 72.0, 45.0, 25.0, 18.0, 25.0, 14.0, 3.0, 4.0, 3.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0234375, -2.941253662109375, -2.85906982421875, -2.776885986328125, -2.6947021484375, -2.612518310546875, -2.53033447265625, -2.448150634765625, -2.365966796875, -2.283782958984375, -2.20159912109375, -2.119415283203125, -2.0372314453125, -1.955047607421875, -1.87286376953125, -1.790679931640625, -1.70849609375, -1.626312255859375, -1.54412841796875, -1.461944580078125, -1.3797607421875, -1.297576904296875, -1.21539306640625, -1.133209228515625, -1.051025390625, -0.968841552734375, -0.88665771484375, -0.804473876953125, -0.7222900390625, -0.640106201171875, -0.55792236328125, -0.475738525390625, -0.3935546875, -0.311370849609375, -0.22918701171875, -0.147003173828125, -0.0648193359375, 0.017364501953125, 0.09954833984375, 0.181732177734375, 0.263916015625, 0.346099853515625, 0.42828369140625, 0.510467529296875, 0.5926513671875, 0.674835205078125, 0.75701904296875, 0.839202880859375, 0.92138671875, 1.003570556640625, 1.08575439453125, 1.167938232421875, 1.2501220703125, 1.332305908203125, 1.41448974609375, 1.496673583984375, 1.578857421875, 1.661041259765625, 1.74322509765625, 1.825408935546875, 1.9075927734375, 1.989776611328125, 2.07196044921875, 2.154144287109375, 2.236328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 10.0, 12.0, 8.0, 12.0, 22.0, 44.0, 40.0, 45.0, 81.0, 68.0, 81.0, 66.0, 75.0, 70.0, 76.0, 54.0, 52.0, 43.0, 48.0, 28.0, 21.0, 14.0, 10.0, 8.0, 2.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.0981903076171875, -1.060638427734375, -1.0230865478515625, -0.98553466796875, -0.9479827880859375, -0.910430908203125, -0.8728790283203125, -0.8353271484375, -0.7977752685546875, -0.760223388671875, -0.7226715087890625, -0.68511962890625, -0.6475677490234375, -0.610015869140625, -0.5724639892578125, -0.534912109375, -0.4973602294921875, -0.459808349609375, -0.4222564697265625, -0.38470458984375, -0.3471527099609375, -0.309600830078125, -0.2720489501953125, -0.2344970703125, -0.1969451904296875, -0.159393310546875, -0.1218414306640625, -0.08428955078125, -0.0467376708984375, -0.009185791015625, 0.0283660888671875, 0.06591796875, 0.1034698486328125, 0.141021728515625, 0.1785736083984375, 0.21612548828125, 0.2536773681640625, 0.291229248046875, 0.3287811279296875, 0.3663330078125, 0.4038848876953125, 0.441436767578125, 0.4789886474609375, 0.51654052734375, 0.5540924072265625, 0.591644287109375, 0.6291961669921875, 0.666748046875, 0.7042999267578125, 0.741851806640625, 0.7794036865234375, 0.81695556640625, 0.8545074462890625, 0.892059326171875, 0.9296112060546875, 0.9671630859375, 1.0047149658203125, 1.042266845703125, 1.0798187255859375, 1.11737060546875, 1.1549224853515625, 1.192474365234375, 1.2300262451171875, 1.267578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 10.0, 14.0, 15.0, 35.0, 58.0, 91.0, 169.0, 314.0, 637.0, 1228.0, 2644.0, 9633.0, 738979.0, 3420603.0, 14453.0, 2989.0, 1179.0, 547.0, 288.0, 155.0, 86.0, 56.0, 36.0, 24.0, 9.0, 12.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.9453125, -5.79327392578125, -5.6412353515625, -5.48919677734375, -5.337158203125, -5.18511962890625, -5.0330810546875, -4.88104248046875, -4.72900390625, -4.57696533203125, -4.4249267578125, -4.27288818359375, -4.120849609375, -3.96881103515625, -3.8167724609375, -3.66473388671875, -3.5126953125, -3.36065673828125, -3.2086181640625, -3.05657958984375, -2.904541015625, -2.75250244140625, -2.6004638671875, -2.44842529296875, -2.29638671875, -2.14434814453125, -1.9923095703125, -1.84027099609375, -1.688232421875, -1.53619384765625, -1.3841552734375, -1.23211669921875, -1.080078125, -0.92803955078125, -0.7760009765625, -0.62396240234375, -0.471923828125, -0.31988525390625, -0.1678466796875, -0.01580810546875, 0.13623046875, 0.28826904296875, 0.4403076171875, 0.59234619140625, 0.744384765625, 0.89642333984375, 1.0484619140625, 1.20050048828125, 1.3525390625, 1.50457763671875, 1.6566162109375, 1.80865478515625, 1.960693359375, 2.11273193359375, 2.2647705078125, 2.41680908203125, 2.56884765625, 2.72088623046875, 2.8729248046875, 3.02496337890625, 3.177001953125, 3.32904052734375, 3.4810791015625, 3.63311767578125, 3.78515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 2.0, 10.0, 25.0, 65.0, 241.0, 1347.0, 1833.0, 393.0, 98.0, 30.0, 15.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.00390625, -4.83221435546875, -4.6605224609375, -4.48883056640625, -4.317138671875, -4.14544677734375, -3.9737548828125, -3.80206298828125, -3.63037109375, -3.45867919921875, -3.2869873046875, -3.11529541015625, -2.943603515625, -2.77191162109375, -2.6002197265625, -2.42852783203125, -2.2568359375, -2.08514404296875, -1.9134521484375, -1.74176025390625, -1.570068359375, -1.39837646484375, -1.2266845703125, -1.05499267578125, -0.88330078125, -0.71160888671875, -0.5399169921875, -0.36822509765625, -0.196533203125, -0.02484130859375, 0.1468505859375, 0.31854248046875, 0.490234375, 0.66192626953125, 0.8336181640625, 1.00531005859375, 1.177001953125, 1.34869384765625, 1.5203857421875, 1.69207763671875, 1.86376953125, 2.03546142578125, 2.2071533203125, 2.37884521484375, 2.550537109375, 2.72222900390625, 2.8939208984375, 3.06561279296875, 3.2373046875, 3.40899658203125, 3.5806884765625, 3.75238037109375, 3.924072265625, 4.09576416015625, 4.2674560546875, 4.43914794921875, 4.61083984375, 4.78253173828125, 4.9542236328125, 5.12591552734375, 5.297607421875, 5.46929931640625, 5.6409912109375, 5.81268310546875, 5.984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 15.0, 13.0, 163.0, 637.0, 147.0, 19.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.47325897216797, -99.37967681884766, -97.28609466552734, -95.1925048828125, -93.09892272949219, -91.00534057617188, -88.91175842285156, -86.81817626953125, -84.72459411621094, -82.63101196289062, -80.53742980957031, -78.44384765625, -76.35025787353516, -74.25667572021484, -72.16309356689453, -70.06951141357422, -67.97592163085938, -65.88233947753906, -63.788753509521484, -61.69517135620117, -59.60158920288086, -57.50800323486328, -55.41442108154297, -53.320838928222656, -51.227256774902344, -49.13367462158203, -47.04008865356445, -44.94650650024414, -42.85292434692383, -40.75933837890625, -38.66575622558594, -36.572174072265625, -34.47859573364258, -32.385013580322266, -30.29142951965332, -28.197845458984375, -26.104263305664062, -24.010679244995117, -21.917095184326172, -19.82351303100586, -17.729928970336914, -15.636345863342285, -13.542762756347656, -11.449178695678711, -9.355595588684082, -7.262012481689453, -5.168428421020508, -3.074845314025879, -0.98126220703125, 1.112321138381958, 3.205904483795166, 5.299488067626953, 7.393071174621582, 9.486654281616211, 11.580238342285156, 13.673821449279785, 15.767404556274414, 17.86098861694336, 19.954570770263672, 22.048154830932617, 24.141738891601562, 26.235321044921875, 28.32890510559082, 30.422489166259766, 32.51607131958008]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 5.0, 13.0, 37.0, 75.0, 112.0, 173.0, 174.0, 174.0, 128.0, 68.0, 25.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.481294631958008, -19.55712127685547, -18.63294792175293, -17.70877456665039, -16.78459930419922, -15.86042594909668, -14.93625259399414, -14.012079238891602, -13.087904930114746, -12.163731575012207, -11.239557266235352, -10.315383911132812, -9.391210556030273, -8.467036247253418, -7.542862892150879, -6.618689060211182, -5.694515228271484, -4.770341396331787, -3.846167802810669, -2.921994209289551, -1.9978203773498535, -1.0736465454101562, -0.1494731903076172, 0.7747006416320801, 1.6988744735717773, 2.6230483055114746, 3.5472218990325928, 4.471395492553711, 5.395569324493408, 6.3197431564331055, 7.2439165115356445, 8.1680908203125, 9.092266082763672, 10.016439437866211, 10.940613746643066, 11.864787101745605, 12.788961410522461, 13.713134765625, 14.637308120727539, 15.561481475830078, 16.48565673828125, 17.40983009338379, 18.334003448486328, 19.2581787109375, 20.18235206604004, 21.106525421142578, 22.030698776245117, 22.954872131347656, 23.879045486450195, 24.803218841552734, 25.727392196655273, 26.651565551757812, 27.575740814208984, 28.499914169311523, 29.424087524414062, 30.3482608795166, 31.27243423461914, 32.19660949707031, 33.12078094482422, 34.04495620727539, 34.9691276550293, 35.89330291748047, 36.817474365234375, 37.74164962768555, 38.66582489013672]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 8.0, 9.0, 8.0, 9.0, 14.0, 23.0, 26.0, 37.0, 50.0, 85.0, 115.0, 178.0, 298.0, 522.0, 1119.0, 3289.0, 12030.0, 72804.0, 554540.0, 350048.0, 40824.0, 8021.0, 2316.0, 943.0, 450.0, 268.0, 163.0, 85.0, 61.0, 60.0, 34.0, 22.0, 16.0, 23.0, 14.0, 9.0, 7.0, 8.0, 1.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8515625, -1.78509521484375, -1.7186279296875, -1.65216064453125, -1.585693359375, -1.51922607421875, -1.4527587890625, -1.38629150390625, -1.31982421875, -1.25335693359375, -1.1868896484375, -1.12042236328125, -1.053955078125, -0.98748779296875, -0.9210205078125, -0.85455322265625, -0.7880859375, -0.72161865234375, -0.6551513671875, -0.58868408203125, -0.522216796875, -0.45574951171875, -0.3892822265625, -0.32281494140625, -0.25634765625, -0.18988037109375, -0.1234130859375, -0.05694580078125, 0.009521484375, 0.07598876953125, 0.1424560546875, 0.20892333984375, 0.275390625, 0.34185791015625, 0.4083251953125, 0.47479248046875, 0.541259765625, 0.60772705078125, 0.6741943359375, 0.74066162109375, 0.80712890625, 0.87359619140625, 0.9400634765625, 1.00653076171875, 1.072998046875, 1.13946533203125, 1.2059326171875, 1.27239990234375, 1.3388671875, 1.40533447265625, 1.4718017578125, 1.53826904296875, 1.604736328125, 1.67120361328125, 1.7376708984375, 1.80413818359375, 1.87060546875, 1.93707275390625, 2.0035400390625, 2.07000732421875, 2.136474609375, 2.20294189453125, 2.2694091796875, 2.33587646484375, 2.40234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 12.0, 6.0, 4.0, 9.0, 11.0, 18.0, 28.0, 30.0, 46.0, 39.0, 46.0, 65.0, 46.0, 61.0, 53.0, 63.0, 68.0, 39.0, 61.0, 41.0, 50.0, 38.0, 32.0, 31.0, 17.0, 20.0, 16.0, 17.0, 11.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.029296875, -0.9992904663085938, -0.9692840576171875, -0.9392776489257812, -0.909271240234375, -0.8792648315429688, -0.8492584228515625, -0.8192520141601562, -0.78924560546875, -0.7592391967773438, -0.7292327880859375, -0.6992263793945312, -0.669219970703125, -0.6392135620117188, -0.6092071533203125, -0.5792007446289062, -0.5491943359375, -0.5191879272460938, -0.4891815185546875, -0.45917510986328125, -0.429168701171875, -0.39916229248046875, -0.3691558837890625, -0.33914947509765625, -0.30914306640625, -0.27913665771484375, -0.2491302490234375, -0.21912384033203125, -0.189117431640625, -0.15911102294921875, -0.1291046142578125, -0.09909820556640625, -0.069091796875, -0.03908538818359375, -0.0090789794921875, 0.02092742919921875, 0.050933837890625, 0.08094024658203125, 0.1109466552734375, 0.14095306396484375, 0.17095947265625, 0.20096588134765625, 0.2309722900390625, 0.26097869873046875, 0.290985107421875, 0.32099151611328125, 0.3509979248046875, 0.38100433349609375, 0.4110107421875, 0.44101715087890625, 0.4710235595703125, 0.5010299682617188, 0.531036376953125, 0.5610427856445312, 0.5910491943359375, 0.6210556030273438, 0.65106201171875, 0.6810684204101562, 0.7110748291015625, 0.7410812377929688, 0.771087646484375, 0.8010940551757812, 0.8311004638671875, 0.8611068725585938, 0.89111328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 16.0, 17.0, 25.0, 31.0, 56.0, 59.0, 104.0, 176.0, 320.0, 583.0, 1231.0, 2844.0, 7836.0, 26142.0, 116573.0, 596738.0, 228001.0, 47229.0, 12729.0, 4342.0, 1750.0, 716.0, 396.0, 208.0, 127.0, 85.0, 62.0, 43.0, 33.0, 16.0, 5.0, 16.0, 5.0, 13.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.41015625, -1.3610382080078125, -1.311920166015625, -1.2628021240234375, -1.21368408203125, -1.1645660400390625, -1.115447998046875, -1.0663299560546875, -1.0172119140625, -0.9680938720703125, -0.918975830078125, -0.8698577880859375, -0.82073974609375, -0.7716217041015625, -0.722503662109375, -0.6733856201171875, -0.624267578125, -0.5751495361328125, -0.526031494140625, -0.4769134521484375, -0.42779541015625, -0.3786773681640625, -0.329559326171875, -0.2804412841796875, -0.2313232421875, -0.1822052001953125, -0.133087158203125, -0.0839691162109375, -0.03485107421875, 0.0142669677734375, 0.063385009765625, 0.1125030517578125, 0.16162109375, 0.2107391357421875, 0.259857177734375, 0.3089752197265625, 0.35809326171875, 0.4072113037109375, 0.456329345703125, 0.5054473876953125, 0.5545654296875, 0.6036834716796875, 0.652801513671875, 0.7019195556640625, 0.75103759765625, 0.8001556396484375, 0.849273681640625, 0.8983917236328125, 0.947509765625, 0.9966278076171875, 1.045745849609375, 1.0948638916015625, 1.14398193359375, 1.1930999755859375, 1.242218017578125, 1.2913360595703125, 1.3404541015625, 1.3895721435546875, 1.438690185546875, 1.4878082275390625, 1.53692626953125, 1.5860443115234375, 1.635162353515625, 1.6842803955078125, 1.7333984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 6.0, 10.0, 9.0, 12.0, 14.0, 22.0, 17.0, 21.0, 36.0, 33.0, 45.0, 44.0, 67.0, 63.0, 45.0, 62.0, 42.0, 39.0, 51.0, 61.0, 33.0, 46.0, 36.0, 31.0, 22.0, 21.0, 21.0, 10.0, 15.0, 12.0, 8.0, 10.0, 8.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.69049072265625, -2.5958251953125, -2.50115966796875, -2.406494140625, -2.31182861328125, -2.2171630859375, -2.12249755859375, -2.02783203125, -1.93316650390625, -1.8385009765625, -1.74383544921875, -1.649169921875, -1.55450439453125, -1.4598388671875, -1.36517333984375, -1.2705078125, -1.17584228515625, -1.0811767578125, -0.98651123046875, -0.891845703125, -0.79718017578125, -0.7025146484375, -0.60784912109375, -0.51318359375, -0.41851806640625, -0.3238525390625, -0.22918701171875, -0.134521484375, -0.03985595703125, 0.0548095703125, 0.14947509765625, 0.244140625, 0.33880615234375, 0.4334716796875, 0.52813720703125, 0.622802734375, 0.71746826171875, 0.8121337890625, 0.90679931640625, 1.00146484375, 1.09613037109375, 1.1907958984375, 1.28546142578125, 1.380126953125, 1.47479248046875, 1.5694580078125, 1.66412353515625, 1.7587890625, 1.85345458984375, 1.9481201171875, 2.04278564453125, 2.137451171875, 2.23211669921875, 2.3267822265625, 2.42144775390625, 2.51611328125, 2.61077880859375, 2.7054443359375, 2.80010986328125, 2.894775390625, 2.98944091796875, 3.0841064453125, 3.17877197265625, 3.2734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 9.0, 18.0, 11.0, 29.0, 51.0, 93.0, 173.0, 356.0, 1036.0, 3624.0, 17096.0, 136892.0, 792410.0, 80543.0, 12094.0, 2697.0, 789.0, 304.0, 132.0, 74.0, 43.0, 28.0, 10.0, 11.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7373046875, -0.71221923828125, -0.6871337890625, -0.66204833984375, -0.636962890625, -0.61187744140625, -0.5867919921875, -0.56170654296875, -0.53662109375, -0.51153564453125, -0.4864501953125, -0.46136474609375, -0.436279296875, -0.41119384765625, -0.3861083984375, -0.36102294921875, -0.3359375, -0.31085205078125, -0.2857666015625, -0.26068115234375, -0.235595703125, -0.21051025390625, -0.1854248046875, -0.16033935546875, -0.13525390625, -0.11016845703125, -0.0850830078125, -0.05999755859375, -0.034912109375, -0.00982666015625, 0.0152587890625, 0.04034423828125, 0.0654296875, 0.09051513671875, 0.1156005859375, 0.14068603515625, 0.165771484375, 0.19085693359375, 0.2159423828125, 0.24102783203125, 0.26611328125, 0.29119873046875, 0.3162841796875, 0.34136962890625, 0.366455078125, 0.39154052734375, 0.4166259765625, 0.44171142578125, 0.466796875, 0.49188232421875, 0.5169677734375, 0.54205322265625, 0.567138671875, 0.59222412109375, 0.6173095703125, 0.64239501953125, 0.66748046875, 0.69256591796875, 0.7176513671875, 0.74273681640625, 0.767822265625, 0.79290771484375, 0.8179931640625, 0.84307861328125, 0.8681640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 8.0, 9.0, 6.0, 8.0, 22.0, 28.0, 51.0, 59.0, 78.0, 119.0, 159.0, 119.0, 88.0, 84.0, 53.0, 27.0, 20.0, 17.0, 7.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016307830810546875, -0.00015774555504322052, -0.0001524128019809723, -0.00014708004891872406, -0.00014174729585647583, -0.0001364145427942276, -0.00013108178973197937, -0.00012574903666973114, -0.00012041628360748291, -0.00011508353054523468, -0.00010975077748298645, -0.00010441802442073822, -9.908527135848999e-05, -9.375251829624176e-05, -8.841976523399353e-05, -8.30870121717453e-05, -7.775425910949707e-05, -7.242150604724884e-05, -6.708875298500061e-05, -6.175599992275238e-05, -5.642324686050415e-05, -5.109049379825592e-05, -4.575774073600769e-05, -4.042498767375946e-05, -3.509223461151123e-05, -2.9759481549263e-05, -2.442672848701477e-05, -1.909397542476654e-05, -1.376122236251831e-05, -8.42846930027008e-06, -3.0957162380218506e-06, 2.2370368242263794e-06, 7.569789886474609e-06, 1.290254294872284e-05, 1.823529601097107e-05, 2.35680490732193e-05, 2.890080213546753e-05, 3.423355519771576e-05, 3.956630825996399e-05, 4.489906132221222e-05, 5.023181438446045e-05, 5.556456744670868e-05, 6.089732050895691e-05, 6.623007357120514e-05, 7.156282663345337e-05, 7.68955796957016e-05, 8.222833275794983e-05, 8.756108582019806e-05, 9.289383888244629e-05, 9.822659194469452e-05, 0.00010355934500694275, 0.00010889209806919098, 0.00011422485113143921, 0.00011955760419368744, 0.00012489035725593567, 0.0001302231103181839, 0.00013555586338043213, 0.00014088861644268036, 0.0001462213695049286, 0.00015155412256717682, 0.00015688687562942505, 0.00016221962869167328, 0.0001675523817539215, 0.00017288513481616974, 0.00017821788787841797]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 9.0, 11.0, 19.0, 19.0, 20.0, 52.0, 56.0, 69.0, 114.0, 150.0, 274.0, 429.0, 678.0, 1151.0, 2015.0, 3786.0, 7778.0, 17623.0, 46377.0, 158229.0, 564350.0, 162480.0, 48003.0, 17797.0, 7864.0, 4012.0, 2078.0, 1153.0, 674.0, 410.0, 273.0, 173.0, 117.0, 75.0, 60.0, 40.0, 34.0, 15.0, 11.0, 13.0, 11.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.4306640625, -0.4178123474121094, -0.40496063232421875, -0.3921089172363281, -0.3792572021484375, -0.3664054870605469, -0.35355377197265625, -0.3407020568847656, -0.327850341796875, -0.3149986267089844, -0.30214691162109375, -0.2892951965332031, -0.2764434814453125, -0.2635917663574219, -0.25074005126953125, -0.23788833618164062, -0.22503662109375, -0.21218490600585938, -0.19933319091796875, -0.18648147583007812, -0.1736297607421875, -0.16077804565429688, -0.14792633056640625, -0.13507461547851562, -0.122222900390625, -0.10937118530273438, -0.09651947021484375, -0.08366775512695312, -0.0708160400390625, -0.057964324951171875, -0.04511260986328125, -0.032260894775390625, -0.0194091796875, -0.006557464599609375, 0.00629425048828125, 0.019145965576171875, 0.0319976806640625, 0.044849395751953125, 0.05770111083984375, 0.07055282592773438, 0.083404541015625, 0.09625625610351562, 0.10910797119140625, 0.12195968627929688, 0.1348114013671875, 0.14766311645507812, 0.16051483154296875, 0.17336654663085938, 0.18621826171875, 0.19906997680664062, 0.21192169189453125, 0.22477340698242188, 0.2376251220703125, 0.2504768371582031, 0.26332855224609375, 0.2761802673339844, 0.289031982421875, 0.3018836975097656, 0.31473541259765625, 0.3275871276855469, 0.3404388427734375, 0.3532905578613281, 0.36614227294921875, 0.3789939880371094, 0.391845703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 3.0, 9.0, 2.0, 9.0, 17.0, 18.0, 31.0, 30.0, 47.0, 47.0, 72.0, 76.0, 111.0, 111.0, 94.0, 75.0, 53.0, 47.0, 33.0, 22.0, 24.0, 12.0, 10.0, 6.0, 6.0, 5.0, 12.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.595703125, -0.577117919921875, -0.55853271484375, -0.539947509765625, -0.5213623046875, -0.502777099609375, -0.48419189453125, -0.465606689453125, -0.447021484375, -0.428436279296875, -0.40985107421875, -0.391265869140625, -0.3726806640625, -0.354095458984375, -0.33551025390625, -0.316925048828125, -0.29833984375, -0.279754638671875, -0.26116943359375, -0.242584228515625, -0.2239990234375, -0.205413818359375, -0.18682861328125, -0.168243408203125, -0.149658203125, -0.131072998046875, -0.11248779296875, -0.093902587890625, -0.0753173828125, -0.056732177734375, -0.03814697265625, -0.019561767578125, -0.0009765625, 0.017608642578125, 0.03619384765625, 0.054779052734375, 0.0733642578125, 0.091949462890625, 0.11053466796875, 0.129119873046875, 0.147705078125, 0.166290283203125, 0.18487548828125, 0.203460693359375, 0.2220458984375, 0.240631103515625, 0.25921630859375, 0.277801513671875, 0.29638671875, 0.314971923828125, 0.33355712890625, 0.352142333984375, 0.3707275390625, 0.389312744140625, 0.40789794921875, 0.426483154296875, 0.445068359375, 0.463653564453125, 0.48223876953125, 0.500823974609375, 0.5194091796875, 0.537994384765625, 0.55657958984375, 0.575164794921875, 0.59375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 8.0, 29.0, 115.0, 293.0, 337.0, 118.0, 43.0, 23.0, 14.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.319219589233398, -11.551124572753906, -10.78303050994873, -10.014935493469238, -9.246841430664062, -8.47874641418457, -7.710651397705078, -6.942556858062744, -6.17446231842041, -5.406367778778076, -4.638273239135742, -3.87017822265625, -3.102083683013916, -2.333989143371582, -1.5658941268920898, -0.7977995872497559, -0.029705047607421875, 0.7383896112442017, 1.5064842700958252, 2.2745790481567383, 3.0426735877990723, 3.8107681274414062, 4.578863143920898, 5.346957683563232, 6.115052223205566, 6.8831467628479, 7.651241302490234, 8.419336318969727, 9.187431335449219, 9.955525398254395, 10.723620414733887, 11.491714477539062, 12.259807586669922, 13.027902603149414, 13.79599666595459, 14.564091682434082, 15.332185745239258, 16.10028076171875, 16.868375778198242, 17.636470794677734, 18.404563903808594, 19.172658920288086, 19.940753936767578, 20.708847045898438, 21.47694206237793, 22.245037078857422, 23.013132095336914, 23.781227111816406, 24.5493221282959, 25.31741714477539, 26.085512161254883, 26.853607177734375, 27.621700286865234, 28.389795303344727, 29.15789031982422, 29.92598533630371, 30.694080352783203, 31.462175369262695, 32.23027038574219, 32.99836349487305, 33.76646041870117, 34.53455352783203, 35.302650451660156, 36.070743560791016, 36.838836669921875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 13.0, 13.0, 6.0, 19.0, 13.0, 22.0, 34.0, 31.0, 42.0, 41.0, 56.0, 61.0, 68.0, 99.0, 79.0, 70.0, 57.0, 57.0, 41.0, 42.0, 30.0, 27.0, 18.0, 8.0, 6.0, 15.0, 7.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.066192626953125, -16.628786087036133, -16.191381454467773, -15.753975868225098, -15.316570281982422, -14.879164695739746, -14.44175910949707, -14.004353523254395, -13.566947937011719, -13.129542350769043, -12.692136764526367, -12.254731178283691, -11.817325592041016, -11.37992000579834, -10.942514419555664, -10.505108833312988, -10.067703247070312, -9.630297660827637, -9.192892074584961, -8.755486488342285, -8.31808090209961, -7.880675315856934, -7.443269729614258, -7.005864143371582, -6.56845760345459, -6.131052017211914, -5.693646430969238, -5.2562408447265625, -4.818835258483887, -4.381429672241211, -3.944023847579956, -3.5066182613372803, -3.0692129135131836, -2.631807327270508, -2.194401741027832, -1.7569960355758667, -1.319590449333191, -0.8821847438812256, -0.4447791576385498, -0.0073735713958740234, 0.43003201484680176, 0.8674376010894775, 1.3048431873321533, 1.7422488927841187, 2.179654598236084, 2.6170601844787598, 3.0544657707214355, 3.4918713569641113, 3.929276943206787, 4.366682529449463, 4.804088115692139, 5.2414937019348145, 5.67889928817749, 6.116305351257324, 6.5537109375, 6.991116523742676, 7.428522109985352, 7.865927696228027, 8.303333282470703, 8.740738868713379, 9.178144454956055, 9.61555004119873, 10.052955627441406, 10.490361213684082, 10.927766799926758]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 12.0, 11.0, 25.0, 46.0, 79.0, 161.0, 337.0, 855.0, 3549.0, 36654.0, 3858982.0, 284043.0, 6937.0, 1577.0, 517.0, 244.0, 125.0, 63.0, 28.0, 12.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.890625, -1.78955078125, -1.6884765625, -1.58740234375, -1.486328125, -1.38525390625, -1.2841796875, -1.18310546875, -1.08203125, -0.98095703125, -0.8798828125, -0.77880859375, -0.677734375, -0.57666015625, -0.4755859375, -0.37451171875, -0.2734375, -0.17236328125, -0.0712890625, 0.02978515625, 0.130859375, 0.23193359375, 0.3330078125, 0.43408203125, 0.53515625, 0.63623046875, 0.7373046875, 0.83837890625, 0.939453125, 1.04052734375, 1.1416015625, 1.24267578125, 1.34375, 1.44482421875, 1.5458984375, 1.64697265625, 1.748046875, 1.84912109375, 1.9501953125, 2.05126953125, 2.15234375, 2.25341796875, 2.3544921875, 2.45556640625, 2.556640625, 2.65771484375, 2.7587890625, 2.85986328125, 2.9609375, 3.06201171875, 3.1630859375, 3.26416015625, 3.365234375, 3.46630859375, 3.5673828125, 3.66845703125, 3.76953125, 3.87060546875, 3.9716796875, 4.07275390625, 4.173828125, 4.27490234375, 4.3759765625, 4.47705078125, 4.578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 10.0, 9.0, 19.0, 13.0, 21.0, 40.0, 50.0, 61.0, 56.0, 78.0, 74.0, 77.0, 84.0, 67.0, 62.0, 61.0, 47.0, 37.0, 39.0, 19.0, 17.0, 18.0, 16.0, 4.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.0920867919921875, -1.055267333984375, -1.0184478759765625, -0.98162841796875, -0.9448089599609375, -0.907989501953125, -0.8711700439453125, -0.8343505859375, -0.7975311279296875, -0.760711669921875, -0.7238922119140625, -0.68707275390625, -0.6502532958984375, -0.613433837890625, -0.5766143798828125, -0.539794921875, -0.5029754638671875, -0.466156005859375, -0.4293365478515625, -0.39251708984375, -0.3556976318359375, -0.318878173828125, -0.2820587158203125, -0.2452392578125, -0.2084197998046875, -0.171600341796875, -0.1347808837890625, -0.09796142578125, -0.0611419677734375, -0.024322509765625, 0.0124969482421875, 0.04931640625, 0.0861358642578125, 0.122955322265625, 0.1597747802734375, 0.19659423828125, 0.2334136962890625, 0.270233154296875, 0.3070526123046875, 0.3438720703125, 0.3806915283203125, 0.417510986328125, 0.4543304443359375, 0.49114990234375, 0.5279693603515625, 0.564788818359375, 0.6016082763671875, 0.638427734375, 0.6752471923828125, 0.712066650390625, 0.7488861083984375, 0.78570556640625, 0.8225250244140625, 0.859344482421875, 0.8961639404296875, 0.9329833984375, 0.9698028564453125, 1.006622314453125, 1.0434417724609375, 1.08026123046875, 1.1170806884765625, 1.153900146484375, 1.1907196044921875, 1.2275390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 5.0, 11.0, 15.0, 35.0, 51.0, 113.0, 244.0, 644.0, 2428.0, 17811.0, 937270.0, 3192266.0, 37966.0, 3838.0, 952.0, 349.0, 132.0, 70.0, 30.0, 17.0, 8.0, 12.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.146484375, -3.06396484375, -2.9814453125, -2.89892578125, -2.81640625, -2.73388671875, -2.6513671875, -2.56884765625, -2.486328125, -2.40380859375, -2.3212890625, -2.23876953125, -2.15625, -2.07373046875, -1.9912109375, -1.90869140625, -1.826171875, -1.74365234375, -1.6611328125, -1.57861328125, -1.49609375, -1.41357421875, -1.3310546875, -1.24853515625, -1.166015625, -1.08349609375, -1.0009765625, -0.91845703125, -0.8359375, -0.75341796875, -0.6708984375, -0.58837890625, -0.505859375, -0.42333984375, -0.3408203125, -0.25830078125, -0.17578125, -0.09326171875, -0.0107421875, 0.07177734375, 0.154296875, 0.23681640625, 0.3193359375, 0.40185546875, 0.484375, 0.56689453125, 0.6494140625, 0.73193359375, 0.814453125, 0.89697265625, 0.9794921875, 1.06201171875, 1.14453125, 1.22705078125, 1.3095703125, 1.39208984375, 1.474609375, 1.55712890625, 1.6396484375, 1.72216796875, 1.8046875, 1.88720703125, 1.9697265625, 2.05224609375, 2.134765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 13.0, 19.0, 44.0, 50.0, 116.0, 193.0, 414.0, 870.0, 1054.0, 646.0, 317.0, 148.0, 75.0, 38.0, 23.0, 24.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4892578125, -1.4222869873046875, -1.355316162109375, -1.2883453369140625, -1.22137451171875, -1.1544036865234375, -1.087432861328125, -1.0204620361328125, -0.9534912109375, -0.8865203857421875, -0.819549560546875, -0.7525787353515625, -0.68560791015625, -0.6186370849609375, -0.551666259765625, -0.4846954345703125, -0.417724609375, -0.3507537841796875, -0.283782958984375, -0.2168121337890625, -0.14984130859375, -0.0828704833984375, -0.015899658203125, 0.0510711669921875, 0.1180419921875, 0.1850128173828125, 0.251983642578125, 0.3189544677734375, 0.38592529296875, 0.4528961181640625, 0.519866943359375, 0.5868377685546875, 0.65380859375, 0.7207794189453125, 0.787750244140625, 0.8547210693359375, 0.92169189453125, 0.9886627197265625, 1.055633544921875, 1.1226043701171875, 1.1895751953125, 1.2565460205078125, 1.323516845703125, 1.3904876708984375, 1.45745849609375, 1.5244293212890625, 1.591400146484375, 1.6583709716796875, 1.725341796875, 1.7923126220703125, 1.859283447265625, 1.9262542724609375, 1.99322509765625, 2.0601959228515625, 2.127166748046875, 2.1941375732421875, 2.2611083984375, 2.3280792236328125, 2.395050048828125, 2.4620208740234375, 2.52899169921875, 2.5959625244140625, 2.662933349609375, 2.7299041748046875, 2.796875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 29.0, 74.0, 145.0, 242.0, 229.0, 136.0, 70.0, 34.0, 22.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.026470184326172, -10.496062278747559, -9.965654373168945, -9.435246467590332, -8.904838562011719, -8.374430656433105, -7.844022750854492, -7.313614845275879, -6.783206939697266, -6.252799034118652, -5.722391128540039, -5.191983222961426, -4.6615753173828125, -4.131167411804199, -3.600759506225586, -3.0703516006469727, -2.5399436950683594, -2.009535789489746, -1.4791278839111328, -0.9487199783325195, -0.41831207275390625, 0.11209583282470703, 0.6425037384033203, 1.1729116439819336, 1.7033195495605469, 2.23372745513916, 2.7641353607177734, 3.2945432662963867, 3.824951171875, 4.355359077453613, 4.885766983032227, 5.41617488861084, 5.94658088684082, 6.476988792419434, 7.007396697998047, 7.53780460357666, 8.068212509155273, 8.598620414733887, 9.1290283203125, 9.659436225891113, 10.189844131469727, 10.72025203704834, 11.250659942626953, 11.781067848205566, 12.31147575378418, 12.841883659362793, 13.372291564941406, 13.90269947052002, 14.433107376098633, 14.963515281677246, 15.49392318725586, 16.024330139160156, 16.554738998413086, 17.085147857666016, 17.615554809570312, 18.14596176147461, 18.67637062072754, 19.20677947998047, 19.737186431884766, 20.267593383789062, 20.798002243041992, 21.328411102294922, 21.85881805419922, 22.389225006103516, 22.919633865356445]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 4.0, 5.0, 8.0, 11.0, 10.0, 16.0, 14.0, 20.0, 25.0, 24.0, 24.0, 37.0, 43.0, 39.0, 36.0, 54.0, 57.0, 52.0, 44.0, 56.0, 44.0, 50.0, 41.0, 36.0, 33.0, 36.0, 27.0, 34.0, 21.0, 21.0, 16.0, 12.0, 13.0, 6.0, 6.0, 5.0, 8.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.696881294250488, -5.497603893280029, -5.298326015472412, -5.099048614501953, -4.899770736694336, -4.700493335723877, -4.501215934753418, -4.301938056945801, -4.102660179138184, -3.9033825397491455, -3.7041049003601074, -3.5048274993896484, -3.3055496215820312, -3.1062722206115723, -2.906994581222534, -2.707716941833496, -2.508439540863037, -2.309161901473999, -2.109884262084961, -1.9106067419052124, -1.7113291025161743, -1.5120514631271362, -1.3127739429473877, -1.1134963035583496, -0.9142186641693115, -0.7149410247802734, -0.5156634449958801, -0.3163858652114868, -0.11710822582244873, 0.08216941356658936, 0.2814469337463379, 0.480724573135376, 0.6800022125244141, 0.8792798519134521, 1.0785574913024902, 1.2778350114822388, 1.4771126508712769, 1.676390290260315, 1.8756678104400635, 2.0749454498291016, 2.2742230892181396, 2.4735007286071777, 2.672778367996216, 2.872056007385254, 3.071333408355713, 3.27061128616333, 3.469888687133789, 3.669166326522827, 3.8684439659118652, 4.067721366882324, 4.266999244689941, 4.4662766456604, 4.665554523468018, 4.864831924438477, 5.064109802246094, 5.263387203216553, 5.462664604187012, 5.661942005157471, 5.861219882965088, 6.060497283935547, 6.259775161743164, 6.459052562713623, 6.658329963684082, 6.857607841491699, 7.056885719299316]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 10.0, 5.0, 5.0, 19.0, 13.0, 18.0, 42.0, 56.0, 90.0, 166.0, 271.0, 528.0, 1182.0, 3361.0, 14526.0, 110340.0, 703415.0, 186020.0, 21097.0, 4440.0, 1462.0, 665.0, 316.0, 167.0, 123.0, 63.0, 49.0, 32.0, 12.0, 18.0, 17.0, 10.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6455078125, -1.5812530517578125, -1.516998291015625, -1.4527435302734375, -1.38848876953125, -1.3242340087890625, -1.259979248046875, -1.1957244873046875, -1.1314697265625, -1.0672149658203125, -1.002960205078125, -0.9387054443359375, -0.87445068359375, -0.8101959228515625, -0.745941162109375, -0.6816864013671875, -0.617431640625, -0.5531768798828125, -0.488922119140625, -0.4246673583984375, -0.36041259765625, -0.2961578369140625, -0.231903076171875, -0.1676483154296875, -0.1033935546875, -0.0391387939453125, 0.025115966796875, 0.0893707275390625, 0.15362548828125, 0.2178802490234375, 0.282135009765625, 0.3463897705078125, 0.41064453125, 0.4748992919921875, 0.539154052734375, 0.6034088134765625, 0.66766357421875, 0.7319183349609375, 0.796173095703125, 0.8604278564453125, 0.9246826171875, 0.9889373779296875, 1.053192138671875, 1.1174468994140625, 1.18170166015625, 1.2459564208984375, 1.310211181640625, 1.3744659423828125, 1.438720703125, 1.5029754638671875, 1.567230224609375, 1.6314849853515625, 1.69573974609375, 1.7599945068359375, 1.824249267578125, 1.8885040283203125, 1.9527587890625, 2.0170135498046875, 2.081268310546875, 2.1455230712890625, 2.20977783203125, 2.2740325927734375, 2.338287353515625, 2.4025421142578125, 2.466796875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 10.0, 11.0, 11.0, 16.0, 22.0, 32.0, 35.0, 45.0, 41.0, 53.0, 69.0, 69.0, 65.0, 62.0, 61.0, 76.0, 68.0, 37.0, 42.0, 39.0, 30.0, 31.0, 22.0, 17.0, 11.0, 7.0, 9.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8498611450195312, -0.8164215087890625, -0.7829818725585938, -0.749542236328125, -0.7161026000976562, -0.6826629638671875, -0.6492233276367188, -0.61578369140625, -0.5823440551757812, -0.5489044189453125, -0.5154647827148438, -0.482025146484375, -0.44858551025390625, -0.4151458740234375, -0.38170623779296875, -0.3482666015625, -0.31482696533203125, -0.2813873291015625, -0.24794769287109375, -0.214508056640625, -0.18106842041015625, -0.1476287841796875, -0.11418914794921875, -0.08074951171875, -0.04730987548828125, -0.0138702392578125, 0.01956939697265625, 0.053009033203125, 0.08644866943359375, 0.1198883056640625, 0.15332794189453125, 0.186767578125, 0.22020721435546875, 0.2536468505859375, 0.28708648681640625, 0.320526123046875, 0.35396575927734375, 0.3874053955078125, 0.42084503173828125, 0.45428466796875, 0.48772430419921875, 0.5211639404296875, 0.5546035766601562, 0.588043212890625, 0.6214828491210938, 0.6549224853515625, 0.6883621215820312, 0.7218017578125, 0.7552413940429688, 0.7886810302734375, 0.8221206665039062, 0.855560302734375, 0.8889999389648438, 0.9224395751953125, 0.9558792114257812, 0.98931884765625, 1.0227584838867188, 1.0561981201171875, 1.0896377563476562, 1.123077392578125, 1.1565170288085938, 1.1899566650390625, 1.2233963012695312, 1.2568359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 9.0, 23.0, 27.0, 61.0, 108.0, 247.0, 656.0, 1972.0, 11291.0, 219478.0, 786135.0, 23819.0, 3179.0, 839.0, 316.0, 155.0, 86.0, 52.0, 27.0, 25.0, 10.0, 9.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.525146484375, -3.41552734375, -3.305908203125, -3.1962890625, -3.086669921875, -2.97705078125, -2.867431640625, -2.7578125, -2.648193359375, -2.53857421875, -2.428955078125, -2.3193359375, -2.209716796875, -2.10009765625, -1.990478515625, -1.880859375, -1.771240234375, -1.66162109375, -1.552001953125, -1.4423828125, -1.332763671875, -1.22314453125, -1.113525390625, -1.00390625, -0.894287109375, -0.78466796875, -0.675048828125, -0.5654296875, -0.455810546875, -0.34619140625, -0.236572265625, -0.126953125, -0.017333984375, 0.09228515625, 0.201904296875, 0.3115234375, 0.421142578125, 0.53076171875, 0.640380859375, 0.75, 0.859619140625, 0.96923828125, 1.078857421875, 1.1884765625, 1.298095703125, 1.40771484375, 1.517333984375, 1.626953125, 1.736572265625, 1.84619140625, 1.955810546875, 2.0654296875, 2.175048828125, 2.28466796875, 2.394287109375, 2.50390625, 2.613525390625, 2.72314453125, 2.832763671875, 2.9423828125, 3.052001953125, 3.16162109375, 3.271240234375, 3.380859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 8.0, 8.0, 7.0, 5.0, 15.0, 10.0, 22.0, 15.0, 20.0, 29.0, 35.0, 39.0, 38.0, 48.0, 51.0, 71.0, 56.0, 65.0, 63.0, 51.0, 53.0, 42.0, 43.0, 39.0, 24.0, 23.0, 29.0, 20.0, 16.0, 12.0, 10.0, 10.0, 12.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.271484375, -3.17083740234375, -3.0701904296875, -2.96954345703125, -2.868896484375, -2.76824951171875, -2.6676025390625, -2.56695556640625, -2.46630859375, -2.36566162109375, -2.2650146484375, -2.16436767578125, -2.063720703125, -1.96307373046875, -1.8624267578125, -1.76177978515625, -1.6611328125, -1.56048583984375, -1.4598388671875, -1.35919189453125, -1.258544921875, -1.15789794921875, -1.0572509765625, -0.95660400390625, -0.85595703125, -0.75531005859375, -0.6546630859375, -0.55401611328125, -0.453369140625, -0.35272216796875, -0.2520751953125, -0.15142822265625, -0.05078125, 0.04986572265625, 0.1505126953125, 0.25115966796875, 0.351806640625, 0.45245361328125, 0.5531005859375, 0.65374755859375, 0.75439453125, 0.85504150390625, 0.9556884765625, 1.05633544921875, 1.156982421875, 1.25762939453125, 1.3582763671875, 1.45892333984375, 1.5595703125, 1.66021728515625, 1.7608642578125, 1.86151123046875, 1.962158203125, 2.06280517578125, 2.1634521484375, 2.26409912109375, 2.36474609375, 2.46539306640625, 2.5660400390625, 2.66668701171875, 2.767333984375, 2.86798095703125, 2.9686279296875, 3.06927490234375, 3.169921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 8.0, 13.0, 13.0, 22.0, 22.0, 35.0, 77.0, 75.0, 124.0, 246.0, 409.0, 745.0, 1575.0, 3498.0, 8317.0, 24782.0, 115975.0, 756450.0, 99562.0, 22373.0, 7619.0, 3250.0, 1522.0, 720.0, 415.0, 209.0, 147.0, 99.0, 66.0, 42.0, 36.0, 24.0, 18.0, 16.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5096359252929688, -0.4929046630859375, -0.47617340087890625, -0.459442138671875, -0.44271087646484375, -0.4259796142578125, -0.40924835205078125, -0.39251708984375, -0.37578582763671875, -0.3590545654296875, -0.34232330322265625, -0.325592041015625, -0.30886077880859375, -0.2921295166015625, -0.27539825439453125, -0.2586669921875, -0.24193572998046875, -0.2252044677734375, -0.20847320556640625, -0.191741943359375, -0.17501068115234375, -0.1582794189453125, -0.14154815673828125, -0.12481689453125, -0.10808563232421875, -0.0913543701171875, -0.07462310791015625, -0.057891845703125, -0.04116058349609375, -0.0244293212890625, -0.00769805908203125, 0.009033203125, 0.02576446533203125, 0.0424957275390625, 0.05922698974609375, 0.075958251953125, 0.09268951416015625, 0.1094207763671875, 0.12615203857421875, 0.14288330078125, 0.15961456298828125, 0.1763458251953125, 0.19307708740234375, 0.209808349609375, 0.22653961181640625, 0.2432708740234375, 0.26000213623046875, 0.2767333984375, 0.29346466064453125, 0.3101959228515625, 0.32692718505859375, 0.343658447265625, 0.36038970947265625, 0.3771209716796875, 0.39385223388671875, 0.41058349609375, 0.42731475830078125, 0.4440460205078125, 0.46077728271484375, 0.477508544921875, 0.49423980712890625, 0.5109710693359375, 0.5277023315429688, 0.54443359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 13.0, 8.0, 22.0, 41.0, 67.0, 105.0, 191.0, 199.0, 111.0, 76.0, 39.0, 21.0, 22.0, 15.0, 10.0, 8.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002390146255493164, -0.00023271329700946808, -0.00022641196846961975, -0.00022011063992977142, -0.0002138093113899231, -0.00020750798285007477, -0.00020120665431022644, -0.0001949053257703781, -0.00018860399723052979, -0.00018230266869068146, -0.00017600134015083313, -0.0001697000116109848, -0.00016339868307113647, -0.00015709735453128815, -0.00015079602599143982, -0.0001444946974515915, -0.00013819336891174316, -0.00013189204037189484, -0.0001255907118320465, -0.00011928938329219818, -0.00011298805475234985, -0.00010668672621250153, -0.0001003853976726532, -9.408406913280487e-05, -8.778274059295654e-05, -8.148141205310822e-05, -7.518008351325989e-05, -6.887875497341156e-05, -6.257742643356323e-05, -5.6276097893714905e-05, -4.997476935386658e-05, -4.367344081401825e-05, -3.737211227416992e-05, -3.1070783734321594e-05, -2.4769455194473267e-05, -1.846812665462494e-05, -1.2166798114776611e-05, -5.865469574928284e-06, 4.3585896492004395e-07, 6.737187504768372e-06, 1.30385160446167e-05, 1.9339844584465027e-05, 2.5641173124313354e-05, 3.194250166416168e-05, 3.824383020401001e-05, 4.454515874385834e-05, 5.0846487283706665e-05, 5.714781582355499e-05, 6.344914436340332e-05, 6.975047290325165e-05, 7.605180144309998e-05, 8.23531299829483e-05, 8.865445852279663e-05, 9.495578706264496e-05, 0.00010125711560249329, 0.00010755844414234161, 0.00011385977268218994, 0.00012016110122203827, 0.0001264624297618866, 0.00013276375830173492, 0.00013906508684158325, 0.00014536641538143158, 0.0001516677439212799, 0.00015796907246112823, 0.00016427040100097656]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 12.0, 15.0, 21.0, 32.0, 46.0, 61.0, 122.0, 204.0, 314.0, 575.0, 1228.0, 2543.0, 6277.0, 18370.0, 80056.0, 753360.0, 144210.0, 26549.0, 8269.0, 3242.0, 1441.0, 651.0, 363.0, 203.0, 137.0, 74.0, 65.0, 34.0, 23.0, 14.0, 9.0, 9.0, 12.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.763671875, -0.7439117431640625, -0.724151611328125, -0.7043914794921875, -0.68463134765625, -0.6648712158203125, -0.645111083984375, -0.6253509521484375, -0.6055908203125, -0.5858306884765625, -0.566070556640625, -0.5463104248046875, -0.52655029296875, -0.5067901611328125, -0.487030029296875, -0.4672698974609375, -0.447509765625, -0.4277496337890625, -0.407989501953125, -0.3882293701171875, -0.36846923828125, -0.3487091064453125, -0.328948974609375, -0.3091888427734375, -0.2894287109375, -0.2696685791015625, -0.249908447265625, -0.2301483154296875, -0.21038818359375, -0.1906280517578125, -0.170867919921875, -0.1511077880859375, -0.13134765625, -0.1115875244140625, -0.091827392578125, -0.0720672607421875, -0.05230712890625, -0.0325469970703125, -0.012786865234375, 0.0069732666015625, 0.0267333984375, 0.0464935302734375, 0.066253662109375, 0.0860137939453125, 0.10577392578125, 0.1255340576171875, 0.145294189453125, 0.1650543212890625, 0.184814453125, 0.2045745849609375, 0.224334716796875, 0.2440948486328125, 0.26385498046875, 0.2836151123046875, 0.303375244140625, 0.3231353759765625, 0.3428955078125, 0.3626556396484375, 0.382415771484375, 0.4021759033203125, 0.42193603515625, 0.4416961669921875, 0.461456298828125, 0.4812164306640625, 0.5009765625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 2.0, 10.0, 19.0, 13.0, 20.0, 53.0, 74.0, 102.0, 180.0, 176.0, 125.0, 68.0, 50.0, 42.0, 14.0, 10.0, 6.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93017578125, -0.903717041015625, -0.87725830078125, -0.850799560546875, -0.8243408203125, -0.797882080078125, -0.77142333984375, -0.744964599609375, -0.718505859375, -0.692047119140625, -0.66558837890625, -0.639129638671875, -0.6126708984375, -0.586212158203125, -0.55975341796875, -0.533294677734375, -0.5068359375, -0.480377197265625, -0.45391845703125, -0.427459716796875, -0.4010009765625, -0.374542236328125, -0.34808349609375, -0.321624755859375, -0.295166015625, -0.268707275390625, -0.24224853515625, -0.215789794921875, -0.1893310546875, -0.162872314453125, -0.13641357421875, -0.109954833984375, -0.08349609375, -0.057037353515625, -0.03057861328125, -0.004119873046875, 0.0223388671875, 0.048797607421875, 0.07525634765625, 0.101715087890625, 0.128173828125, 0.154632568359375, 0.18109130859375, 0.207550048828125, 0.2340087890625, 0.260467529296875, 0.28692626953125, 0.313385009765625, 0.33984375, 0.366302490234375, 0.39276123046875, 0.419219970703125, 0.4456787109375, 0.472137451171875, 0.49859619140625, 0.525054931640625, 0.551513671875, 0.577972412109375, 0.60443115234375, 0.630889892578125, 0.6573486328125, 0.683807373046875, 0.71026611328125, 0.736724853515625, 0.76318359375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 15.0, 56.0, 189.0, 477.0, 169.0, 46.0, 23.0, 8.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.352218627929688, -18.487207412719727, -17.622196197509766, -16.757184982299805, -15.892172813415527, -15.027161598205566, -14.162150382995605, -13.297138214111328, -12.432126998901367, -11.567115783691406, -10.702104568481445, -9.837093353271484, -8.972081184387207, -8.107069969177246, -7.242058753967285, -6.377047061920166, -5.512036323547363, -4.647025108337402, -3.782013416290283, -2.9170022010803223, -2.0519907474517822, -1.1869792938232422, -0.32196807861328125, 0.5430436134338379, 1.4080548286437988, 2.273066282272339, 3.138077735900879, 4.00308895111084, 4.868100166320801, 5.73311185836792, 6.598123073577881, 7.463134765625, 8.328145980834961, 9.193157196044922, 10.058168411254883, 10.923179626464844, 11.788191795349121, 12.653203010559082, 13.518214225769043, 14.38322639465332, 15.248237609863281, 16.113248825073242, 16.978260040283203, 17.843271255493164, 18.708282470703125, 19.57329559326172, 20.438304901123047, 21.30331802368164, 22.16832733154297, 23.03333854675293, 23.89834976196289, 24.76336097717285, 25.628372192382812, 26.493385314941406, 27.358394622802734, 28.223407745361328, 29.08841896057129, 29.95343017578125, 30.81844139099121, 31.683452606201172, 32.548465728759766, 33.413475036621094, 34.27848815917969, 35.143497467041016, 36.00851058959961]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 9.0, 13.0, 8.0, 20.0, 21.0, 22.0, 22.0, 23.0, 21.0, 33.0, 34.0, 49.0, 53.0, 70.0, 91.0, 81.0, 78.0, 54.0, 33.0, 35.0, 37.0, 30.0, 26.0, 14.0, 10.0, 15.0, 16.0, 13.0, 9.0, 11.0, 9.0, 7.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.518571853637695, -10.177492141723633, -9.83641242980957, -9.495332717895508, -9.154252052307129, -8.813172340393066, -8.472092628479004, -8.131012916564941, -7.789932727813721, -7.448853015899658, -7.1077728271484375, -6.766693115234375, -6.4256134033203125, -6.084533214569092, -5.743453502655029, -5.402373313903809, -5.061293601989746, -4.720213890075684, -4.379133701324463, -4.0380539894104, -3.696974039077759, -3.355894088745117, -3.0148143768310547, -2.673734426498413, -2.3326544761657715, -1.9915745258331299, -1.6504946947097778, -1.3094148635864258, -0.9683349132537842, -0.6272549629211426, -0.2861752510070801, 0.05490469932556152, 0.3959836959838867, 0.7370635867118835, 1.0781434774398804, 1.4192233085632324, 1.760303258895874, 2.1013832092285156, 2.442462921142578, 2.7835428714752197, 3.1246228218078613, 3.465702772140503, 3.8067827224731445, 4.147862434387207, 4.4889421463012695, 4.83002233505249, 5.171102046966553, 5.512182235717773, 5.853261947631836, 6.194341659545898, 6.535421848297119, 6.876501560211182, 7.217581748962402, 7.558661460876465, 7.899741172790527, 8.24082088470459, 8.581901550292969, 8.922981262207031, 9.264060974121094, 9.605140686035156, 9.946221351623535, 10.287301063537598, 10.62838077545166, 10.969460487365723, 11.310540199279785]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 9.0, 17.0, 29.0, 41.0, 56.0, 89.0, 156.0, 287.0, 614.0, 1601.0, 5327.0, 41017.0, 2899999.0, 1215041.0, 23288.0, 4109.0, 1340.0, 618.0, 258.0, 144.0, 85.0, 51.0, 24.0, 30.0, 14.0, 14.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.93603515625, -2.8564453125, -2.77685546875, -2.697265625, -2.61767578125, -2.5380859375, -2.45849609375, -2.37890625, -2.29931640625, -2.2197265625, -2.14013671875, -2.060546875, -1.98095703125, -1.9013671875, -1.82177734375, -1.7421875, -1.66259765625, -1.5830078125, -1.50341796875, -1.423828125, -1.34423828125, -1.2646484375, -1.18505859375, -1.10546875, -1.02587890625, -0.9462890625, -0.86669921875, -0.787109375, -0.70751953125, -0.6279296875, -0.54833984375, -0.46875, -0.38916015625, -0.3095703125, -0.22998046875, -0.150390625, -0.07080078125, 0.0087890625, 0.08837890625, 0.16796875, 0.24755859375, 0.3271484375, 0.40673828125, 0.486328125, 0.56591796875, 0.6455078125, 0.72509765625, 0.8046875, 0.88427734375, 0.9638671875, 1.04345703125, 1.123046875, 1.20263671875, 1.2822265625, 1.36181640625, 1.44140625, 1.52099609375, 1.6005859375, 1.68017578125, 1.759765625, 1.83935546875, 1.9189453125, 1.99853515625, 2.078125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 1.0, 9.0, 10.0, 7.0, 15.0, 11.0, 18.0, 19.0, 25.0, 27.0, 35.0, 39.0, 35.0, 44.0, 56.0, 49.0, 48.0, 52.0, 43.0, 52.0, 41.0, 47.0, 46.0, 33.0, 41.0, 28.0, 27.0, 34.0, 14.0, 14.0, 20.0, 9.0, 14.0, 8.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8974609375, -0.872406005859375, -0.84735107421875, -0.822296142578125, -0.7972412109375, -0.772186279296875, -0.74713134765625, -0.722076416015625, -0.697021484375, -0.671966552734375, -0.64691162109375, -0.621856689453125, -0.5968017578125, -0.571746826171875, -0.54669189453125, -0.521636962890625, -0.49658203125, -0.471527099609375, -0.44647216796875, -0.421417236328125, -0.3963623046875, -0.371307373046875, -0.34625244140625, -0.321197509765625, -0.296142578125, -0.271087646484375, -0.24603271484375, -0.220977783203125, -0.1959228515625, -0.170867919921875, -0.14581298828125, -0.120758056640625, -0.095703125, -0.070648193359375, -0.04559326171875, -0.020538330078125, 0.0045166015625, 0.029571533203125, 0.05462646484375, 0.079681396484375, 0.104736328125, 0.129791259765625, 0.15484619140625, 0.179901123046875, 0.2049560546875, 0.230010986328125, 0.25506591796875, 0.280120849609375, 0.30517578125, 0.330230712890625, 0.35528564453125, 0.380340576171875, 0.4053955078125, 0.430450439453125, 0.45550537109375, 0.480560302734375, 0.505615234375, 0.530670166015625, 0.55572509765625, 0.580780029296875, 0.6058349609375, 0.630889892578125, 0.65594482421875, 0.680999755859375, 0.7060546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 8.0, 11.0, 21.0, 31.0, 55.0, 124.0, 342.0, 965.0, 4466.0, 53357.0, 3845303.0, 277972.0, 9207.0, 1593.0, 465.0, 167.0, 82.0, 35.0, 27.0, 13.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.103515625, -3.008575439453125, -2.91363525390625, -2.818695068359375, -2.7237548828125, -2.628814697265625, -2.53387451171875, -2.438934326171875, -2.343994140625, -2.249053955078125, -2.15411376953125, -2.059173583984375, -1.9642333984375, -1.869293212890625, -1.77435302734375, -1.679412841796875, -1.58447265625, -1.489532470703125, -1.39459228515625, -1.299652099609375, -1.2047119140625, -1.109771728515625, -1.01483154296875, -0.919891357421875, -0.824951171875, -0.730010986328125, -0.63507080078125, -0.540130615234375, -0.4451904296875, -0.350250244140625, -0.25531005859375, -0.160369873046875, -0.0654296875, 0.029510498046875, 0.12445068359375, 0.219390869140625, 0.3143310546875, 0.409271240234375, 0.50421142578125, 0.599151611328125, 0.694091796875, 0.789031982421875, 0.88397216796875, 0.978912353515625, 1.0738525390625, 1.168792724609375, 1.26373291015625, 1.358673095703125, 1.45361328125, 1.548553466796875, 1.64349365234375, 1.738433837890625, 1.8333740234375, 1.928314208984375, 2.02325439453125, 2.118194580078125, 2.213134765625, 2.308074951171875, 2.40301513671875, 2.497955322265625, 2.5928955078125, 2.687835693359375, 2.78277587890625, 2.877716064453125, 2.97265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 7.0, 6.0, 15.0, 13.0, 15.0, 26.0, 60.0, 94.0, 223.0, 419.0, 767.0, 1024.0, 670.0, 375.0, 177.0, 80.0, 40.0, 20.0, 10.0, 15.0, 12.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.3533935546875, -2.282958984375, -2.2125244140625, -2.14208984375, -2.0716552734375, -2.001220703125, -1.9307861328125, -1.8603515625, -1.7899169921875, -1.719482421875, -1.6490478515625, -1.57861328125, -1.5081787109375, -1.437744140625, -1.3673095703125, -1.296875, -1.2264404296875, -1.156005859375, -1.0855712890625, -1.01513671875, -0.9447021484375, -0.874267578125, -0.8038330078125, -0.7333984375, -0.6629638671875, -0.592529296875, -0.5220947265625, -0.45166015625, -0.3812255859375, -0.310791015625, -0.2403564453125, -0.169921875, -0.0994873046875, -0.029052734375, 0.0413818359375, 0.11181640625, 0.1822509765625, 0.252685546875, 0.3231201171875, 0.3935546875, 0.4639892578125, 0.534423828125, 0.6048583984375, 0.67529296875, 0.7457275390625, 0.816162109375, 0.8865966796875, 0.95703125, 1.0274658203125, 1.097900390625, 1.1683349609375, 1.23876953125, 1.3092041015625, 1.379638671875, 1.4500732421875, 1.5205078125, 1.5909423828125, 1.661376953125, 1.7318115234375, 1.80224609375, 1.8726806640625, 1.943115234375, 2.0135498046875, 2.083984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 16.0, 46.0, 85.0, 209.0, 282.0, 219.0, 76.0, 34.0, 14.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.630271911621094, -26.00605583190918, -25.3818416595459, -24.757625579833984, -24.133411407470703, -23.50919532775879, -22.884981155395508, -22.260765075683594, -21.636550903320312, -21.0123348236084, -20.388120651245117, -19.763904571533203, -19.139690399169922, -18.515474319458008, -17.891260147094727, -17.267044067382812, -16.64282989501953, -16.018613815307617, -15.394399642944336, -14.770184516906738, -14.14596939086914, -13.521754264831543, -12.897539138793945, -12.273323059082031, -11.649106979370117, -11.02489185333252, -10.400676727294922, -9.776461601257324, -9.152246475219727, -8.528031349182129, -7.903815746307373, -7.279600620269775, -6.6553850173950195, -6.031169891357422, -5.406954765319824, -4.782739639282227, -4.158524513244629, -3.534309148788452, -2.9100937843322754, -2.2858786582946777, -1.66166353225708, -1.0374484062194824, -0.4132331609725952, 0.210982084274292, 0.8351972103118896, 1.4594123363494873, 2.083627700805664, 2.7078428268432617, 3.3320579528808594, 3.956273078918457, 4.580488204956055, 5.204703330993652, 5.82891845703125, 6.453133583068848, 7.0773491859436035, 7.701564311981201, 8.32577896118164, 8.949994087219238, 9.574209213256836, 10.198424339294434, 10.822639465332031, 11.446854591369629, 12.071069717407227, 12.69528579711914, 13.319500923156738]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 7.0, 9.0, 11.0, 13.0, 16.0, 20.0, 36.0, 30.0, 43.0, 52.0, 40.0, 28.0, 55.0, 52.0, 51.0, 53.0, 48.0, 52.0, 42.0, 46.0, 43.0, 39.0, 19.0, 26.0, 30.0, 28.0, 16.0, 16.0, 12.0, 13.0, 8.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.886723041534424, -6.671534538269043, -6.456346035003662, -6.241157531738281, -6.0259690284729, -5.8107805252075195, -5.595592021942139, -5.380403518676758, -5.165215015411377, -4.950026512145996, -4.734838008880615, -4.519649505615234, -4.3044610023498535, -4.089272499084473, -3.874083995819092, -3.658895492553711, -3.44370698928833, -3.228518486022949, -3.0133299827575684, -2.7981414794921875, -2.5829529762268066, -2.367764472961426, -2.152575969696045, -1.937387466430664, -1.7221989631652832, -1.5070104598999023, -1.2918219566345215, -1.0766334533691406, -0.8614449501037598, -0.6462564468383789, -0.43106794357299805, -0.2158794403076172, -0.000690460205078125, 0.21449804306030273, 0.4296865463256836, 0.6448750495910645, 0.8600635528564453, 1.0752520561218262, 1.290440559387207, 1.505629062652588, 1.7208175659179688, 1.9360060691833496, 2.1511945724487305, 2.3663830757141113, 2.581571578979492, 2.796760082244873, 3.011948585510254, 3.2271370887756348, 3.4423255920410156, 3.6575140953063965, 3.8727025985717773, 4.087891101837158, 4.303079605102539, 4.51826810836792, 4.733456611633301, 4.948645114898682, 5.1638336181640625, 5.379022121429443, 5.594210624694824, 5.809399127960205, 6.024587631225586, 6.239776134490967, 6.454964637756348, 6.6701531410217285, 6.885341644287109]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 11.0, 15.0, 9.0, 14.0, 32.0, 46.0, 105.0, 174.0, 339.0, 770.0, 1814.0, 5461.0, 22480.0, 133664.0, 662179.0, 182220.0, 28659.0, 6621.0, 2189.0, 833.0, 412.0, 204.0, 103.0, 62.0, 39.0, 28.0, 25.0, 14.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.224609375, -2.1654052734375, -2.106201171875, -2.0469970703125, -1.98779296875, -1.9285888671875, -1.869384765625, -1.8101806640625, -1.7509765625, -1.6917724609375, -1.632568359375, -1.5733642578125, -1.51416015625, -1.4549560546875, -1.395751953125, -1.3365478515625, -1.27734375, -1.2181396484375, -1.158935546875, -1.0997314453125, -1.04052734375, -0.9813232421875, -0.922119140625, -0.8629150390625, -0.8037109375, -0.7445068359375, -0.685302734375, -0.6260986328125, -0.56689453125, -0.5076904296875, -0.448486328125, -0.3892822265625, -0.330078125, -0.2708740234375, -0.211669921875, -0.1524658203125, -0.09326171875, -0.0340576171875, 0.025146484375, 0.0843505859375, 0.1435546875, 0.2027587890625, 0.261962890625, 0.3211669921875, 0.38037109375, 0.4395751953125, 0.498779296875, 0.5579833984375, 0.6171875, 0.6763916015625, 0.735595703125, 0.7947998046875, 0.85400390625, 0.9132080078125, 0.972412109375, 1.0316162109375, 1.0908203125, 1.1500244140625, 1.209228515625, 1.2684326171875, 1.32763671875, 1.3868408203125, 1.446044921875, 1.5052490234375, 1.564453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 10.0, 9.0, 8.0, 16.0, 15.0, 14.0, 19.0, 31.0, 31.0, 32.0, 28.0, 37.0, 39.0, 41.0, 47.0, 48.0, 41.0, 34.0, 58.0, 55.0, 39.0, 36.0, 33.0, 33.0, 24.0, 24.0, 30.0, 27.0, 21.0, 17.0, 20.0, 13.0, 13.0, 14.0, 5.0, 4.0, 2.0, 5.0, 3.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.78466796875, -0.7618484497070312, -0.7390289306640625, -0.7162094116210938, -0.693389892578125, -0.6705703735351562, -0.6477508544921875, -0.6249313354492188, -0.60211181640625, -0.5792922973632812, -0.5564727783203125, -0.5336532592773438, -0.510833740234375, -0.48801422119140625, -0.4651947021484375, -0.44237518310546875, -0.4195556640625, -0.39673614501953125, -0.3739166259765625, -0.35109710693359375, -0.328277587890625, -0.30545806884765625, -0.2826385498046875, -0.25981903076171875, -0.23699951171875, -0.21417999267578125, -0.1913604736328125, -0.16854095458984375, -0.145721435546875, -0.12290191650390625, -0.1000823974609375, -0.07726287841796875, -0.054443359375, -0.03162384033203125, -0.0088043212890625, 0.01401519775390625, 0.036834716796875, 0.05965423583984375, 0.0824737548828125, 0.10529327392578125, 0.12811279296875, 0.15093231201171875, 0.1737518310546875, 0.19657135009765625, 0.219390869140625, 0.24221038818359375, 0.2650299072265625, 0.28784942626953125, 0.3106689453125, 0.33348846435546875, 0.3563079833984375, 0.37912750244140625, 0.401947021484375, 0.42476654052734375, 0.4475860595703125, 0.47040557861328125, 0.49322509765625, 0.5160446166992188, 0.5388641357421875, 0.5616836547851562, 0.584503173828125, 0.6073226928710938, 0.6301422119140625, 0.6529617309570312, 0.67578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 8.0, 1.0, 9.0, 16.0, 15.0, 16.0, 32.0, 45.0, 57.0, 105.0, 144.0, 273.0, 407.0, 877.0, 2094.0, 6756.0, 34657.0, 637529.0, 326744.0, 29315.0, 5788.0, 1848.0, 791.0, 429.0, 208.0, 126.0, 64.0, 59.0, 31.0, 20.0, 18.0, 15.0, 10.0, 9.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.06640625, -1.995025634765625, -1.92364501953125, -1.852264404296875, -1.7808837890625, -1.709503173828125, -1.63812255859375, -1.566741943359375, -1.495361328125, -1.423980712890625, -1.35260009765625, -1.281219482421875, -1.2098388671875, -1.138458251953125, -1.06707763671875, -0.995697021484375, -0.92431640625, -0.852935791015625, -0.78155517578125, -0.710174560546875, -0.6387939453125, -0.567413330078125, -0.49603271484375, -0.424652099609375, -0.353271484375, -0.281890869140625, -0.21051025390625, -0.139129638671875, -0.0677490234375, 0.003631591796875, 0.07501220703125, 0.146392822265625, 0.2177734375, 0.289154052734375, 0.36053466796875, 0.431915283203125, 0.5032958984375, 0.574676513671875, 0.64605712890625, 0.717437744140625, 0.788818359375, 0.860198974609375, 0.93157958984375, 1.002960205078125, 1.0743408203125, 1.145721435546875, 1.21710205078125, 1.288482666015625, 1.35986328125, 1.431243896484375, 1.50262451171875, 1.574005126953125, 1.6453857421875, 1.716766357421875, 1.78814697265625, 1.859527587890625, 1.930908203125, 2.002288818359375, 2.07366943359375, 2.145050048828125, 2.2164306640625, 2.287811279296875, 2.35919189453125, 2.430572509765625, 2.501953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 13.0, 9.0, 8.0, 15.0, 13.0, 29.0, 27.0, 33.0, 34.0, 37.0, 57.0, 81.0, 61.0, 73.0, 72.0, 64.0, 69.0, 58.0, 49.0, 35.0, 33.0, 31.0, 25.0, 15.0, 12.0, 15.0, 7.0, 4.0, 7.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.02569580078125, -3.9068603515625, -3.78802490234375, -3.669189453125, -3.55035400390625, -3.4315185546875, -3.31268310546875, -3.19384765625, -3.07501220703125, -2.9561767578125, -2.83734130859375, -2.718505859375, -2.59967041015625, -2.4808349609375, -2.36199951171875, -2.2431640625, -2.12432861328125, -2.0054931640625, -1.88665771484375, -1.767822265625, -1.64898681640625, -1.5301513671875, -1.41131591796875, -1.29248046875, -1.17364501953125, -1.0548095703125, -0.93597412109375, -0.817138671875, -0.69830322265625, -0.5794677734375, -0.46063232421875, -0.341796875, -0.22296142578125, -0.1041259765625, 0.01470947265625, 0.133544921875, 0.25238037109375, 0.3712158203125, 0.49005126953125, 0.60888671875, 0.72772216796875, 0.8465576171875, 0.96539306640625, 1.084228515625, 1.20306396484375, 1.3218994140625, 1.44073486328125, 1.5595703125, 1.67840576171875, 1.7972412109375, 1.91607666015625, 2.034912109375, 2.15374755859375, 2.2725830078125, 2.39141845703125, 2.51025390625, 2.62908935546875, 2.7479248046875, 2.86676025390625, 2.985595703125, 3.10443115234375, 3.2232666015625, 3.34210205078125, 3.4609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 9.0, 9.0, 7.0, 21.0, 21.0, 35.0, 52.0, 87.0, 109.0, 221.0, 474.0, 1275.0, 4646.0, 22905.0, 806647.0, 192278.0, 14700.0, 3192.0, 939.0, 392.0, 194.0, 103.0, 74.0, 49.0, 25.0, 18.0, 18.0, 11.0, 14.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98291015625, -0.9530105590820312, -0.9231109619140625, -0.8932113647460938, -0.863311767578125, -0.8334121704101562, -0.8035125732421875, -0.7736129760742188, -0.74371337890625, -0.7138137817382812, -0.6839141845703125, -0.6540145874023438, -0.624114990234375, -0.5942153930664062, -0.5643157958984375, -0.5344161987304688, -0.5045166015625, -0.47461700439453125, -0.4447174072265625, -0.41481781005859375, -0.384918212890625, -0.35501861572265625, -0.3251190185546875, -0.29521942138671875, -0.26531982421875, -0.23542022705078125, -0.2055206298828125, -0.17562103271484375, -0.145721435546875, -0.11582183837890625, -0.0859222412109375, -0.05602264404296875, -0.026123046875, 0.00377655029296875, 0.0336761474609375, 0.06357574462890625, 0.093475341796875, 0.12337493896484375, 0.1532745361328125, 0.18317413330078125, 0.21307373046875, 0.24297332763671875, 0.2728729248046875, 0.30277252197265625, 0.332672119140625, 0.36257171630859375, 0.3924713134765625, 0.42237091064453125, 0.4522705078125, 0.48217010498046875, 0.5120697021484375, 0.5419692993164062, 0.571868896484375, 0.6017684936523438, 0.6316680908203125, 0.6615676879882812, 0.69146728515625, 0.7213668823242188, 0.7512664794921875, 0.7811660766601562, 0.811065673828125, 0.8409652709960938, 0.8708648681640625, 0.9007644653320312, 0.9306640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 1.0, 2.0, 6.0, 4.0, 6.0, 8.0, 10.0, 8.0, 18.0, 10.0, 13.0, 42.0, 59.0, 120.0, 230.0, 191.0, 88.0, 61.0, 25.0, 20.0, 18.0, 14.0, 8.0, 4.0, 8.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00019216537475585938, -0.00018594972789287567, -0.00017973408102989197, -0.00017351843416690826, -0.00016730278730392456, -0.00016108714044094086, -0.00015487149357795715, -0.00014865584671497345, -0.00014244019985198975, -0.00013622455298900604, -0.00013000890612602234, -0.00012379325926303864, -0.00011757761240005493, -0.00011136196553707123, -0.00010514631867408752, -9.893067181110382e-05, -9.271502494812012e-05, -8.649937808513641e-05, -8.028373122215271e-05, -7.4068084359169e-05, -6.78524374961853e-05, -6.16367906332016e-05, -5.5421143770217896e-05, -4.920549690723419e-05, -4.298985004425049e-05, -3.6774203181266785e-05, -3.055855631828308e-05, -2.4342909455299377e-05, -1.8127262592315674e-05, -1.191161572933197e-05, -5.695968866348267e-06, 5.19677996635437e-07, 6.735324859619141e-06, 1.2950971722602844e-05, 1.9166618585586548e-05, 2.538226544857025e-05, 3.1597912311553955e-05, 3.781355917453766e-05, 4.402920603752136e-05, 5.0244852900505066e-05, 5.646049976348877e-05, 6.267614662647247e-05, 6.889179348945618e-05, 7.510744035243988e-05, 8.132308721542358e-05, 8.753873407840729e-05, 9.375438094139099e-05, 9.99700278043747e-05, 0.0001061856746673584, 0.0001124013215303421, 0.0001186169683933258, 0.0001248326152563095, 0.0001310482621192932, 0.00013726390898227692, 0.00014347955584526062, 0.00014969520270824432, 0.00015591084957122803, 0.00016212649643421173, 0.00016834214329719543, 0.00017455779016017914, 0.00018077343702316284, 0.00018698908388614655, 0.00019320473074913025, 0.00019942037761211395, 0.00020563602447509766]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 12.0, 17.0, 18.0, 22.0, 29.0, 43.0, 53.0, 69.0, 134.0, 215.0, 354.0, 594.0, 1133.0, 2254.0, 5013.0, 12477.0, 39717.0, 262552.0, 644798.0, 52412.0, 15233.0, 5837.0, 2645.0, 1240.0, 663.0, 369.0, 196.0, 129.0, 101.0, 64.0, 47.0, 35.0, 24.0, 16.0, 6.0, 8.0, 11.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5078125, -0.4919891357421875, -0.476165771484375, -0.4603424072265625, -0.44451904296875, -0.4286956787109375, -0.412872314453125, -0.3970489501953125, -0.3812255859375, -0.3654022216796875, -0.349578857421875, -0.3337554931640625, -0.31793212890625, -0.3021087646484375, -0.286285400390625, -0.2704620361328125, -0.254638671875, -0.2388153076171875, -0.222991943359375, -0.2071685791015625, -0.19134521484375, -0.1755218505859375, -0.159698486328125, -0.1438751220703125, -0.1280517578125, -0.1122283935546875, -0.096405029296875, -0.0805816650390625, -0.06475830078125, -0.0489349365234375, -0.033111572265625, -0.0172882080078125, -0.00146484375, 0.0143585205078125, 0.030181884765625, 0.0460052490234375, 0.06182861328125, 0.0776519775390625, 0.093475341796875, 0.1092987060546875, 0.1251220703125, 0.1409454345703125, 0.156768798828125, 0.1725921630859375, 0.18841552734375, 0.2042388916015625, 0.220062255859375, 0.2358856201171875, 0.251708984375, 0.2675323486328125, 0.283355712890625, 0.2991790771484375, 0.31500244140625, 0.3308258056640625, 0.346649169921875, 0.3624725341796875, 0.3782958984375, 0.3941192626953125, 0.409942626953125, 0.4257659912109375, 0.44158935546875, 0.4574127197265625, 0.473236083984375, 0.4890594482421875, 0.5048828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 4.0, 12.0, 7.0, 8.0, 13.0, 22.0, 27.0, 39.0, 54.0, 100.0, 100.0, 119.0, 114.0, 94.0, 60.0, 43.0, 32.0, 25.0, 27.0, 13.0, 20.0, 6.0, 7.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5, -0.48317718505859375, -0.4663543701171875, -0.44953155517578125, -0.432708740234375, -0.41588592529296875, -0.3990631103515625, -0.38224029541015625, -0.36541748046875, -0.34859466552734375, -0.3317718505859375, -0.31494903564453125, -0.298126220703125, -0.28130340576171875, -0.2644805908203125, -0.24765777587890625, -0.2308349609375, -0.21401214599609375, -0.1971893310546875, -0.18036651611328125, -0.163543701171875, -0.14672088623046875, -0.1298980712890625, -0.11307525634765625, -0.09625244140625, -0.07942962646484375, -0.0626068115234375, -0.04578399658203125, -0.028961181640625, -0.01213836669921875, 0.0046844482421875, 0.02150726318359375, 0.038330078125, 0.05515289306640625, 0.0719757080078125, 0.08879852294921875, 0.105621337890625, 0.12244415283203125, 0.1392669677734375, 0.15608978271484375, 0.17291259765625, 0.18973541259765625, 0.2065582275390625, 0.22338104248046875, 0.240203857421875, 0.25702667236328125, 0.2738494873046875, 0.29067230224609375, 0.3074951171875, 0.32431793212890625, 0.3411407470703125, 0.35796356201171875, 0.374786376953125, 0.39160919189453125, 0.4084320068359375, 0.42525482177734375, 0.44207763671875, 0.45890045166015625, 0.4757232666015625, 0.49254608154296875, 0.509368896484375, 0.5261917114257812, 0.5430145263671875, 0.5598373413085938, 0.57666015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 47.0, 389.0, 473.0, 56.0, 15.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.1500244140625, -48.75836944580078, -47.36671829223633, -45.975067138671875, -44.583412170410156, -43.19175720214844, -41.800106048583984, -40.40845489501953, -39.01679992675781, -37.625144958496094, -36.23349380493164, -34.84184265136719, -33.45018768310547, -32.05853271484375, -30.666881561279297, -29.27522850036621, -27.883575439453125, -26.49192237854004, -25.100269317626953, -23.708616256713867, -22.31696319580078, -20.925310134887695, -19.53365707397461, -18.142004013061523, -16.750350952148438, -15.358697891235352, -13.967044830322266, -12.57539176940918, -11.183738708496094, -9.792085647583008, -8.400432586669922, -7.008779525756836, -5.617130279541016, -4.22547721862793, -2.8338241577148438, -1.4421710968017578, -0.050518035888671875, 1.341135025024414, 2.7327880859375, 4.124441146850586, 5.516094207763672, 6.907747268676758, 8.299400329589844, 9.69105339050293, 11.082706451416016, 12.474359512329102, 13.866012573242188, 15.257665634155273, 16.64931869506836, 18.040971755981445, 19.43262481689453, 20.824277877807617, 22.215930938720703, 23.60758399963379, 24.999237060546875, 26.39089012145996, 27.782543182373047, 29.174196243286133, 30.56584930419922, 31.957502365112305, 33.34915542602539, 34.740806579589844, 36.13246154785156, 37.52411651611328, 38.915767669677734]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 10.0, 5.0, 7.0, 10.0, 16.0, 14.0, 18.0, 11.0, 27.0, 18.0, 38.0, 40.0, 39.0, 52.0, 76.0, 142.0, 107.0, 57.0, 45.0, 37.0, 34.0, 31.0, 37.0, 28.0, 19.0, 13.0, 14.0, 11.0, 13.0, 9.0, 8.0, 6.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.922733306884766, -10.529598236083984, -10.136462211608887, -9.743326187133789, -9.350191116333008, -8.957056045532227, -8.563920021057129, -8.170783996582031, -7.77764892578125, -7.3845133781433105, -6.991377830505371, -6.598242282867432, -6.205106735229492, -5.811971187591553, -5.418835639953613, -5.025700092315674, -4.632564544677734, -4.239428997039795, -3.8462934494018555, -3.453157901763916, -3.0600223541259766, -2.666886806488037, -2.2737512588500977, -1.8806157112121582, -1.4874801635742188, -1.0943446159362793, -0.7012090682983398, -0.3080735206604004, 0.08506202697753906, 0.4781975746154785, 0.871333122253418, 1.2644686698913574, 1.6576032638549805, 2.05073881149292, 2.4438743591308594, 2.837009906768799, 3.2301454544067383, 3.6232810020446777, 4.016416549682617, 4.409552097320557, 4.802687644958496, 5.1958231925964355, 5.588958740234375, 5.9820942878723145, 6.375229835510254, 6.768365383148193, 7.161500930786133, 7.554636478424072, 7.947772026062012, 8.34090805053711, 8.73404312133789, 9.127178192138672, 9.52031421661377, 9.913450241088867, 10.306585311889648, 10.69972038269043, 11.092856407165527, 11.485992431640625, 11.879127502441406, 12.272262573242188, 12.665398597717285, 13.058534622192383, 13.451669692993164, 13.844804763793945, 14.237940788269043]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 9.0, 15.0, 21.0, 27.0, 49.0, 95.0, 150.0, 250.0, 608.0, 1298.0, 3232.0, 10656.0, 69249.0, 2243608.0, 1791191.0, 58877.0, 9498.0, 3101.0, 1166.0, 556.0, 282.0, 135.0, 81.0, 40.0, 25.0, 16.0, 10.0, 12.0, 1.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.016510009765625, -2.91583251953125, -2.815155029296875, -2.7144775390625, -2.613800048828125, -2.51312255859375, -2.412445068359375, -2.311767578125, -2.211090087890625, -2.11041259765625, -2.009735107421875, -1.9090576171875, -1.808380126953125, -1.70770263671875, -1.607025146484375, -1.50634765625, -1.405670166015625, -1.30499267578125, -1.204315185546875, -1.1036376953125, -1.002960205078125, -0.90228271484375, -0.801605224609375, -0.700927734375, -0.600250244140625, -0.49957275390625, -0.398895263671875, -0.2982177734375, -0.197540283203125, -0.09686279296875, 0.003814697265625, 0.1044921875, 0.205169677734375, 0.30584716796875, 0.406524658203125, 0.5072021484375, 0.607879638671875, 0.70855712890625, 0.809234619140625, 0.909912109375, 1.010589599609375, 1.11126708984375, 1.211944580078125, 1.3126220703125, 1.413299560546875, 1.51397705078125, 1.614654541015625, 1.71533203125, 1.816009521484375, 1.91668701171875, 2.017364501953125, 2.1180419921875, 2.218719482421875, 2.31939697265625, 2.420074462890625, 2.520751953125, 2.621429443359375, 2.72210693359375, 2.822784423828125, 2.9234619140625, 3.024139404296875, 3.12481689453125, 3.225494384765625, 3.326171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 9.0, 5.0, 14.0, 23.0, 21.0, 25.0, 43.0, 51.0, 63.0, 74.0, 90.0, 82.0, 75.0, 77.0, 70.0, 68.0, 55.0, 49.0, 36.0, 31.0, 18.0, 15.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.427886962890625, -1.38604736328125, -1.344207763671875, -1.3023681640625, -1.260528564453125, -1.21868896484375, -1.176849365234375, -1.135009765625, -1.093170166015625, -1.05133056640625, -1.009490966796875, -0.9676513671875, -0.925811767578125, -0.88397216796875, -0.842132568359375, -0.80029296875, -0.758453369140625, -0.71661376953125, -0.674774169921875, -0.6329345703125, -0.591094970703125, -0.54925537109375, -0.507415771484375, -0.465576171875, -0.423736572265625, -0.38189697265625, -0.340057373046875, -0.2982177734375, -0.256378173828125, -0.21453857421875, -0.172698974609375, -0.130859375, -0.089019775390625, -0.04718017578125, -0.005340576171875, 0.0364990234375, 0.078338623046875, 0.12017822265625, 0.162017822265625, 0.203857421875, 0.245697021484375, 0.28753662109375, 0.329376220703125, 0.3712158203125, 0.413055419921875, 0.45489501953125, 0.496734619140625, 0.53857421875, 0.580413818359375, 0.62225341796875, 0.664093017578125, 0.7059326171875, 0.747772216796875, 0.78961181640625, 0.831451416015625, 0.873291015625, 0.915130615234375, 0.95697021484375, 0.998809814453125, 1.0406494140625, 1.082489013671875, 1.12432861328125, 1.166168212890625, 1.2080078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 10.0, 6.0, 14.0, 24.0, 45.0, 83.0, 196.0, 578.0, 2630.0, 226952.0, 3957606.0, 4801.0, 815.0, 305.0, 102.0, 53.0, 17.0, 9.0, 14.0, 6.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.4171142578125, -15.974853515625, -15.5325927734375, -15.09033203125, -14.6480712890625, -14.205810546875, -13.7635498046875, -13.3212890625, -12.8790283203125, -12.436767578125, -11.9945068359375, -11.55224609375, -11.1099853515625, -10.667724609375, -10.2254638671875, -9.783203125, -9.3409423828125, -8.898681640625, -8.4564208984375, -8.01416015625, -7.5718994140625, -7.129638671875, -6.6873779296875, -6.2451171875, -5.8028564453125, -5.360595703125, -4.9183349609375, -4.47607421875, -4.0338134765625, -3.591552734375, -3.1492919921875, -2.70703125, -2.2647705078125, -1.822509765625, -1.3802490234375, -0.93798828125, -0.4957275390625, -0.053466796875, 0.3887939453125, 0.8310546875, 1.2733154296875, 1.715576171875, 2.1578369140625, 2.60009765625, 3.0423583984375, 3.484619140625, 3.9268798828125, 4.369140625, 4.8114013671875, 5.253662109375, 5.6959228515625, 6.13818359375, 6.5804443359375, 7.022705078125, 7.4649658203125, 7.9072265625, 8.3494873046875, 8.791748046875, 9.2340087890625, 9.67626953125, 10.1185302734375, 10.560791015625, 11.0030517578125, 11.4453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 9.0, 7.0, 29.0, 51.0, 94.0, 167.0, 307.0, 573.0, 1005.0, 895.0, 441.0, 229.0, 102.0, 59.0, 37.0, 19.0, 8.0, 12.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.096923828125, -3.94384765625, -3.790771484375, -3.6376953125, -3.484619140625, -3.33154296875, -3.178466796875, -3.025390625, -2.872314453125, -2.71923828125, -2.566162109375, -2.4130859375, -2.260009765625, -2.10693359375, -1.953857421875, -1.80078125, -1.647705078125, -1.49462890625, -1.341552734375, -1.1884765625, -1.035400390625, -0.88232421875, -0.729248046875, -0.576171875, -0.423095703125, -0.27001953125, -0.116943359375, 0.0361328125, 0.189208984375, 0.34228515625, 0.495361328125, 0.6484375, 0.801513671875, 0.95458984375, 1.107666015625, 1.2607421875, 1.413818359375, 1.56689453125, 1.719970703125, 1.873046875, 2.026123046875, 2.17919921875, 2.332275390625, 2.4853515625, 2.638427734375, 2.79150390625, 2.944580078125, 3.09765625, 3.250732421875, 3.40380859375, 3.556884765625, 3.7099609375, 3.863037109375, 4.01611328125, 4.169189453125, 4.322265625, 4.475341796875, 4.62841796875, 4.781494140625, 4.9345703125, 5.087646484375, 5.24072265625, 5.393798828125, 5.546875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 7.0, 11.0, 10.0, 11.0, 23.0, 66.0, 174.0, 289.0, 225.0, 107.0, 38.0, 19.0, 11.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.26983642578125, -68.62259674072266, -66.97534942626953, -65.32810974121094, -63.68086624145508, -62.03362274169922, -60.38637924194336, -58.7391357421875, -57.091896057128906, -55.44465255737305, -53.79740905761719, -52.150169372558594, -50.502925872802734, -48.855682373046875, -47.208438873291016, -45.561195373535156, -43.9139518737793, -42.26670837402344, -40.61946487426758, -38.97222137451172, -37.324981689453125, -35.677738189697266, -34.030494689941406, -32.38325119018555, -30.73600959777832, -29.08876609802246, -27.441524505615234, -25.794281005859375, -24.147037506103516, -22.49979591369629, -20.85255241394043, -19.205310821533203, -17.558067321777344, -15.9108247756958, -14.263582229614258, -12.616338729858398, -10.969096183776855, -9.321853637695312, -7.674610137939453, -6.02736759185791, -4.380125045776367, -2.732882261276245, -1.085639476776123, 0.5616035461425781, 2.208846092224121, 3.856088638305664, 5.503332138061523, 7.150574684143066, 8.79781723022461, 10.445059776306152, 12.092302322387695, 13.739545822143555, 15.386788368225098, 17.03403091430664, 18.6812744140625, 20.32851791381836, 21.975759506225586, 23.623003005981445, 25.270244598388672, 26.91748809814453, 28.56473159790039, 30.211973190307617, 31.859216690063477, 33.5064582824707, 35.15370178222656]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 9.0, 17.0, 17.0, 19.0, 25.0, 24.0, 41.0, 33.0, 48.0, 71.0, 68.0, 85.0, 83.0, 79.0, 68.0, 56.0, 40.0, 47.0, 30.0, 22.0, 24.0, 25.0, 16.0, 13.0, 6.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-27.29422378540039, -26.57469367980957, -25.855161666870117, -25.135631561279297, -24.416099548339844, -23.696569442749023, -22.977039337158203, -22.25750732421875, -21.537975311279297, -20.818445205688477, -20.098913192749023, -19.379383087158203, -18.65985107421875, -17.94032096862793, -17.22079086303711, -16.501258850097656, -15.781728744506836, -15.0621976852417, -14.342666625976562, -13.623136520385742, -12.903604507446289, -12.184074401855469, -11.464543342590332, -10.745012283325195, -10.025481224060059, -9.305950164794922, -8.586419105529785, -7.866888523101807, -7.14735746383667, -6.427826404571533, -5.708295822143555, -4.988764762878418, -4.269235610961914, -3.5497045516967773, -2.8301737308502197, -2.110642910003662, -1.3911118507385254, -0.6715807914733887, 0.047949790954589844, 0.7674808502197266, 1.4870119094848633, 2.20654296875, 2.9260737895965576, 3.6456046104431152, 4.365135669708252, 5.084666728973389, 5.804197311401367, 6.523728370666504, 7.243259429931641, 7.962790489196777, 8.682321548461914, 9.401851654052734, 10.121383666992188, 10.840913772583008, 11.560444831848145, 12.279975891113281, 12.999506950378418, 13.719038009643555, 14.438569068908691, 15.158100128173828, 15.877630233764648, 16.5971622467041, 17.316692352294922, 18.036224365234375, 18.755754470825195]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 16.0, 17.0, 45.0, 45.0, 64.0, 113.0, 199.0, 298.0, 622.0, 1294.0, 2873.0, 7855.0, 27851.0, 170300.0, 680384.0, 122659.0, 22287.0, 6569.0, 2635.0, 1159.0, 537.0, 250.0, 168.0, 94.0, 60.0, 45.0, 28.0, 18.0, 11.0, 7.0, 4.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.803375244140625, -1.73760986328125, -1.671844482421875, -1.6060791015625, -1.540313720703125, -1.47454833984375, -1.408782958984375, -1.343017578125, -1.277252197265625, -1.21148681640625, -1.145721435546875, -1.0799560546875, -1.014190673828125, -0.94842529296875, -0.882659912109375, -0.81689453125, -0.751129150390625, -0.68536376953125, -0.619598388671875, -0.5538330078125, -0.488067626953125, -0.42230224609375, -0.356536865234375, -0.290771484375, -0.225006103515625, -0.15924072265625, -0.093475341796875, -0.0277099609375, 0.038055419921875, 0.10382080078125, 0.169586181640625, 0.2353515625, 0.301116943359375, 0.36688232421875, 0.432647705078125, 0.4984130859375, 0.564178466796875, 0.62994384765625, 0.695709228515625, 0.761474609375, 0.827239990234375, 0.89300537109375, 0.958770751953125, 1.0245361328125, 1.090301513671875, 1.15606689453125, 1.221832275390625, 1.28759765625, 1.353363037109375, 1.41912841796875, 1.484893798828125, 1.5506591796875, 1.616424560546875, 1.68218994140625, 1.747955322265625, 1.813720703125, 1.879486083984375, 1.94525146484375, 2.011016845703125, 2.0767822265625, 2.142547607421875, 2.20831298828125, 2.274078369140625, 2.33984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 33.0, 29.0, 38.0, 66.0, 66.0, 98.0, 103.0, 97.0, 96.0, 78.0, 94.0, 48.0, 47.0, 27.0, 27.0, 14.0, 6.0, 4.0, 1.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.11822509765625, -2.0509033203125, -1.98358154296875, -1.916259765625, -1.84893798828125, -1.7816162109375, -1.71429443359375, -1.64697265625, -1.57965087890625, -1.5123291015625, -1.44500732421875, -1.377685546875, -1.31036376953125, -1.2430419921875, -1.17572021484375, -1.1083984375, -1.04107666015625, -0.9737548828125, -0.90643310546875, -0.839111328125, -0.77178955078125, -0.7044677734375, -0.63714599609375, -0.56982421875, -0.50250244140625, -0.4351806640625, -0.36785888671875, -0.300537109375, -0.23321533203125, -0.1658935546875, -0.09857177734375, -0.03125, 0.03607177734375, 0.1033935546875, 0.17071533203125, 0.238037109375, 0.30535888671875, 0.3726806640625, 0.44000244140625, 0.50732421875, 0.57464599609375, 0.6419677734375, 0.70928955078125, 0.776611328125, 0.84393310546875, 0.9112548828125, 0.97857666015625, 1.0458984375, 1.11322021484375, 1.1805419921875, 1.24786376953125, 1.315185546875, 1.38250732421875, 1.4498291015625, 1.51715087890625, 1.58447265625, 1.65179443359375, 1.7191162109375, 1.78643798828125, 1.853759765625, 1.92108154296875, 1.9884033203125, 2.05572509765625, 2.123046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 1.0, 11.0, 7.0, 4.0, 10.0, 11.0, 24.0, 32.0, 44.0, 67.0, 108.0, 184.0, 334.0, 596.0, 1526.0, 5373.0, 41572.0, 882778.0, 102872.0, 9025.0, 2109.0, 796.0, 426.0, 218.0, 113.0, 80.0, 51.0, 38.0, 41.0, 20.0, 15.0, 12.0, 14.0, 7.0, 12.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.82421875, -2.7511444091796875, -2.678070068359375, -2.6049957275390625, -2.53192138671875, -2.4588470458984375, -2.385772705078125, -2.3126983642578125, -2.2396240234375, -2.1665496826171875, -2.093475341796875, -2.0204010009765625, -1.94732666015625, -1.8742523193359375, -1.801177978515625, -1.7281036376953125, -1.655029296875, -1.5819549560546875, -1.508880615234375, -1.4358062744140625, -1.36273193359375, -1.2896575927734375, -1.216583251953125, -1.1435089111328125, -1.0704345703125, -0.9973602294921875, -0.924285888671875, -0.8512115478515625, -0.77813720703125, -0.7050628662109375, -0.631988525390625, -0.5589141845703125, -0.48583984375, -0.4127655029296875, -0.339691162109375, -0.2666168212890625, -0.19354248046875, -0.1204681396484375, -0.047393798828125, 0.0256805419921875, 0.0987548828125, 0.1718292236328125, 0.244903564453125, 0.3179779052734375, 0.39105224609375, 0.4641265869140625, 0.537200927734375, 0.6102752685546875, 0.683349609375, 0.7564239501953125, 0.829498291015625, 0.9025726318359375, 0.97564697265625, 1.0487213134765625, 1.121795654296875, 1.1948699951171875, 1.2679443359375, 1.3410186767578125, 1.414093017578125, 1.4871673583984375, 1.56024169921875, 1.6333160400390625, 1.706390380859375, 1.7794647216796875, 1.8525390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 8.0, 2.0, 6.0, 6.0, 4.0, 5.0, 6.0, 11.0, 12.0, 14.0, 20.0, 20.0, 23.0, 31.0, 44.0, 47.0, 69.0, 67.0, 71.0, 77.0, 63.0, 68.0, 48.0, 39.0, 34.0, 31.0, 18.0, 28.0, 31.0, 22.0, 17.0, 7.0, 8.0, 6.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.9266357421875, -3.786865234375, -3.6470947265625, -3.50732421875, -3.3675537109375, -3.227783203125, -3.0880126953125, -2.9482421875, -2.8084716796875, -2.668701171875, -2.5289306640625, -2.38916015625, -2.2493896484375, -2.109619140625, -1.9698486328125, -1.830078125, -1.6903076171875, -1.550537109375, -1.4107666015625, -1.27099609375, -1.1312255859375, -0.991455078125, -0.8516845703125, -0.7119140625, -0.5721435546875, -0.432373046875, -0.2926025390625, -0.15283203125, -0.0130615234375, 0.126708984375, 0.2664794921875, 0.40625, 0.5460205078125, 0.685791015625, 0.8255615234375, 0.96533203125, 1.1051025390625, 1.244873046875, 1.3846435546875, 1.5244140625, 1.6641845703125, 1.803955078125, 1.9437255859375, 2.08349609375, 2.2232666015625, 2.363037109375, 2.5028076171875, 2.642578125, 2.7823486328125, 2.922119140625, 3.0618896484375, 3.20166015625, 3.3414306640625, 3.481201171875, 3.6209716796875, 3.7607421875, 3.9005126953125, 4.040283203125, 4.1800537109375, 4.31982421875, 4.4595947265625, 4.599365234375, 4.7391357421875, 4.87890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 10.0, 13.0, 15.0, 20.0, 33.0, 48.0, 55.0, 101.0, 182.0, 264.0, 462.0, 1058.0, 2786.0, 10179.0, 63283.0, 895814.0, 59457.0, 9793.0, 2634.0, 1027.0, 511.0, 275.0, 172.0, 105.0, 63.0, 39.0, 37.0, 23.0, 13.0, 16.0, 16.0, 7.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44775390625, -0.43306732177734375, -0.4183807373046875, -0.40369415283203125, -0.389007568359375, -0.37432098388671875, -0.3596343994140625, -0.34494781494140625, -0.33026123046875, -0.31557464599609375, -0.3008880615234375, -0.28620147705078125, -0.271514892578125, -0.25682830810546875, -0.2421417236328125, -0.22745513916015625, -0.2127685546875, -0.19808197021484375, -0.1833953857421875, -0.16870880126953125, -0.154022216796875, -0.13933563232421875, -0.1246490478515625, -0.10996246337890625, -0.09527587890625, -0.08058929443359375, -0.0659027099609375, -0.05121612548828125, -0.036529541015625, -0.02184295654296875, -0.0071563720703125, 0.00753021240234375, 0.022216796875, 0.03690338134765625, 0.0515899658203125, 0.06627655029296875, 0.080963134765625, 0.09564971923828125, 0.1103363037109375, 0.12502288818359375, 0.13970947265625, 0.15439605712890625, 0.1690826416015625, 0.18376922607421875, 0.198455810546875, 0.21314239501953125, 0.2278289794921875, 0.24251556396484375, 0.2572021484375, 0.27188873291015625, 0.2865753173828125, 0.30126190185546875, 0.315948486328125, 0.33063507080078125, 0.3453216552734375, 0.36000823974609375, 0.37469482421875, 0.38938140869140625, 0.4040679931640625, 0.41875457763671875, 0.433441162109375, 0.44812774658203125, 0.4628143310546875, 0.47750091552734375, 0.4921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 4.0, 4.0, 7.0, 7.0, 15.0, 11.0, 8.0, 21.0, 21.0, 23.0, 46.0, 59.0, 70.0, 99.0, 131.0, 118.0, 103.0, 62.0, 39.0, 33.0, 34.0, 14.0, 12.0, 6.0, 9.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.369850158691406e-05, -9.073875844478607e-05, -8.777901530265808e-05, -8.481927216053009e-05, -8.18595290184021e-05, -7.889978587627411e-05, -7.594004273414612e-05, -7.298029959201813e-05, -7.002055644989014e-05, -6.706081330776215e-05, -6.410107016563416e-05, -6.114132702350616e-05, -5.8181583881378174e-05, -5.522184073925018e-05, -5.226209759712219e-05, -4.93023544549942e-05, -4.634261131286621e-05, -4.338286817073822e-05, -4.042312502861023e-05, -3.746338188648224e-05, -3.450363874435425e-05, -3.154389560222626e-05, -2.8584152460098267e-05, -2.5624409317970276e-05, -2.2664666175842285e-05, -1.9704923033714294e-05, -1.6745179891586304e-05, -1.3785436749458313e-05, -1.0825693607330322e-05, -7.865950465202332e-06, -4.906207323074341e-06, -1.94646418094635e-06, 1.0132789611816406e-06, 3.973022103309631e-06, 6.932765245437622e-06, 9.892508387565613e-06, 1.2852251529693604e-05, 1.5811994671821594e-05, 1.8771737813949585e-05, 2.1731480956077576e-05, 2.4691224098205566e-05, 2.7650967240333557e-05, 3.061071038246155e-05, 3.357045352458954e-05, 3.653019666671753e-05, 3.948993980884552e-05, 4.244968295097351e-05, 4.54094260931015e-05, 4.836916923522949e-05, 5.132891237735748e-05, 5.4288655519485474e-05, 5.7248398661613464e-05, 6.0208141803741455e-05, 6.316788494586945e-05, 6.612762808799744e-05, 6.908737123012543e-05, 7.204711437225342e-05, 7.500685751438141e-05, 7.79666006565094e-05, 8.092634379863739e-05, 8.388608694076538e-05, 8.684583008289337e-05, 8.980557322502136e-05, 9.276531636714935e-05, 9.572505950927734e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 5.0, 6.0, 6.0, 8.0, 11.0, 23.0, 15.0, 33.0, 53.0, 112.0, 132.0, 245.0, 423.0, 731.0, 1467.0, 3586.0, 10095.0, 40346.0, 739980.0, 211359.0, 26756.0, 7573.0, 2845.0, 1256.0, 590.0, 352.0, 207.0, 126.0, 86.0, 34.0, 33.0, 14.0, 13.0, 7.0, 8.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.3367919921875, -0.32470703125, -0.3126220703125, -0.300537109375, -0.2884521484375, -0.2763671875, -0.2642822265625, -0.252197265625, -0.2401123046875, -0.22802734375, -0.2159423828125, -0.203857421875, -0.1917724609375, -0.1796875, -0.1676025390625, -0.155517578125, -0.1434326171875, -0.13134765625, -0.1192626953125, -0.107177734375, -0.0950927734375, -0.0830078125, -0.0709228515625, -0.058837890625, -0.0467529296875, -0.03466796875, -0.0225830078125, -0.010498046875, 0.0015869140625, 0.013671875, 0.0257568359375, 0.037841796875, 0.0499267578125, 0.06201171875, 0.0740966796875, 0.086181640625, 0.0982666015625, 0.1103515625, 0.1224365234375, 0.134521484375, 0.1466064453125, 0.15869140625, 0.1707763671875, 0.182861328125, 0.1949462890625, 0.20703125, 0.2191162109375, 0.231201171875, 0.2432861328125, 0.25537109375, 0.2674560546875, 0.279541015625, 0.2916259765625, 0.3037109375, 0.3157958984375, 0.327880859375, 0.3399658203125, 0.35205078125, 0.3641357421875, 0.376220703125, 0.3883056640625, 0.400390625, 0.4124755859375, 0.424560546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 3.0, 9.0, 9.0, 9.0, 11.0, 17.0, 12.0, 11.0, 29.0, 30.0, 38.0, 58.0, 58.0, 80.0, 93.0, 88.0, 71.0, 74.0, 53.0, 41.0, 35.0, 29.0, 26.0, 28.0, 13.0, 16.0, 9.0, 16.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.3932914733886719, -0.38033294677734375, -0.3673744201660156, -0.3544158935546875, -0.3414573669433594, -0.32849884033203125, -0.3155403137207031, -0.302581787109375, -0.2896232604980469, -0.27666473388671875, -0.2637062072753906, -0.2507476806640625, -0.23778915405273438, -0.22483062744140625, -0.21187210083007812, -0.19891357421875, -0.18595504760742188, -0.17299652099609375, -0.16003799438476562, -0.1470794677734375, -0.13412094116210938, -0.12116241455078125, -0.10820388793945312, -0.095245361328125, -0.08228683471679688, -0.06932830810546875, -0.056369781494140625, -0.0434112548828125, -0.030452728271484375, -0.01749420166015625, -0.004535675048828125, 0.0084228515625, 0.021381378173828125, 0.03433990478515625, 0.047298431396484375, 0.0602569580078125, 0.07321548461914062, 0.08617401123046875, 0.09913253784179688, 0.112091064453125, 0.12504959106445312, 0.13800811767578125, 0.15096664428710938, 0.1639251708984375, 0.17688369750976562, 0.18984222412109375, 0.20280075073242188, 0.21575927734375, 0.22871780395507812, 0.24167633056640625, 0.2546348571777344, 0.2675933837890625, 0.2805519104003906, 0.29351043701171875, 0.3064689636230469, 0.319427490234375, 0.3323860168457031, 0.34534454345703125, 0.3583030700683594, 0.3712615966796875, 0.3842201232910156, 0.39717864990234375, 0.4101371765136719, 0.423095703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 13.0, 16.0, 57.0, 224.0, 380.0, 188.0, 59.0, 30.0, 15.0, 8.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.913375854492188, -18.882577896118164, -17.851778030395508, -16.820980072021484, -15.790181159973145, -14.759382247924805, -13.728584289550781, -12.697785377502441, -11.666986465454102, -10.636187553405762, -9.605388641357422, -8.574590682983398, -7.543791770935059, -6.512992858886719, -5.482194423675537, -4.4513959884643555, -3.4205970764160156, -2.389798402786255, -1.3589997291564941, -0.3282010555267334, 0.7025976181030273, 1.7333965301513672, 2.764194965362549, 3.7949934005737305, 4.82579231262207, 5.85659122467041, 6.887389659881592, 7.918188095092773, 8.948987007141113, 9.979785919189453, 11.010583877563477, 12.041382789611816, 13.072181701660156, 14.102980613708496, 15.133779525756836, 16.16457748413086, 17.195377349853516, 18.22617530822754, 19.256973266601562, 20.28777313232422, 21.318571090698242, 22.349369049072266, 23.380168914794922, 24.410966873168945, 25.44176483154297, 26.472564697265625, 27.50336265563965, 28.534160614013672, 29.564960479736328, 30.59575843811035, 31.626558303833008, 32.65735626220703, 33.68815612792969, 34.718955993652344, 35.749752044677734, 36.78055191040039, 37.81134796142578, 38.84214782714844, 39.87294387817383, 40.903743743896484, 41.93454360961914, 42.96533966064453, 43.99613952636719, 45.026939392089844, 46.0577392578125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 6.0, 12.0, 18.0, 19.0, 20.0, 31.0, 46.0, 85.0, 68.0, 74.0, 82.0, 64.0, 84.0, 85.0, 72.0, 58.0, 34.0, 37.0, 22.0, 15.0, 10.0, 13.0, 9.0, 5.0, 2.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.85467529296875, -23.229001998901367, -22.60332679748535, -21.97765350341797, -21.351980209350586, -20.726306915283203, -20.100631713867188, -19.474958419799805, -18.849285125732422, -18.22361183166504, -17.597936630249023, -16.97226333618164, -16.346590042114258, -15.720915794372559, -15.09524154663086, -14.469568252563477, -13.843893051147461, -13.218218803405762, -12.592545509338379, -11.96687126159668, -11.341197967529297, -10.715523719787598, -10.089849472045898, -9.464176177978516, -8.838501930236816, -8.212827682495117, -7.587154388427734, -6.961480140686035, -6.335806369781494, -5.710132598876953, -5.084458351135254, -4.458784580230713, -3.833110809326172, -3.207437038421631, -2.5817630290985107, -1.9560891389846802, -1.3304152488708496, -0.7047414779663086, -0.07906746864318848, 0.5466065406799316, 1.1722803115844727, 1.7979542016983032, 2.423628091812134, 3.049302101135254, 3.674975872039795, 4.300649642944336, 4.926323890686035, 5.551997661590576, 6.177671432495117, 6.803345203399658, 7.429018974304199, 8.054693222045898, 8.680366516113281, 9.30604076385498, 9.93171501159668, 10.557388305664062, 11.183062553405762, 11.808736801147461, 12.434410095214844, 13.060084342956543, 13.685758590698242, 14.311431884765625, 14.937106132507324, 15.562780380249023, 16.188453674316406]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 15.0, 14.0, 19.0, 31.0, 39.0, 60.0, 92.0, 256.0, 208.0, 91.0, 65.0, 34.0, 32.0, 20.0, 9.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.34765625, -3.2714996337890625, -3.195343017578125, -3.1191864013671875, -3.04302978515625, -2.9668731689453125, -2.890716552734375, -2.8145599365234375, -2.7384033203125, -2.6622467041015625, -2.586090087890625, -2.5099334716796875, -2.43377685546875, -2.3576202392578125, -2.281463623046875, -2.2053070068359375, -2.129150390625, -2.0529937744140625, -1.976837158203125, -1.9006805419921875, -1.82452392578125, -1.7483673095703125, -1.672210693359375, -1.5960540771484375, -1.5198974609375, -1.4437408447265625, -1.367584228515625, -1.2914276123046875, -1.21527099609375, -1.1391143798828125, -1.062957763671875, -0.9868011474609375, -0.91064453125, -0.8344879150390625, -0.758331298828125, -0.6821746826171875, -0.60601806640625, -0.5298614501953125, -0.453704833984375, -0.3775482177734375, -0.3013916015625, -0.2252349853515625, -0.149078369140625, -0.0729217529296875, 0.00323486328125, 0.0793914794921875, 0.155548095703125, 0.2317047119140625, 0.307861328125, 0.3840179443359375, 0.460174560546875, 0.5363311767578125, 0.61248779296875, 0.6886444091796875, 0.764801025390625, 0.8409576416015625, 0.9171142578125, 0.9932708740234375, 1.069427490234375, 1.1455841064453125, 1.22174072265625, 1.2978973388671875, 1.374053955078125, 1.4502105712890625, 1.5263671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 13.0, 23.0, 17.0, 36.0, 131.0, 237.0, 1048.0, 19576.0, 8363456.0, 3249.0, 435.0, 145.0, 77.0, 61.0, 13.0, 14.0, 9.0, 12.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.985815048217773, -18.35810089111328, -17.730384826660156, -17.102670669555664, -16.474956512451172, -15.847240447998047, -15.219526290893555, -14.591811180114746, -13.964096069335938, -13.336380958557129, -12.70866584777832, -12.080951690673828, -11.45323657989502, -10.825521469116211, -10.197807312011719, -9.57009220123291, -8.942377090454102, -8.314661979675293, -7.686947345733643, -7.059232711791992, -6.431517601013184, -5.803802490234375, -5.176087856292725, -4.548373222351074, -3.9206581115722656, -3.292943239212036, -2.6652283668518066, -2.037513494491577, -1.4097986221313477, -0.7820837497711182, -0.15436887741088867, 0.4733457565307617, 1.1010608673095703, 1.7287757396697998, 2.3564906120300293, 2.984205484390259, 3.6119203567504883, 4.239635467529297, 4.867350101470947, 5.495064735412598, 6.122779846191406, 6.750494956970215, 7.378209590911865, 8.005924224853516, 8.633639335632324, 9.261354446411133, 9.889068603515625, 10.516783714294434, 11.144498825073242, 11.77221393585205, 12.39992904663086, 13.027643203735352, 13.65535831451416, 14.283073425292969, 14.910787582397461, 15.53850269317627, 16.166217803955078, 16.79393196105957, 17.421648025512695, 18.049362182617188, 18.677078247070312, 19.304792404174805, 19.932506561279297, 20.560222625732422, 21.187936782836914]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.634408950805664, -29.937395095825195, -29.240381240844727, -28.543367385864258, -27.846355438232422, -27.149341583251953, -26.452327728271484, -25.755313873291016, -25.058300018310547, -24.361286163330078, -23.66427230834961, -22.96725845336914, -22.270244598388672, -21.573232650756836, -20.876218795776367, -20.1792049407959, -19.48219108581543, -18.78517723083496, -18.088163375854492, -17.391149520874023, -16.694137573242188, -15.997122764587402, -15.30010986328125, -14.603096008300781, -13.906082153320312, -13.209068298339844, -12.512054443359375, -11.815041542053223, -11.118027687072754, -10.421013832092285, -9.724000930786133, -9.026987075805664, -8.329975128173828, -7.632961273193359, -6.935947895050049, -6.238934516906738, -5.5419206619262695, -4.844906806945801, -4.14789342880249, -3.4508800506591797, -2.753866195678711, -2.0568525791168213, -1.3598389625549316, -0.662825345993042, 0.034188270568847656, 0.7312018871307373, 1.428215503692627, 2.1252288818359375, 2.8222427368164062, 3.519256353378296, 4.2162699699401855, 4.913283348083496, 5.610297203063965, 6.307311058044434, 7.004324436187744, 7.701337814331055, 8.398351669311523, 9.095365524291992, 9.792379379272461, 10.489392280578613, 11.186406135559082, 11.88341999053955, 12.580432891845703, 13.277446746826172, 13.97446060180664]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 8.0, 8.0, 14.0, 23.0, 30.0, 44.0, 85.0, 91.0, 113.0, 105.0, 93.0, 93.0, 78.0, 57.0, 46.0, 33.0, 26.0, 18.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0, -0.9674530029296875, -0.934906005859375, -0.9023590087890625, -0.86981201171875, -0.8372650146484375, -0.804718017578125, -0.7721710205078125, -0.7396240234375, -0.7070770263671875, -0.674530029296875, -0.6419830322265625, -0.60943603515625, -0.5768890380859375, -0.544342041015625, -0.5117950439453125, -0.479248046875, -0.4467010498046875, -0.414154052734375, -0.3816070556640625, -0.34906005859375, -0.3165130615234375, -0.283966064453125, -0.2514190673828125, -0.2188720703125, -0.1863250732421875, -0.153778076171875, -0.1212310791015625, -0.08868408203125, -0.0561370849609375, -0.023590087890625, 0.0089569091796875, 0.04150390625, 0.0740509033203125, 0.106597900390625, 0.1391448974609375, 0.17169189453125, 0.2042388916015625, 0.236785888671875, 0.2693328857421875, 0.3018798828125, 0.3344268798828125, 0.366973876953125, 0.3995208740234375, 0.43206787109375, 0.4646148681640625, 0.497161865234375, 0.5297088623046875, 0.562255859375, 0.5948028564453125, 0.627349853515625, 0.6598968505859375, 0.69244384765625, 0.7249908447265625, 0.757537841796875, 0.7900848388671875, 0.8226318359375, 0.8551788330078125, 0.887725830078125, 0.9202728271484375, 0.95281982421875, 0.9853668212890625, 1.017913818359375, 1.0504608154296875, 1.0830078125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 2.0, 4.0, 4.0, 3.0, 7.0, 16.0, 10.0, 26.0, 29.0, 42.0, 58.0, 75.0, 153.0, 242.0, 503.0, 1103.0, 3252.0, 13122.0, 77676.0, 311976.0, 94537.0, 15290.0, 3659.0, 1209.0, 588.0, 294.0, 160.0, 92.0, 45.0, 25.0, 20.0, 13.0, 8.0, 5.0, 3.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.0234375, -14.6529541015625, -14.282470703125, -13.9119873046875, -13.54150390625, -13.1710205078125, -12.800537109375, -12.4300537109375, -12.0595703125, -11.6890869140625, -11.318603515625, -10.9481201171875, -10.57763671875, -10.2071533203125, -9.836669921875, -9.4661865234375, -9.095703125, -8.7252197265625, -8.354736328125, -7.9842529296875, -7.61376953125, -7.2432861328125, -6.872802734375, -6.5023193359375, -6.1318359375, -5.7613525390625, -5.390869140625, -5.0203857421875, -4.64990234375, -4.2794189453125, -3.908935546875, -3.5384521484375, -3.16796875, -2.7974853515625, -2.427001953125, -2.0565185546875, -1.68603515625, -1.3155517578125, -0.945068359375, -0.5745849609375, -0.2041015625, 0.1663818359375, 0.536865234375, 0.9073486328125, 1.27783203125, 1.6483154296875, 2.018798828125, 2.3892822265625, 2.759765625, 3.1302490234375, 3.500732421875, 3.8712158203125, 4.24169921875, 4.6121826171875, 4.982666015625, 5.3531494140625, 5.7236328125, 6.0941162109375, 6.464599609375, 6.8350830078125, 7.20556640625, 7.5760498046875, 7.946533203125, 8.3170166015625, 8.6875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 13.0, 11.0, 11.0, 29.0, 29.0, 48.0, 59.0, 76.0, 102.0, 99.0, 115.0, 111.0, 70.0, 80.0, 32.0, 30.0, 26.0, 14.0, 10.0, 8.0, 8.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.51953125, -2.4581146240234375, -2.396697998046875, -2.3352813720703125, -2.27386474609375, -2.2124481201171875, -2.151031494140625, -2.0896148681640625, -2.0281982421875, -1.9667816162109375, -1.905364990234375, -1.8439483642578125, -1.78253173828125, -1.7211151123046875, -1.659698486328125, -1.5982818603515625, -1.536865234375, -1.4754486083984375, -1.414031982421875, -1.3526153564453125, -1.29119873046875, -1.2297821044921875, -1.168365478515625, -1.1069488525390625, -1.0455322265625, -0.9841156005859375, -0.922698974609375, -0.8612823486328125, -0.79986572265625, -0.7384490966796875, -0.677032470703125, -0.6156158447265625, -0.55419921875, -0.4927825927734375, -0.431365966796875, -0.3699493408203125, -0.30853271484375, -0.2471160888671875, -0.185699462890625, -0.1242828369140625, -0.0628662109375, -0.0014495849609375, 0.059967041015625, 0.1213836669921875, 0.18280029296875, 0.2442169189453125, 0.305633544921875, 0.3670501708984375, 0.428466796875, 0.4898834228515625, 0.551300048828125, 0.6127166748046875, 0.67413330078125, 0.7355499267578125, 0.796966552734375, 0.8583831787109375, 0.9197998046875, 0.9812164306640625, 1.042633056640625, 1.1040496826171875, 1.16546630859375, 1.2268829345703125, 1.288299560546875, 1.3497161865234375, 1.4111328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 14.0, 8.0, 22.0, 33.0, 51.0, 90.0, 78.0, 82.0, 38.0, 27.0, 9.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.384020805358887, -8.034505844116211, -7.684991836547852, -7.335476875305176, -6.985962390899658, -6.636447906494141, -6.286932945251465, -5.937418460845947, -5.58790397644043, -5.238389492034912, -4.8888750076293945, -4.539360046386719, -4.189845561981201, -3.8403310775756836, -3.490816354751587, -3.1413016319274902, -2.7917871475219727, -2.442272663116455, -2.0927579402923584, -1.7432433366775513, -1.3937287330627441, -1.044214129447937, -0.6946995258331299, -0.3451848030090332, 0.004329681396484375, 0.3538442850112915, 0.7033588886260986, 1.0528734922409058, 1.402388095855713, 1.75190269947052, 2.101417303085327, 2.450932025909424, 2.800445556640625, 3.1499600410461426, 3.4994747638702393, 3.848989486694336, 4.1985039710998535, 4.548018455505371, 4.897533416748047, 5.2470479011535645, 5.596562385559082, 5.9460768699646, 6.295591354370117, 6.645106315612793, 6.9946208000183105, 7.344135284423828, 7.693650245666504, 8.04316520690918, 8.392679214477539, 8.742194175720215, 9.091708183288574, 9.44122314453125, 9.79073715209961, 10.140252113342285, 10.489767074584961, 10.83928108215332, 11.188796043395996, 11.538311004638672, 11.887825012207031, 12.237339973449707, 12.586854934692383, 12.936368942260742, 13.285883903503418, 13.635398864746094, 13.984912872314453]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 11.0, 13.0, 24.0, 43.0, 57.0, 89.0, 89.0, 54.0, 24.0, 15.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.315199375152588, -7.070064067840576, -6.824928283691406, -6.5797929763793945, -6.334657192230225, -6.089521884918213, -5.844386100769043, -5.599250793457031, -5.3541154861450195, -5.108980178833008, -4.863844394683838, -4.618709087371826, -4.373573303222656, -4.1284379959106445, -3.8833024501800537, -3.638166904449463, -3.393031120300293, -3.147895574569702, -2.9027600288391113, -2.6576247215270996, -2.4124889373779297, -2.167353630065918, -1.9222180843353271, -1.6770825386047363, -1.4319469928741455, -1.1868114471435547, -0.9416759610176086, -0.6965404748916626, -0.4514049291610718, -0.20626938343048096, 0.03886604309082031, 0.28400158882141113, 0.5291376113891602, 0.774273157119751, 1.0194087028503418, 1.264544129371643, 1.5096796751022339, 1.7548152208328247, 1.999950647354126, 2.245086193084717, 2.4902217388153076, 2.7353572845458984, 2.9804928302764893, 3.22562837600708, 3.470763683319092, 3.7158994674682617, 3.9610347747802734, 4.206170082092285, 4.451305866241455, 4.696441173553467, 4.941576957702637, 5.186712265014648, 5.431848049163818, 5.67698335647583, 5.922119140625, 6.167254447937012, 6.412389755249023, 6.657525062561035, 6.902660846710205, 7.147796154022217, 7.392931938171387, 7.638067245483398, 7.88320255279541, 8.128337860107422, 8.37347412109375]}, "eval/loss": 2.6299471855163574, "eval/wer": 1.4451408171360571, "eval/runtime": 336.2822, "eval/samples_per_second": 7.856, "eval/steps_per_second": 0.494} \ No newline at end of file +{"train/loss": 0.1177, "train/learning_rate": 5.557377049180327e-05, "train/epoch": 9.01, "train/global_step": 1000, "_runtime": 23313, "_timestamp": 1648510215, "_step": 1001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 12.0, 20.0, 24.0, 32.0, 39.0, 71.0, 74.0, 94.0, 117.0, 103.0, 81.0, 77.0, 69.0, 54.0, 32.0, 26.0, 18.0, 10.0, 14.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6982321739196777, -1.651377558708191, -1.604522943496704, -1.5576683282852173, -1.5108137130737305, -1.4639590978622437, -1.4171044826507568, -1.37024986743927, -1.3233952522277832, -1.2765406370162964, -1.2296860218048096, -1.1828314065933228, -1.135976791381836, -1.0891221761703491, -1.0422675609588623, -0.9954129457473755, -0.9485583305358887, -0.9017037153244019, -0.854849100112915, -0.8079944849014282, -0.7611398696899414, -0.7142852544784546, -0.6674306392669678, -0.620576024055481, -0.5737214088439941, -0.5268667936325073, -0.4800121784210205, -0.4331575632095337, -0.3863029479980469, -0.33944833278656006, -0.29259371757507324, -0.24573910236358643, -0.19888460636138916, -0.15202999114990234, -0.10517537593841553, -0.05832076072692871, -0.011466145515441895, 0.03538846969604492, 0.08224308490753174, 0.12909770011901855, 0.17595231533050537, 0.2228069305419922, 0.269661545753479, 0.3165161609649658, 0.36337077617645264, 0.41022539138793945, 0.45708000659942627, 0.5039346218109131, 0.5507892370223999, 0.5976438522338867, 0.6444984674453735, 0.6913530826568604, 0.7382076978683472, 0.785062313079834, 0.8319169282913208, 0.8787715435028076, 0.9256261587142944, 0.9724807739257812, 1.019335389137268, 1.0661900043487549, 1.1130446195602417, 1.1598992347717285, 1.2067538499832153, 1.2536084651947021, 1.300463080406189]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 6.0, 10.0, 15.0, 18.0, 19.0, 18.0, 17.0, 31.0, 24.0, 42.0, 24.0, 37.0, 26.0, 42.0, 31.0, 38.0, 47.0, 29.0, 31.0, 33.0, 45.0, 35.0, 46.0, 32.0, 38.0, 24.0, 29.0, 27.0, 27.0, 24.0, 15.0, 16.0, 12.0, 16.0, 14.0, 12.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.7940231561660767, -0.7693271636962891, -0.7446311712265015, -0.7199351787567139, -0.6952391862869263, -0.6705431938171387, -0.6458472013473511, -0.6211512088775635, -0.5964552164077759, -0.5717592239379883, -0.5470632314682007, -0.5223672389984131, -0.4976712465286255, -0.4729752540588379, -0.4482792615890503, -0.4235832691192627, -0.3988872766494751, -0.3741912841796875, -0.3494952917098999, -0.3247992992401123, -0.3001033067703247, -0.2754073143005371, -0.2507113218307495, -0.22601532936096191, -0.20131933689117432, -0.17662334442138672, -0.15192735195159912, -0.12723135948181152, -0.10253536701202393, -0.07783937454223633, -0.05314338207244873, -0.028447389602661133, -0.0037513375282287598, 0.020944654941558838, 0.045640647411346436, 0.07033663988113403, 0.09503263235092163, 0.11972862482070923, 0.14442461729049683, 0.16912060976028442, 0.19381660223007202, 0.21851259469985962, 0.24320858716964722, 0.2679045796394348, 0.2926005721092224, 0.31729656457901, 0.3419925570487976, 0.3666885495185852, 0.3913845419883728, 0.4160805344581604, 0.440776526927948, 0.4654725193977356, 0.4901685118675232, 0.5148645043373108, 0.5395604968070984, 0.564256489276886, 0.5889524817466736, 0.6136484742164612, 0.6383444666862488, 0.6630404591560364, 0.687736451625824, 0.7124324440956116, 0.7371284365653992, 0.7618244290351868, 0.7865204215049744]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 2.0, 8.0, 6.0, 11.0, 18.0, 13.0, 32.0, 34.0, 69.0, 81.0, 108.0, 143.0, 216.0, 333.0, 489.0, 724.0, 1109.0, 1788.0, 2812.0, 5143.0, 11100.0, 35137.0, 253462.0, 1494864.0, 1929695.0, 381752.0, 49243.0, 12019.0, 5573.0, 3088.0, 1833.0, 1142.0, 771.0, 406.0, 331.0, 220.0, 153.0, 105.0, 72.0, 55.0, 38.0, 15.0, 28.0, 13.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.755859375, -2.654144287109375, -2.55242919921875, -2.450714111328125, -2.3489990234375, -2.247283935546875, -2.14556884765625, -2.043853759765625, -1.942138671875, -1.840423583984375, -1.73870849609375, -1.636993408203125, -1.5352783203125, -1.433563232421875, -1.33184814453125, -1.230133056640625, -1.12841796875, -1.026702880859375, -0.92498779296875, -0.823272705078125, -0.7215576171875, -0.619842529296875, -0.51812744140625, -0.416412353515625, -0.314697265625, -0.212982177734375, -0.11126708984375, -0.009552001953125, 0.0921630859375, 0.193878173828125, 0.29559326171875, 0.397308349609375, 0.4990234375, 0.600738525390625, 0.70245361328125, 0.804168701171875, 0.9058837890625, 1.007598876953125, 1.10931396484375, 1.211029052734375, 1.312744140625, 1.414459228515625, 1.51617431640625, 1.617889404296875, 1.7196044921875, 1.821319580078125, 1.92303466796875, 2.024749755859375, 2.12646484375, 2.228179931640625, 2.32989501953125, 2.431610107421875, 2.5333251953125, 2.635040283203125, 2.73675537109375, 2.838470458984375, 2.940185546875, 3.041900634765625, 3.14361572265625, 3.245330810546875, 3.3470458984375, 3.448760986328125, 3.55047607421875, 3.652191162109375, 3.75390625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 15.0, 13.0, 14.0, 22.0, 24.0, 29.0, 21.0, 38.0, 26.0, 51.0, 35.0, 32.0, 49.0, 40.0, 36.0, 35.0, 45.0, 51.0, 41.0, 46.0, 38.0, 28.0, 27.0, 32.0, 31.0, 26.0, 18.0, 12.0, 25.0, 19.0, 17.0, 8.0, 8.0, 8.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.717010498046875, -1.65472412109375, -1.592437744140625, -1.5301513671875, -1.467864990234375, -1.40557861328125, -1.343292236328125, -1.281005859375, -1.218719482421875, -1.15643310546875, -1.094146728515625, -1.0318603515625, -0.969573974609375, -0.90728759765625, -0.845001220703125, -0.78271484375, -0.720428466796875, -0.65814208984375, -0.595855712890625, -0.5335693359375, -0.471282958984375, -0.40899658203125, -0.346710205078125, -0.284423828125, -0.222137451171875, -0.15985107421875, -0.097564697265625, -0.0352783203125, 0.027008056640625, 0.08929443359375, 0.151580810546875, 0.2138671875, 0.276153564453125, 0.33843994140625, 0.400726318359375, 0.4630126953125, 0.525299072265625, 0.58758544921875, 0.649871826171875, 0.712158203125, 0.774444580078125, 0.83673095703125, 0.899017333984375, 0.9613037109375, 1.023590087890625, 1.08587646484375, 1.148162841796875, 1.21044921875, 1.272735595703125, 1.33502197265625, 1.397308349609375, 1.4595947265625, 1.521881103515625, 1.58416748046875, 1.646453857421875, 1.708740234375, 1.771026611328125, 1.83331298828125, 1.895599365234375, 1.9578857421875, 2.020172119140625, 2.08245849609375, 2.144744873046875, 2.20703125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 14.0, 35.0, 69.0, 190.0, 1104.0, 72219.0, 4115758.0, 4331.0, 374.0, 83.0, 35.0, 24.0, 9.0, 8.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.333984375, -22.65234375, -21.970703125, -21.2890625, -20.607421875, -19.92578125, -19.244140625, -18.5625, -17.880859375, -17.19921875, -16.517578125, -15.8359375, -15.154296875, -14.47265625, -13.791015625, -13.109375, -12.427734375, -11.74609375, -11.064453125, -10.3828125, -9.701171875, -9.01953125, -8.337890625, -7.65625, -6.974609375, -6.29296875, -5.611328125, -4.9296875, -4.248046875, -3.56640625, -2.884765625, -2.203125, -1.521484375, -0.83984375, -0.158203125, 0.5234375, 1.205078125, 1.88671875, 2.568359375, 3.25, 3.931640625, 4.61328125, 5.294921875, 5.9765625, 6.658203125, 7.33984375, 8.021484375, 8.703125, 9.384765625, 10.06640625, 10.748046875, 11.4296875, 12.111328125, 12.79296875, 13.474609375, 14.15625, 14.837890625, 15.51953125, 16.201171875, 16.8828125, 17.564453125, 18.24609375, 18.927734375, 19.609375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 10.0, 17.0, 16.0, 31.0, 34.0, 73.0, 111.0, 172.0, 353.0, 783.0, 1166.0, 610.0, 289.0, 158.0, 71.0, 62.0, 29.0, 12.0, 17.0, 13.0, 9.0, 5.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.3744964599609375, -1.332000732421875, -1.2895050048828125, -1.24700927734375, -1.2045135498046875, -1.162017822265625, -1.1195220947265625, -1.0770263671875, -1.0345306396484375, -0.992034912109375, -0.9495391845703125, -0.90704345703125, -0.8645477294921875, -0.822052001953125, -0.7795562744140625, -0.737060546875, -0.6945648193359375, -0.652069091796875, -0.6095733642578125, -0.56707763671875, -0.5245819091796875, -0.482086181640625, -0.4395904541015625, -0.3970947265625, -0.3545989990234375, -0.312103271484375, -0.2696075439453125, -0.22711181640625, -0.1846160888671875, -0.142120361328125, -0.0996246337890625, -0.05712890625, -0.0146331787109375, 0.027862548828125, 0.0703582763671875, 0.11285400390625, 0.1553497314453125, 0.197845458984375, 0.2403411865234375, 0.2828369140625, 0.3253326416015625, 0.367828369140625, 0.4103240966796875, 0.45281982421875, 0.4953155517578125, 0.537811279296875, 0.5803070068359375, 0.622802734375, 0.6652984619140625, 0.707794189453125, 0.7502899169921875, 0.79278564453125, 0.8352813720703125, 0.877777099609375, 0.9202728271484375, 0.9627685546875, 1.0052642822265625, 1.047760009765625, 1.0902557373046875, 1.13275146484375, 1.1752471923828125, 1.217742919921875, 1.2602386474609375, 1.302734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 2.0, 7.0, 15.0, 5.0, 12.0, 19.0, 22.0, 31.0, 25.0, 47.0, 40.0, 45.0, 76.0, 58.0, 75.0, 69.0, 54.0, 69.0, 55.0, 58.0, 45.0, 32.0, 15.0, 26.0, 20.0, 15.0, 13.0, 12.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4160919189453125, -2.338754892349243, -2.261418104171753, -2.1840810775756836, -2.1067442893981934, -2.029407262802124, -1.9520702362060547, -1.874733328819275, -1.7973964214324951, -1.7200595140457153, -1.6427226066589355, -1.5653855800628662, -1.4880486726760864, -1.4107117652893066, -1.3333747386932373, -1.2560378313064575, -1.1787009239196777, -1.101364016532898, -1.0240271091461182, -0.9466900825500488, -0.869353175163269, -0.7920162677764893, -0.7146793007850647, -0.6373423337936401, -0.5600054264068604, -0.4826684892177582, -0.405331552028656, -0.32799461483955383, -0.25065767765045166, -0.1733207404613495, -0.09598380327224731, -0.018646836280822754, 0.05869007110595703, 0.1360270082950592, 0.21336394548416138, 0.29070088267326355, 0.3680378198623657, 0.4453747570514679, 0.5227116942405701, 0.6000486612319946, 0.6773855686187744, 0.7547224760055542, 0.8320594429969788, 0.9093964099884033, 0.9867333173751831, 1.064070224761963, 1.1414072513580322, 1.218744158744812, 1.2960810661315918, 1.3734179735183716, 1.4507548809051514, 1.5280919075012207, 1.6054288148880005, 1.6827657222747803, 1.7601027488708496, 1.8374396562576294, 1.9147765636444092, 1.992113471031189, 2.0694503784179688, 2.146787405014038, 2.2241244316101074, 2.3014612197875977, 2.378798246383667, 2.4561352729797363, 2.5334720611572266]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 7.0, 14.0, 12.0, 13.0, 21.0, 22.0, 21.0, 22.0, 24.0, 18.0, 25.0, 42.0, 28.0, 30.0, 37.0, 35.0, 32.0, 46.0, 38.0, 38.0, 31.0, 43.0, 43.0, 28.0, 34.0, 23.0, 23.0, 31.0, 27.0, 16.0, 17.0, 29.0, 16.0, 11.0, 10.0, 11.0, 10.0, 5.0, 11.0, 10.0, 2.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.5252161026000977, -1.4722870588302612, -1.4193580150604248, -1.3664289712905884, -1.313499927520752, -1.2605708837509155, -1.207641839981079, -1.1547127962112427, -1.1017837524414062, -1.0488547086715698, -0.9959256649017334, -0.942996621131897, -0.8900675773620605, -0.8371385335922241, -0.7842094898223877, -0.7312804460525513, -0.6783514022827148, -0.6254223585128784, -0.572493314743042, -0.5195642709732056, -0.46663522720336914, -0.4137061834335327, -0.3607771396636963, -0.30784809589385986, -0.25491905212402344, -0.201990008354187, -0.14906096458435059, -0.09613192081451416, -0.043202877044677734, 0.009726166725158691, 0.06265521049499512, 0.11558425426483154, 0.16851329803466797, 0.2214423418045044, 0.2743713855743408, 0.32730042934417725, 0.38022947311401367, 0.4331585168838501, 0.4860875606536865, 0.539016604423523, 0.5919456481933594, 0.6448746919631958, 0.6978037357330322, 0.7507327795028687, 0.8036618232727051, 0.8565908670425415, 0.9095199108123779, 0.9624489545822144, 1.0153779983520508, 1.0683070421218872, 1.1212360858917236, 1.17416512966156, 1.2270941734313965, 1.280023217201233, 1.3329522609710693, 1.3858813047409058, 1.4388103485107422, 1.4917393922805786, 1.544668436050415, 1.5975974798202515, 1.650526523590088, 1.7034555673599243, 1.7563846111297607, 1.8093136548995972, 1.8622426986694336]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 10.0, 22.0, 26.0, 35.0, 37.0, 71.0, 113.0, 180.0, 268.0, 426.0, 663.0, 1009.0, 1680.0, 2860.0, 4783.0, 8412.0, 15122.0, 28238.0, 53580.0, 103487.0, 196989.0, 266994.0, 171798.0, 89652.0, 46017.0, 24477.0, 13384.0, 7520.0, 4223.0, 2459.0, 1473.0, 875.0, 619.0, 357.0, 237.0, 143.0, 113.0, 69.0, 30.0, 29.0, 16.0, 20.0, 13.0, 8.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.7880859375, -0.765167236328125, -0.74224853515625, -0.719329833984375, -0.6964111328125, -0.673492431640625, -0.65057373046875, -0.627655029296875, -0.604736328125, -0.581817626953125, -0.55889892578125, -0.535980224609375, -0.5130615234375, -0.490142822265625, -0.46722412109375, -0.444305419921875, -0.42138671875, -0.398468017578125, -0.37554931640625, -0.352630615234375, -0.3297119140625, -0.306793212890625, -0.28387451171875, -0.260955810546875, -0.238037109375, -0.215118408203125, -0.19219970703125, -0.169281005859375, -0.1463623046875, -0.123443603515625, -0.10052490234375, -0.077606201171875, -0.0546875, -0.031768798828125, -0.00885009765625, 0.014068603515625, 0.0369873046875, 0.059906005859375, 0.08282470703125, 0.105743408203125, 0.128662109375, 0.151580810546875, 0.17449951171875, 0.197418212890625, 0.2203369140625, 0.243255615234375, 0.26617431640625, 0.289093017578125, 0.31201171875, 0.334930419921875, 0.35784912109375, 0.380767822265625, 0.4036865234375, 0.426605224609375, 0.44952392578125, 0.472442626953125, 0.495361328125, 0.518280029296875, 0.54119873046875, 0.564117431640625, 0.5870361328125, 0.609954833984375, 0.63287353515625, 0.655792236328125, 0.6787109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 7.0, 7.0, 8.0, 12.0, 13.0, 18.0, 11.0, 18.0, 21.0, 28.0, 28.0, 27.0, 41.0, 32.0, 42.0, 45.0, 47.0, 49.0, 52.0, 43.0, 46.0, 42.0, 39.0, 44.0, 34.0, 31.0, 36.0, 25.0, 20.0, 21.0, 17.0, 10.0, 15.0, 11.0, 12.0, 9.0, 12.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.22235107421875, -1.1751708984375, -1.12799072265625, -1.080810546875, -1.03363037109375, -0.9864501953125, -0.93927001953125, -0.89208984375, -0.84490966796875, -0.7977294921875, -0.75054931640625, -0.703369140625, -0.65618896484375, -0.6090087890625, -0.56182861328125, -0.5146484375, -0.46746826171875, -0.4202880859375, -0.37310791015625, -0.325927734375, -0.27874755859375, -0.2315673828125, -0.18438720703125, -0.13720703125, -0.09002685546875, -0.0428466796875, 0.00433349609375, 0.051513671875, 0.09869384765625, 0.1458740234375, 0.19305419921875, 0.240234375, 0.28741455078125, 0.3345947265625, 0.38177490234375, 0.428955078125, 0.47613525390625, 0.5233154296875, 0.57049560546875, 0.61767578125, 0.66485595703125, 0.7120361328125, 0.75921630859375, 0.806396484375, 0.85357666015625, 0.9007568359375, 0.94793701171875, 0.9951171875, 1.04229736328125, 1.0894775390625, 1.13665771484375, 1.183837890625, 1.23101806640625, 1.2781982421875, 1.32537841796875, 1.37255859375, 1.41973876953125, 1.4669189453125, 1.51409912109375, 1.561279296875, 1.60845947265625, 1.6556396484375, 1.70281982421875, 1.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 15.0, 12.0, 17.0, 32.0, 33.0, 62.0, 74.0, 128.0, 193.0, 288.0, 464.0, 703.0, 1278.0, 2151.0, 4019.0, 7694.0, 15403.0, 32524.0, 70982.0, 159869.0, 294964.0, 242945.0, 115665.0, 51133.0, 23396.0, 11391.0, 5792.0, 3010.0, 1669.0, 999.0, 592.0, 360.0, 205.0, 139.0, 113.0, 68.0, 51.0, 37.0, 20.0, 20.0, 6.0, 7.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74365234375, -0.7202606201171875, -0.696868896484375, -0.6734771728515625, -0.65008544921875, -0.6266937255859375, -0.603302001953125, -0.5799102783203125, -0.5565185546875, -0.5331268310546875, -0.509735107421875, -0.4863433837890625, -0.46295166015625, -0.4395599365234375, -0.416168212890625, -0.3927764892578125, -0.369384765625, -0.3459930419921875, -0.322601318359375, -0.2992095947265625, -0.27581787109375, -0.2524261474609375, -0.229034423828125, -0.2056427001953125, -0.1822509765625, -0.1588592529296875, -0.135467529296875, -0.1120758056640625, -0.08868408203125, -0.0652923583984375, -0.041900634765625, -0.0185089111328125, 0.0048828125, 0.0282745361328125, 0.051666259765625, 0.0750579833984375, 0.09844970703125, 0.1218414306640625, 0.145233154296875, 0.1686248779296875, 0.1920166015625, 0.2154083251953125, 0.238800048828125, 0.2621917724609375, 0.28558349609375, 0.3089752197265625, 0.332366943359375, 0.3557586669921875, 0.379150390625, 0.4025421142578125, 0.425933837890625, 0.4493255615234375, 0.47271728515625, 0.4961090087890625, 0.519500732421875, 0.5428924560546875, 0.5662841796875, 0.5896759033203125, 0.613067626953125, 0.6364593505859375, 0.65985107421875, 0.6832427978515625, 0.706634521484375, 0.7300262451171875, 0.75341796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 5.0, 3.0, 8.0, 13.0, 12.0, 13.0, 17.0, 16.0, 25.0, 23.0, 26.0, 21.0, 35.0, 20.0, 32.0, 42.0, 37.0, 44.0, 38.0, 50.0, 53.0, 32.0, 44.0, 50.0, 40.0, 46.0, 26.0, 29.0, 39.0, 25.0, 28.0, 18.0, 28.0, 12.0, 9.0, 7.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.134765625, -3.03961181640625, -2.9444580078125, -2.84930419921875, -2.754150390625, -2.65899658203125, -2.5638427734375, -2.46868896484375, -2.37353515625, -2.27838134765625, -2.1832275390625, -2.08807373046875, -1.992919921875, -1.89776611328125, -1.8026123046875, -1.70745849609375, -1.6123046875, -1.51715087890625, -1.4219970703125, -1.32684326171875, -1.231689453125, -1.13653564453125, -1.0413818359375, -0.94622802734375, -0.85107421875, -0.75592041015625, -0.6607666015625, -0.56561279296875, -0.470458984375, -0.37530517578125, -0.2801513671875, -0.18499755859375, -0.08984375, 0.00531005859375, 0.1004638671875, 0.19561767578125, 0.290771484375, 0.38592529296875, 0.4810791015625, 0.57623291015625, 0.67138671875, 0.76654052734375, 0.8616943359375, 0.95684814453125, 1.052001953125, 1.14715576171875, 1.2423095703125, 1.33746337890625, 1.4326171875, 1.52777099609375, 1.6229248046875, 1.71807861328125, 1.813232421875, 1.90838623046875, 2.0035400390625, 2.09869384765625, 2.19384765625, 2.28900146484375, 2.3841552734375, 2.47930908203125, 2.574462890625, 2.66961669921875, 2.7647705078125, 2.85992431640625, 2.955078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 5.0, 10.0, 12.0, 20.0, 19.0, 37.0, 60.0, 79.0, 118.0, 192.0, 328.0, 528.0, 979.0, 2254.0, 7072.0, 46388.0, 671507.0, 289266.0, 21671.0, 4387.0, 1570.0, 845.0, 464.0, 247.0, 171.0, 92.0, 67.0, 56.0, 30.0, 23.0, 16.0, 12.0, 12.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6676483154296875, -0.647308349609375, -0.6269683837890625, -0.60662841796875, -0.5862884521484375, -0.565948486328125, -0.5456085205078125, -0.5252685546875, -0.5049285888671875, -0.484588623046875, -0.4642486572265625, -0.44390869140625, -0.4235687255859375, -0.403228759765625, -0.3828887939453125, -0.362548828125, -0.3422088623046875, -0.321868896484375, -0.3015289306640625, -0.28118896484375, -0.2608489990234375, -0.240509033203125, -0.2201690673828125, -0.1998291015625, -0.1794891357421875, -0.159149169921875, -0.1388092041015625, -0.11846923828125, -0.0981292724609375, -0.077789306640625, -0.0574493408203125, -0.037109375, -0.0167694091796875, 0.003570556640625, 0.0239105224609375, 0.04425048828125, 0.0645904541015625, 0.084930419921875, 0.1052703857421875, 0.1256103515625, 0.1459503173828125, 0.166290283203125, 0.1866302490234375, 0.20697021484375, 0.2273101806640625, 0.247650146484375, 0.2679901123046875, 0.288330078125, 0.3086700439453125, 0.329010009765625, 0.3493499755859375, 0.36968994140625, 0.3900299072265625, 0.410369873046875, 0.4307098388671875, 0.4510498046875, 0.4713897705078125, 0.491729736328125, 0.5120697021484375, 0.53240966796875, 0.5527496337890625, 0.573089599609375, 0.5934295654296875, 0.61376953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 4.0, 8.0, 7.0, 15.0, 29.0, 51.0, 65.0, 101.0, 154.0, 159.0, 144.0, 84.0, 55.0, 30.0, 31.0, 17.0, 20.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002949237823486328, -0.0002832375466823578, -0.00027155131101608276, -0.00025986507534980774, -0.0002481788396835327, -0.0002364926040172577, -0.00022480636835098267, -0.00021312013268470764, -0.00020143389701843262, -0.0001897476613521576, -0.00017806142568588257, -0.00016637519001960754, -0.00015468895435333252, -0.0001430027186870575, -0.00013131648302078247, -0.00011963024735450745, -0.00010794401168823242, -9.62577760219574e-05, -8.457154035568237e-05, -7.288530468940735e-05, -6.119906902313232e-05, -4.95128333568573e-05, -3.7826597690582275e-05, -2.614036202430725e-05, -1.4454126358032227e-05, -2.767890691757202e-06, 8.918344974517822e-06, 2.0604580640792847e-05, 3.229081630706787e-05, 4.3977051973342896e-05, 5.566328763961792e-05, 6.734952330589294e-05, 7.903575897216797e-05, 9.072199463844299e-05, 0.00010240823030471802, 0.00011409446597099304, 0.00012578070163726807, 0.0001374669373035431, 0.00014915317296981812, 0.00016083940863609314, 0.00017252564430236816, 0.0001842118799686432, 0.0001958981156349182, 0.00020758435130119324, 0.00021927058696746826, 0.00023095682263374329, 0.0002426430583000183, 0.00025432929396629333, 0.00026601552963256836, 0.0002777017652988434, 0.0002893880009651184, 0.00030107423663139343, 0.00031276047229766846, 0.0003244467079639435, 0.0003361329436302185, 0.00034781917929649353, 0.00035950541496276855, 0.0003711916506290436, 0.0003828778862953186, 0.00039456412196159363, 0.00040625035762786865, 0.0004179365932941437, 0.0004296228289604187, 0.0004413090646266937, 0.00045299530029296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 8.0, 20.0, 12.0, 25.0, 41.0, 45.0, 82.0, 87.0, 131.0, 202.0, 270.0, 389.0, 523.0, 879.0, 1340.0, 2273.0, 4957.0, 13336.0, 58022.0, 393063.0, 473034.0, 71771.0, 15891.0, 5460.0, 2486.0, 1394.0, 883.0, 589.0, 361.0, 280.0, 187.0, 138.0, 103.0, 65.0, 47.0, 34.0, 28.0, 24.0, 21.0, 10.0, 13.0, 6.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4151573181152344, -0.40087127685546875, -0.3865852355957031, -0.3722991943359375, -0.3580131530761719, -0.34372711181640625, -0.3294410705566406, -0.315155029296875, -0.3008689880371094, -0.28658294677734375, -0.2722969055175781, -0.2580108642578125, -0.24372482299804688, -0.22943878173828125, -0.21515274047851562, -0.20086669921875, -0.18658065795898438, -0.17229461669921875, -0.15800857543945312, -0.1437225341796875, -0.12943649291992188, -0.11515045166015625, -0.10086441040039062, -0.086578369140625, -0.07229232788085938, -0.05800628662109375, -0.043720245361328125, -0.0294342041015625, -0.015148162841796875, -0.00086212158203125, 0.013423919677734375, 0.0277099609375, 0.041996002197265625, 0.05628204345703125, 0.07056808471679688, 0.0848541259765625, 0.09914016723632812, 0.11342620849609375, 0.12771224975585938, 0.141998291015625, 0.15628433227539062, 0.17057037353515625, 0.18485641479492188, 0.1991424560546875, 0.21342849731445312, 0.22771453857421875, 0.24200057983398438, 0.25628662109375, 0.2705726623535156, 0.28485870361328125, 0.2991447448730469, 0.3134307861328125, 0.3277168273925781, 0.34200286865234375, 0.3562889099121094, 0.370574951171875, 0.3848609924316406, 0.39914703369140625, 0.4134330749511719, 0.4277191162109375, 0.4420051574707031, 0.45629119873046875, 0.4705772399902344, 0.48486328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 11.0, 14.0, 29.0, 40.0, 64.0, 93.0, 105.0, 133.0, 121.0, 117.0, 96.0, 67.0, 36.0, 19.0, 14.0, 10.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1915283203125, -0.18604087829589844, -0.18055343627929688, -0.1750659942626953, -0.16957855224609375, -0.1640911102294922, -0.15860366821289062, -0.15311622619628906, -0.1476287841796875, -0.14214134216308594, -0.13665390014648438, -0.1311664581298828, -0.12567901611328125, -0.12019157409667969, -0.11470413208007812, -0.10921669006347656, -0.103729248046875, -0.09824180603027344, -0.09275436401367188, -0.08726692199707031, -0.08177947998046875, -0.07629203796386719, -0.07080459594726562, -0.06531715393066406, -0.0598297119140625, -0.05434226989746094, -0.048854827880859375, -0.04336738586425781, -0.03787994384765625, -0.03239250183105469, -0.026905059814453125, -0.021417617797851562, -0.01593017578125, -0.010442733764648438, -0.004955291748046875, 0.0005321502685546875, 0.00601959228515625, 0.011507034301757812, 0.016994476318359375, 0.022481918334960938, 0.0279693603515625, 0.03345680236816406, 0.038944244384765625, 0.04443168640136719, 0.04991912841796875, 0.05540657043457031, 0.060894012451171875, 0.06638145446777344, 0.071868896484375, 0.07735633850097656, 0.08284378051757812, 0.08833122253417969, 0.09381866455078125, 0.09930610656738281, 0.10479354858398438, 0.11028099060058594, 0.1157684326171875, 0.12125587463378906, 0.12674331665039062, 0.1322307586669922, 0.13771820068359375, 0.1432056427001953, 0.14869308471679688, 0.15418052673339844, 0.15966796875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 9.0, 12.0, 18.0, 23.0, 25.0, 39.0, 47.0, 82.0, 85.0, 111.0, 99.0, 105.0, 79.0, 79.0, 49.0, 37.0, 28.0, 22.0, 10.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6781560182571411, -1.5998300313949585, -1.5215039253234863, -1.4431779384613037, -1.364851951599121, -1.2865259647369385, -1.2081998586654663, -1.1298738718032837, -1.0515477657318115, -0.9732217192649841, -0.8948957324028015, -0.8165696859359741, -0.7382436990737915, -0.6599176526069641, -0.5815916061401367, -0.5032656192779541, -0.4249396324157715, -0.3466136157512665, -0.2682875990867615, -0.18996155261993408, -0.11163553595542908, -0.03330951929092407, 0.04501652717590332, 0.12334251403808594, 0.20166856050491333, 0.27999457716941833, 0.35832059383392334, 0.43664664030075073, 0.5149726867675781, 0.5932986736297607, 0.6716247200965881, 0.7499507069587708, 0.8282766342163086, 0.906602680683136, 0.9849286675453186, 1.063254714012146, 1.1415807008743286, 1.2199068069458008, 1.2982327938079834, 1.376558780670166, 1.4548847675323486, 1.5332107543945312, 1.6115368604660034, 1.689862847328186, 1.7681888341903687, 1.8465149402618408, 1.9248409271240234, 2.003166913986206, 2.0814929008483887, 2.1598188877105713, 2.238144874572754, 2.3164710998535156, 2.3947970867156982, 2.473123073577881, 2.5514490604400635, 2.629775047302246, 2.708101272583008, 2.7864272594451904, 2.864753246307373, 2.9430794715881348, 3.0214054584503174, 3.0997314453125, 3.1780574321746826, 3.2563834190368652, 3.334709405899048]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 8.0, 2.0, 6.0, 9.0, 9.0, 10.0, 20.0, 23.0, 19.0, 16.0, 21.0, 22.0, 25.0, 38.0, 33.0, 41.0, 43.0, 40.0, 33.0, 44.0, 31.0, 40.0, 50.0, 41.0, 42.0, 32.0, 41.0, 27.0, 29.0, 37.0, 23.0, 18.0, 15.0, 18.0, 17.0, 16.0, 15.0, 7.0, 7.0, 3.0, 9.0, 5.0, 2.0, 4.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1356970071792603, -1.0936849117279053, -1.0516726970672607, -1.0096604824066162, -0.9676483869552612, -0.9256362318992615, -0.8836240768432617, -0.841611921787262, -0.7995997667312622, -0.7575876116752625, -0.7155754566192627, -0.6735633015632629, -0.6315511465072632, -0.5895389914512634, -0.5475268363952637, -0.5055146813392639, -0.46350252628326416, -0.4214903712272644, -0.37947821617126465, -0.3374660611152649, -0.29545390605926514, -0.2534417510032654, -0.21142959594726562, -0.16941744089126587, -0.1274052858352661, -0.08539313077926636, -0.0433809757232666, -0.0013688206672668457, 0.04064333438873291, 0.08265548944473267, 0.12466764450073242, 0.16667979955673218, 0.20869183540344238, 0.25070399045944214, 0.2927161455154419, 0.33472830057144165, 0.3767404556274414, 0.41875261068344116, 0.4607647657394409, 0.5027769207954407, 0.5447890758514404, 0.5868012309074402, 0.6288133859634399, 0.6708255410194397, 0.7128376960754395, 0.7548498511314392, 0.796862006187439, 0.8388741612434387, 0.8808863162994385, 0.9228984713554382, 0.964910626411438, 1.006922721862793, 1.0489349365234375, 1.090947151184082, 1.132959246635437, 1.174971342086792, 1.2169835567474365, 1.258995771408081, 1.301007866859436, 1.343019962310791, 1.3850321769714355, 1.42704439163208, 1.469056487083435, 1.51106858253479, 1.5530807971954346]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 9.0, 7.0, 12.0, 12.0, 12.0, 21.0, 14.0, 29.0, 37.0, 41.0, 63.0, 79.0, 74.0, 115.0, 133.0, 187.0, 246.0, 331.0, 412.0, 605.0, 815.0, 1139.0, 1732.0, 2703.0, 4822.0, 10274.0, 32918.0, 194597.0, 638040.0, 115614.0, 23175.0, 8167.0, 4069.0, 2487.0, 1547.0, 1037.0, 741.0, 529.0, 407.0, 278.0, 213.0, 170.0, 137.0, 121.0, 87.0, 73.0, 51.0, 43.0, 30.0, 23.0, 19.0, 17.0, 7.0, 13.0, 10.0, 6.0, 5.0, 2.0, 4.0, 4.0, 1.0], "bins": [-0.9267578125, -0.897216796875, -0.86767578125, -0.838134765625, -0.80859375, -0.779052734375, -0.74951171875, -0.719970703125, -0.6904296875, -0.660888671875, -0.63134765625, -0.601806640625, -0.572265625, -0.542724609375, -0.51318359375, -0.483642578125, -0.4541015625, -0.424560546875, -0.39501953125, -0.365478515625, -0.3359375, -0.306396484375, -0.27685546875, -0.247314453125, -0.2177734375, -0.188232421875, -0.15869140625, -0.129150390625, -0.099609375, -0.070068359375, -0.04052734375, -0.010986328125, 0.0185546875, 0.048095703125, 0.07763671875, 0.107177734375, 0.13671875, 0.166259765625, 0.19580078125, 0.225341796875, 0.2548828125, 0.284423828125, 0.31396484375, 0.343505859375, 0.373046875, 0.402587890625, 0.43212890625, 0.461669921875, 0.4912109375, 0.520751953125, 0.55029296875, 0.579833984375, 0.609375, 0.638916015625, 0.66845703125, 0.697998046875, 0.7275390625, 0.757080078125, 0.78662109375, 0.816162109375, 0.845703125, 0.875244140625, 0.90478515625, 0.934326171875, 0.9638671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 4.0, 9.0, 13.0, 14.0, 14.0, 11.0, 17.0, 28.0, 17.0, 21.0, 33.0, 36.0, 33.0, 30.0, 43.0, 43.0, 33.0, 29.0, 64.0, 28.0, 42.0, 41.0, 27.0, 45.0, 35.0, 35.0, 17.0, 30.0, 26.0, 21.0, 29.0, 14.0, 7.0, 12.0, 17.0, 13.0, 13.0, 6.0, 8.0, 5.0, 6.0, 7.0, 1.0, 2.0, 5.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.109375, -2.039581298828125, -1.96978759765625, -1.899993896484375, -1.8302001953125, -1.760406494140625, -1.69061279296875, -1.620819091796875, -1.551025390625, -1.481231689453125, -1.41143798828125, -1.341644287109375, -1.2718505859375, -1.202056884765625, -1.13226318359375, -1.062469482421875, -0.99267578125, -0.922882080078125, -0.85308837890625, -0.783294677734375, -0.7135009765625, -0.643707275390625, -0.57391357421875, -0.504119873046875, -0.434326171875, -0.364532470703125, -0.29473876953125, -0.224945068359375, -0.1551513671875, -0.085357666015625, -0.01556396484375, 0.054229736328125, 0.1240234375, 0.193817138671875, 0.26361083984375, 0.333404541015625, 0.4031982421875, 0.472991943359375, 0.54278564453125, 0.612579345703125, 0.682373046875, 0.752166748046875, 0.82196044921875, 0.891754150390625, 0.9615478515625, 1.031341552734375, 1.10113525390625, 1.170928955078125, 1.24072265625, 1.310516357421875, 1.38031005859375, 1.450103759765625, 1.5198974609375, 1.589691162109375, 1.65948486328125, 1.729278564453125, 1.799072265625, 1.868865966796875, 1.93865966796875, 2.008453369140625, 2.0782470703125, 2.148040771484375, 2.21783447265625, 2.287628173828125, 2.357421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 14.0, 20.0, 28.0, 24.0, 41.0, 44.0, 80.0, 120.0, 172.0, 227.0, 385.0, 746.0, 1181.0, 2309.0, 5624.0, 18106.0, 192172.0, 766301.0, 44250.0, 9232.0, 3542.0, 1632.0, 865.0, 491.0, 294.0, 176.0, 121.0, 82.0, 59.0, 54.0, 31.0, 21.0, 18.0, 14.0, 12.0, 12.0, 8.0, 8.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0], "bins": [-1.970703125, -1.91778564453125, -1.8648681640625, -1.81195068359375, -1.759033203125, -1.70611572265625, -1.6531982421875, -1.60028076171875, -1.54736328125, -1.49444580078125, -1.4415283203125, -1.38861083984375, -1.335693359375, -1.28277587890625, -1.2298583984375, -1.17694091796875, -1.1240234375, -1.07110595703125, -1.0181884765625, -0.96527099609375, -0.912353515625, -0.85943603515625, -0.8065185546875, -0.75360107421875, -0.70068359375, -0.64776611328125, -0.5948486328125, -0.54193115234375, -0.489013671875, -0.43609619140625, -0.3831787109375, -0.33026123046875, -0.27734375, -0.22442626953125, -0.1715087890625, -0.11859130859375, -0.065673828125, -0.01275634765625, 0.0401611328125, 0.09307861328125, 0.14599609375, 0.19891357421875, 0.2518310546875, 0.30474853515625, 0.357666015625, 0.41058349609375, 0.4635009765625, 0.51641845703125, 0.5693359375, 0.62225341796875, 0.6751708984375, 0.72808837890625, 0.781005859375, 0.83392333984375, 0.8868408203125, 0.93975830078125, 0.99267578125, 1.04559326171875, 1.0985107421875, 1.15142822265625, 1.204345703125, 1.25726318359375, 1.3101806640625, 1.36309814453125, 1.416015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 7.0, 5.0, 11.0, 19.0, 19.0, 11.0, 23.0, 25.0, 31.0, 18.0, 41.0, 36.0, 32.0, 51.0, 42.0, 40.0, 49.0, 51.0, 60.0, 47.0, 58.0, 34.0, 42.0, 45.0, 26.0, 22.0, 20.0, 28.0, 20.0, 17.0, 8.0, 6.0, 9.0, 9.0, 5.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0], "bins": [-3.32421875, -3.2357177734375, -3.147216796875, -3.0587158203125, -2.97021484375, -2.8817138671875, -2.793212890625, -2.7047119140625, -2.6162109375, -2.5277099609375, -2.439208984375, -2.3507080078125, -2.26220703125, -2.1737060546875, -2.085205078125, -1.9967041015625, -1.908203125, -1.8197021484375, -1.731201171875, -1.6427001953125, -1.55419921875, -1.4656982421875, -1.377197265625, -1.2886962890625, -1.2001953125, -1.1116943359375, -1.023193359375, -0.9346923828125, -0.84619140625, -0.7576904296875, -0.669189453125, -0.5806884765625, -0.4921875, -0.4036865234375, -0.315185546875, -0.2266845703125, -0.13818359375, -0.0496826171875, 0.038818359375, 0.1273193359375, 0.2158203125, 0.3043212890625, 0.392822265625, 0.4813232421875, 0.56982421875, 0.6583251953125, 0.746826171875, 0.8353271484375, 0.923828125, 1.0123291015625, 1.100830078125, 1.1893310546875, 1.27783203125, 1.3663330078125, 1.454833984375, 1.5433349609375, 1.6318359375, 1.7203369140625, 1.808837890625, 1.8973388671875, 1.98583984375, 2.0743408203125, 2.162841796875, 2.2513427734375, 2.33984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 2.0, 10.0, 7.0, 20.0, 16.0, 18.0, 23.0, 34.0, 47.0, 60.0, 107.0, 168.0, 249.0, 436.0, 743.0, 1417.0, 2806.0, 6814.0, 21629.0, 257636.0, 712861.0, 28339.0, 8145.0, 3216.0, 1635.0, 811.0, 473.0, 272.0, 145.0, 129.0, 85.0, 60.0, 38.0, 30.0, 12.0, 17.0, 13.0, 11.0, 6.0, 3.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61083984375, -0.5911941528320312, -0.5715484619140625, -0.5519027709960938, -0.532257080078125, -0.5126113891601562, -0.4929656982421875, -0.47332000732421875, -0.45367431640625, -0.43402862548828125, -0.4143829345703125, -0.39473724365234375, -0.375091552734375, -0.35544586181640625, -0.3358001708984375, -0.31615447998046875, -0.2965087890625, -0.27686309814453125, -0.2572174072265625, -0.23757171630859375, -0.217926025390625, -0.19828033447265625, -0.1786346435546875, -0.15898895263671875, -0.13934326171875, -0.11969757080078125, -0.1000518798828125, -0.08040618896484375, -0.060760498046875, -0.04111480712890625, -0.0214691162109375, -0.00182342529296875, 0.017822265625, 0.03746795654296875, 0.0571136474609375, 0.07675933837890625, 0.096405029296875, 0.11605072021484375, 0.1356964111328125, 0.15534210205078125, 0.17498779296875, 0.19463348388671875, 0.2142791748046875, 0.23392486572265625, 0.253570556640625, 0.27321624755859375, 0.2928619384765625, 0.31250762939453125, 0.3321533203125, 0.35179901123046875, 0.3714447021484375, 0.39109039306640625, 0.410736083984375, 0.43038177490234375, 0.4500274658203125, 0.46967315673828125, 0.48931884765625, 0.5089645385742188, 0.5286102294921875, 0.5482559204101562, 0.567901611328125, 0.5875473022460938, 0.6071929931640625, 0.6268386840820312, 0.646484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 7.0, 4.0, 5.0, 11.0, 30.0, 62.0, 150.0, 432.0, 173.0, 58.0, 24.0, 12.0, 12.0, 9.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010144710540771484, -9.760819375514984e-05, -9.376928210258484e-05, -8.993037045001984e-05, -8.609145879745483e-05, -8.225254714488983e-05, -7.841363549232483e-05, -7.457472383975983e-05, -7.073581218719482e-05, -6.689690053462982e-05, -6.305798888206482e-05, -5.921907722949982e-05, -5.5380165576934814e-05, -5.154125392436981e-05, -4.770234227180481e-05, -4.386343061923981e-05, -4.0024518966674805e-05, -3.61856073141098e-05, -3.23466956615448e-05, -2.8507784008979797e-05, -2.4668872356414795e-05, -2.0829960703849792e-05, -1.699104905128479e-05, -1.3152137398719788e-05, -9.313225746154785e-06, -5.474314093589783e-06, -1.6354024410247803e-06, 2.203509211540222e-06, 6.042420864105225e-06, 9.881332516670227e-06, 1.372024416923523e-05, 1.7559155821800232e-05, 2.1398067474365234e-05, 2.5236979126930237e-05, 2.907589077949524e-05, 3.291480243206024e-05, 3.6753714084625244e-05, 4.0592625737190247e-05, 4.443153738975525e-05, 4.827044904232025e-05, 5.2109360694885254e-05, 5.5948272347450256e-05, 5.978718400001526e-05, 6.362609565258026e-05, 6.746500730514526e-05, 7.130391895771027e-05, 7.514283061027527e-05, 7.898174226284027e-05, 8.282065391540527e-05, 8.665956556797028e-05, 9.049847722053528e-05, 9.433738887310028e-05, 9.817630052566528e-05, 0.00010201521217823029, 0.00010585412383079529, 0.00010969303548336029, 0.00011353194713592529, 0.0001173708587884903, 0.0001212097704410553, 0.0001250486820936203, 0.0001288875937461853, 0.0001327265053987503, 0.0001365654170513153, 0.0001404043287038803, 0.0001442432403564453]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 10.0, 18.0, 21.0, 34.0, 30.0, 52.0, 71.0, 97.0, 150.0, 190.0, 280.0, 423.0, 567.0, 900.0, 1446.0, 2336.0, 4073.0, 7740.0, 18268.0, 63796.0, 678086.0, 208717.0, 34651.0, 12176.0, 5734.0, 3120.0, 1909.0, 1187.0, 754.0, 503.0, 384.0, 238.0, 158.0, 118.0, 86.0, 55.0, 40.0, 35.0, 28.0, 16.0, 7.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.277099609375, -0.2674713134765625, -0.257843017578125, -0.2482147216796875, -0.23858642578125, -0.2289581298828125, -0.219329833984375, -0.2097015380859375, -0.2000732421875, -0.1904449462890625, -0.180816650390625, -0.1711883544921875, -0.16156005859375, -0.1519317626953125, -0.142303466796875, -0.1326751708984375, -0.123046875, -0.1134185791015625, -0.103790283203125, -0.0941619873046875, -0.08453369140625, -0.0749053955078125, -0.065277099609375, -0.0556488037109375, -0.0460205078125, -0.0363922119140625, -0.026763916015625, -0.0171356201171875, -0.00750732421875, 0.0021209716796875, 0.011749267578125, 0.0213775634765625, 0.031005859375, 0.0406341552734375, 0.050262451171875, 0.0598907470703125, 0.06951904296875, 0.0791473388671875, 0.088775634765625, 0.0984039306640625, 0.1080322265625, 0.1176605224609375, 0.127288818359375, 0.1369171142578125, 0.14654541015625, 0.1561737060546875, 0.165802001953125, 0.1754302978515625, 0.18505859375, 0.1946868896484375, 0.204315185546875, 0.2139434814453125, 0.22357177734375, 0.2332000732421875, 0.242828369140625, 0.2524566650390625, 0.2620849609375, 0.2717132568359375, 0.281341552734375, 0.2909698486328125, 0.30059814453125, 0.3102264404296875, 0.319854736328125, 0.3294830322265625, 0.339111328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 12.0, 14.0, 5.0, 12.0, 16.0, 27.0, 39.0, 54.0, 89.0, 208.0, 208.0, 93.0, 48.0, 42.0, 31.0, 23.0, 17.0, 11.0, 5.0, 2.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.177001953125, -0.1718006134033203, -0.16659927368164062, -0.16139793395996094, -0.15619659423828125, -0.15099525451660156, -0.14579391479492188, -0.1405925750732422, -0.1353912353515625, -0.1301898956298828, -0.12498855590820312, -0.11978721618652344, -0.11458587646484375, -0.10938453674316406, -0.10418319702148438, -0.09898185729980469, -0.093780517578125, -0.08857917785644531, -0.08337783813476562, -0.07817649841308594, -0.07297515869140625, -0.06777381896972656, -0.06257247924804688, -0.05737113952636719, -0.0521697998046875, -0.04696846008300781, -0.041767120361328125, -0.03656578063964844, -0.03136444091796875, -0.026163101196289062, -0.020961761474609375, -0.015760421752929688, -0.01055908203125, -0.0053577423095703125, -0.000156402587890625, 0.0050449371337890625, 0.01024627685546875, 0.015447616577148438, 0.020648956298828125, 0.025850296020507812, 0.0310516357421875, 0.03625297546386719, 0.041454315185546875, 0.04665565490722656, 0.05185699462890625, 0.05705833435058594, 0.062259674072265625, 0.06746101379394531, 0.072662353515625, 0.07786369323730469, 0.08306503295898438, 0.08826637268066406, 0.09346771240234375, 0.09866905212402344, 0.10387039184570312, 0.10907173156738281, 0.1142730712890625, 0.11947441101074219, 0.12467575073242188, 0.12987709045410156, 0.13507843017578125, 0.14027976989746094, 0.14548110961914062, 0.1506824493408203, 0.1558837890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 13.0, 20.0, 53.0, 128.0, 218.0, 246.0, 175.0, 88.0, 34.0, 22.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15004825592041, -14.848811149597168, -14.547574043273926, -14.246337890625, -13.945100784301758, -13.643863677978516, -13.342626571655273, -13.041389465332031, -12.740152359008789, -12.438915252685547, -12.137678146362305, -11.836441993713379, -11.535204887390137, -11.233967781066895, -10.932730674743652, -10.63149356842041, -10.330257415771484, -10.029020309448242, -9.727783203125, -9.426547050476074, -9.125309944152832, -8.82407283782959, -8.522835731506348, -8.221598625183105, -7.9203619956970215, -7.619124889373779, -7.317888259887695, -7.016651153564453, -6.715414047241211, -6.414177417755127, -6.112940311431885, -5.811703681945801, -5.510465621948242, -5.209228515625, -4.907991886138916, -4.606754779815674, -4.30551815032959, -4.004281044006348, -3.7030439376831055, -3.4018070697784424, -3.1005702018737793, -2.799333333969116, -2.498096466064453, -2.196859359741211, -1.8956224918365479, -1.5943856239318848, -1.2931486368179321, -0.9919116497039795, -0.6906747817993164, -0.38943785429000854, -0.08820092678070068, 0.21303600072860718, 0.514272928237915, 0.8155097961425781, 1.1167467832565308, 1.4179837703704834, 1.7192206382751465, 2.0204575061798096, 2.3216943740844727, 2.622931480407715, 2.924168348312378, 3.225405216217041, 3.526642322540283, 3.8278791904449463, 4.129116058349609]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 6.0, 7.0, 7.0, 11.0, 14.0, 6.0, 21.0, 12.0, 16.0, 16.0, 15.0, 17.0, 21.0, 23.0, 45.0, 33.0, 31.0, 18.0, 34.0, 39.0, 40.0, 28.0, 38.0, 37.0, 35.0, 40.0, 31.0, 32.0, 29.0, 31.0, 25.0, 26.0, 28.0, 23.0, 25.0, 18.0, 18.0, 15.0, 16.0, 11.0, 11.0, 6.0, 8.0, 5.0, 5.0, 5.0, 2.0, 8.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2388625144958496, -3.131962776184082, -3.0250630378723145, -2.918163299560547, -2.8112635612487793, -2.7043638229370117, -2.597464084625244, -2.4905643463134766, -2.383664608001709, -2.2767648696899414, -2.169865131378174, -2.0629653930664062, -1.9560656547546387, -1.849165916442871, -1.7422661781311035, -1.635366439819336, -1.528466820716858, -1.4215670824050903, -1.3146673440933228, -1.2077676057815552, -1.1008678674697876, -0.9939681887626648, -0.8870684504508972, -0.7801687121391296, -0.6732689738273621, -0.5663692355155945, -0.4594694972038269, -0.3525697886943817, -0.24567005038261414, -0.13877034187316895, -0.03187060356140137, 0.07502913475036621, 0.1819288730621338, 0.28882861137390137, 0.39572834968566895, 0.5026280879974365, 0.6095278263092041, 0.7164275050163269, 0.8233272433280945, 0.9302269816398621, 1.0371267795562744, 1.144026517868042, 1.2509262561798096, 1.3578259944915771, 1.4647257328033447, 1.5716254711151123, 1.6785252094268799, 1.7854249477386475, 1.8923245668411255, 1.999224305152893, 2.106123924255371, 2.2130236625671387, 2.3199234008789062, 2.426823139190674, 2.5337228775024414, 2.640622615814209, 2.7475223541259766, 2.854422092437744, 2.9613218307495117, 3.0682215690612793, 3.175121307373047, 3.2820210456848145, 3.388920783996582, 3.4958205223083496, 3.602720260620117]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 9.0, 17.0, 20.0, 22.0, 28.0, 53.0, 61.0, 99.0, 109.0, 184.0, 257.0, 379.0, 490.0, 685.0, 1033.0, 1567.0, 2376.0, 3968.0, 7701.0, 18670.0, 77515.0, 365979.0, 1572293.0, 1650992.0, 379059.0, 74278.0, 17639.0, 7720.0, 3871.0, 2409.0, 1573.0, 943.0, 673.0, 471.0, 380.0, 221.0, 165.0, 111.0, 86.0, 51.0, 45.0, 32.0, 18.0, 10.0, 12.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.26953125, -2.200775146484375, -2.13201904296875, -2.063262939453125, -1.9945068359375, -1.925750732421875, -1.85699462890625, -1.788238525390625, -1.719482421875, -1.650726318359375, -1.58197021484375, -1.513214111328125, -1.4444580078125, -1.375701904296875, -1.30694580078125, -1.238189697265625, -1.16943359375, -1.100677490234375, -1.03192138671875, -0.963165283203125, -0.8944091796875, -0.825653076171875, -0.75689697265625, -0.688140869140625, -0.619384765625, -0.550628662109375, -0.48187255859375, -0.413116455078125, -0.3443603515625, -0.275604248046875, -0.20684814453125, -0.138092041015625, -0.0693359375, -0.000579833984375, 0.06817626953125, 0.136932373046875, 0.2056884765625, 0.274444580078125, 0.34320068359375, 0.411956787109375, 0.480712890625, 0.549468994140625, 0.61822509765625, 0.686981201171875, 0.7557373046875, 0.824493408203125, 0.89324951171875, 0.962005615234375, 1.03076171875, 1.099517822265625, 1.16827392578125, 1.237030029296875, 1.3057861328125, 1.374542236328125, 1.44329833984375, 1.512054443359375, 1.580810546875, 1.649566650390625, 1.71832275390625, 1.787078857421875, 1.8558349609375, 1.924591064453125, 1.99334716796875, 2.062103271484375, 2.130859375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 10.0, 5.0, 9.0, 11.0, 12.0, 15.0, 24.0, 24.0, 25.0, 23.0, 31.0, 37.0, 47.0, 30.0, 43.0, 45.0, 42.0, 46.0, 45.0, 52.0, 44.0, 52.0, 32.0, 35.0, 41.0, 30.0, 22.0, 28.0, 20.0, 19.0, 14.0, 15.0, 10.0, 11.0, 4.0, 7.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.3264617919921875, -1.275970458984375, -1.2254791259765625, -1.17498779296875, -1.1244964599609375, -1.074005126953125, -1.0235137939453125, -0.9730224609375, -0.9225311279296875, -0.872039794921875, -0.8215484619140625, -0.77105712890625, -0.7205657958984375, -0.670074462890625, -0.6195831298828125, -0.569091796875, -0.5186004638671875, -0.468109130859375, -0.4176177978515625, -0.36712646484375, -0.3166351318359375, -0.266143798828125, -0.2156524658203125, -0.1651611328125, -0.1146697998046875, -0.064178466796875, -0.0136871337890625, 0.03680419921875, 0.0872955322265625, 0.137786865234375, 0.1882781982421875, 0.23876953125, 0.2892608642578125, 0.339752197265625, 0.3902435302734375, 0.44073486328125, 0.4912261962890625, 0.541717529296875, 0.5922088623046875, 0.6427001953125, 0.6931915283203125, 0.743682861328125, 0.7941741943359375, 0.84466552734375, 0.8951568603515625, 0.945648193359375, 0.9961395263671875, 1.046630859375, 1.0971221923828125, 1.147613525390625, 1.1981048583984375, 1.24859619140625, 1.2990875244140625, 1.349578857421875, 1.4000701904296875, 1.4505615234375, 1.5010528564453125, 1.551544189453125, 1.6020355224609375, 1.65252685546875, 1.7030181884765625, 1.753509521484375, 1.8040008544921875, 1.8544921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 19.0, 18.0, 34.0, 68.0, 140.0, 559.0, 3888.0, 77587.0, 4071939.0, 36889.0, 2454.0, 433.0, 105.0, 53.0, 24.0, 13.0, 13.0, 3.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.75439453125, -8.4228515625, -8.09130859375, -7.759765625, -7.42822265625, -7.0966796875, -6.76513671875, -6.43359375, -6.10205078125, -5.7705078125, -5.43896484375, -5.107421875, -4.77587890625, -4.4443359375, -4.11279296875, -3.78125, -3.44970703125, -3.1181640625, -2.78662109375, -2.455078125, -2.12353515625, -1.7919921875, -1.46044921875, -1.12890625, -0.79736328125, -0.4658203125, -0.13427734375, 0.197265625, 0.52880859375, 0.8603515625, 1.19189453125, 1.5234375, 1.85498046875, 2.1865234375, 2.51806640625, 2.849609375, 3.18115234375, 3.5126953125, 3.84423828125, 4.17578125, 4.50732421875, 4.8388671875, 5.17041015625, 5.501953125, 5.83349609375, 6.1650390625, 6.49658203125, 6.828125, 7.15966796875, 7.4912109375, 7.82275390625, 8.154296875, 8.48583984375, 8.8173828125, 9.14892578125, 9.48046875, 9.81201171875, 10.1435546875, 10.47509765625, 10.806640625, 11.13818359375, 11.4697265625, 11.80126953125, 12.1328125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 1.0, 4.0, 8.0, 15.0, 9.0, 16.0, 15.0, 22.0, 30.0, 44.0, 66.0, 107.0, 158.0, 278.0, 438.0, 676.0, 780.0, 525.0, 297.0, 169.0, 100.0, 78.0, 54.0, 40.0, 26.0, 14.0, 18.0, 14.0, 11.0, 13.0, 8.0, 4.0, 5.0, 5.0, 0.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.95556640625, -0.9275436401367188, -0.8995208740234375, -0.8714981079101562, -0.843475341796875, -0.8154525756835938, -0.7874298095703125, -0.7594070434570312, -0.73138427734375, -0.7033615112304688, -0.6753387451171875, -0.6473159790039062, -0.619293212890625, -0.5912704467773438, -0.5632476806640625, -0.5352249145507812, -0.5072021484375, -0.47917938232421875, -0.4511566162109375, -0.42313385009765625, -0.395111083984375, -0.36708831787109375, -0.3390655517578125, -0.31104278564453125, -0.28302001953125, -0.25499725341796875, -0.2269744873046875, -0.19895172119140625, -0.170928955078125, -0.14290618896484375, -0.1148834228515625, -0.08686065673828125, -0.058837890625, -0.03081512451171875, -0.0027923583984375, 0.02523040771484375, 0.053253173828125, 0.08127593994140625, 0.1092987060546875, 0.13732147216796875, 0.16534423828125, 0.19336700439453125, 0.2213897705078125, 0.24941253662109375, 0.277435302734375, 0.30545806884765625, 0.3334808349609375, 0.36150360107421875, 0.3895263671875, 0.41754913330078125, 0.4455718994140625, 0.47359466552734375, 0.501617431640625, 0.5296401977539062, 0.5576629638671875, 0.5856857299804688, 0.61370849609375, 0.6417312622070312, 0.6697540283203125, 0.6977767944335938, 0.725799560546875, 0.7538223266601562, 0.7818450927734375, 0.8098678588867188, 0.837890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 6.0, 13.0, 13.0, 12.0, 21.0, 27.0, 39.0, 48.0, 53.0, 68.0, 81.0, 100.0, 96.0, 92.0, 64.0, 65.0, 53.0, 45.0, 27.0, 15.0, 12.0, 13.0, 7.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.3531672954559326, -3.265151262283325, -3.1771352291107178, -3.0891191959381104, -3.001103162765503, -2.9130871295928955, -2.825071096420288, -2.7370550632476807, -2.6490390300750732, -2.561022996902466, -2.4730069637298584, -2.384990930557251, -2.2969748973846436, -2.208958864212036, -2.1209428310394287, -2.0329267978668213, -1.9449107646942139, -1.8568947315216064, -1.768878698348999, -1.6808626651763916, -1.5928466320037842, -1.5048305988311768, -1.4168145656585693, -1.328798532485962, -1.2407824993133545, -1.152766466140747, -1.0647504329681396, -0.9767343997955322, -0.8887183666229248, -0.8007023334503174, -0.71268630027771, -0.6246702671051025, -0.5366544723510742, -0.4486384391784668, -0.3606224060058594, -0.27260637283325195, -0.18459033966064453, -0.09657430648803711, -0.008558273315429688, 0.07945775985717773, 0.16747379302978516, 0.2554898262023926, 0.343505859375, 0.4315218925476074, 0.5195379257202148, 0.6075539588928223, 0.6955699920654297, 0.7835860252380371, 0.8716020584106445, 0.959618091583252, 1.0476341247558594, 1.1356501579284668, 1.2236661911010742, 1.3116822242736816, 1.399698257446289, 1.4877142906188965, 1.575730323791504, 1.6637463569641113, 1.7517623901367188, 1.8397784233093262, 1.9277944564819336, 2.015810489654541, 2.1038265228271484, 2.191842555999756, 2.2798585891723633]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 7.0, 10.0, 8.0, 13.0, 15.0, 13.0, 9.0, 31.0, 21.0, 30.0, 24.0, 27.0, 28.0, 35.0, 26.0, 44.0, 37.0, 46.0, 52.0, 52.0, 33.0, 37.0, 30.0, 37.0, 32.0, 36.0, 28.0, 29.0, 23.0, 20.0, 22.0, 19.0, 22.0, 18.0, 9.0, 11.0, 10.0, 11.0, 6.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6309282779693604, -1.5800631046295166, -1.5291980504989624, -1.4783328771591187, -1.427467703819275, -1.3766026496887207, -1.325737476348877, -1.2748723030090332, -1.2240071296691895, -1.1731419563293457, -1.1222769021987915, -1.0714117288589478, -1.020546555519104, -0.969681441783905, -0.918816328048706, -0.8679511547088623, -0.8170861005783081, -0.7662209868431091, -0.7153558135032654, -0.6644906997680664, -0.6136255264282227, -0.5627604126930237, -0.5118952989578247, -0.46103015542030334, -0.410165011882782, -0.3592998683452606, -0.30843472480773926, -0.2575696110725403, -0.20670446753501892, -0.15583932399749756, -0.10497421026229858, -0.05410906672477722, -0.0032439231872558594, 0.047621212899684906, 0.09848634898662567, 0.14935147762298584, 0.2002166211605072, 0.25108176469802856, 0.30194687843322754, 0.3528120219707489, 0.40367716550827026, 0.4545423090457916, 0.505407452583313, 0.556272566318512, 0.6071376800537109, 0.6580028533935547, 0.7088679671287537, 0.7597330808639526, 0.8105982542037964, 0.8614633679389954, 0.9123285412788391, 0.9631936550140381, 1.0140588283538818, 1.0649240016937256, 1.1157890558242798, 1.1666542291641235, 1.2175192832946777, 1.2683844566345215, 1.3192495107650757, 1.3701146841049194, 1.4209798574447632, 1.4718449115753174, 1.5227100849151611, 1.5735752582550049, 1.6244404315948486]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 1.0, 2.0, 4.0, 4.0, 10.0, 6.0, 6.0, 16.0, 21.0, 29.0, 47.0, 57.0, 102.0, 148.0, 260.0, 391.0, 731.0, 1298.0, 2450.0, 4667.0, 9765.0, 23312.0, 62615.0, 192445.0, 437548.0, 202468.0, 65311.0, 24020.0, 10292.0, 4967.0, 2473.0, 1321.0, 691.0, 394.0, 259.0, 128.0, 99.0, 57.0, 47.0, 25.0, 25.0, 12.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71240234375, -0.6865158081054688, -0.6606292724609375, -0.6347427368164062, -0.608856201171875, -0.5829696655273438, -0.5570831298828125, -0.5311965942382812, -0.50531005859375, -0.47942352294921875, -0.4535369873046875, -0.42765045166015625, -0.401763916015625, -0.37587738037109375, -0.3499908447265625, -0.32410430908203125, -0.2982177734375, -0.27233123779296875, -0.2464447021484375, -0.22055816650390625, -0.194671630859375, -0.16878509521484375, -0.1428985595703125, -0.11701202392578125, -0.09112548828125, -0.06523895263671875, -0.0393524169921875, -0.01346588134765625, 0.012420654296875, 0.03830718994140625, 0.0641937255859375, 0.09008026123046875, 0.115966796875, 0.14185333251953125, 0.1677398681640625, 0.19362640380859375, 0.219512939453125, 0.24539947509765625, 0.2712860107421875, 0.29717254638671875, 0.32305908203125, 0.34894561767578125, 0.3748321533203125, 0.40071868896484375, 0.426605224609375, 0.45249176025390625, 0.4783782958984375, 0.5042648315429688, 0.5301513671875, 0.5560379028320312, 0.5819244384765625, 0.6078109741210938, 0.633697509765625, 0.6595840454101562, 0.6854705810546875, 0.7113571166992188, 0.73724365234375, 0.7631301879882812, 0.7890167236328125, 0.8149032592773438, 0.840789794921875, 0.8666763305664062, 0.8925628662109375, 0.9184494018554688, 0.9443359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 5.0, 4.0, 7.0, 7.0, 9.0, 9.0, 10.0, 13.0, 15.0, 15.0, 13.0, 20.0, 24.0, 33.0, 27.0, 35.0, 33.0, 33.0, 33.0, 39.0, 56.0, 33.0, 54.0, 40.0, 35.0, 37.0, 36.0, 40.0, 36.0, 25.0, 21.0, 25.0, 25.0, 21.0, 17.0, 13.0, 16.0, 10.0, 9.0, 8.0, 9.0, 13.0, 8.0, 6.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.987030029296875, -0.95355224609375, -0.920074462890625, -0.8865966796875, -0.853118896484375, -0.81964111328125, -0.786163330078125, -0.752685546875, -0.719207763671875, -0.68572998046875, -0.652252197265625, -0.6187744140625, -0.585296630859375, -0.55181884765625, -0.518341064453125, -0.48486328125, -0.451385498046875, -0.41790771484375, -0.384429931640625, -0.3509521484375, -0.317474365234375, -0.28399658203125, -0.250518798828125, -0.217041015625, -0.183563232421875, -0.15008544921875, -0.116607666015625, -0.0831298828125, -0.049652099609375, -0.01617431640625, 0.017303466796875, 0.05078125, 0.084259033203125, 0.11773681640625, 0.151214599609375, 0.1846923828125, 0.218170166015625, 0.25164794921875, 0.285125732421875, 0.318603515625, 0.352081298828125, 0.38555908203125, 0.419036865234375, 0.4525146484375, 0.485992431640625, 0.51947021484375, 0.552947998046875, 0.58642578125, 0.619903564453125, 0.65338134765625, 0.686859130859375, 0.7203369140625, 0.753814697265625, 0.78729248046875, 0.820770263671875, 0.854248046875, 0.887725830078125, 0.92120361328125, 0.954681396484375, 0.9881591796875, 1.021636962890625, 1.05511474609375, 1.088592529296875, 1.1220703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 9.0, 12.0, 16.0, 13.0, 36.0, 38.0, 56.0, 85.0, 112.0, 184.0, 260.0, 396.0, 619.0, 1041.0, 1696.0, 3090.0, 5835.0, 12091.0, 27618.0, 69376.0, 187429.0, 372622.0, 222937.0, 82407.0, 31916.0, 13686.0, 6662.0, 3343.0, 1838.0, 1173.0, 668.0, 414.0, 288.0, 183.0, 109.0, 88.0, 51.0, 47.0, 33.0, 21.0, 21.0, 13.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.568359375, -0.5491485595703125, -0.529937744140625, -0.5107269287109375, -0.49151611328125, -0.4723052978515625, -0.453094482421875, -0.4338836669921875, -0.4146728515625, -0.3954620361328125, -0.376251220703125, -0.3570404052734375, -0.33782958984375, -0.3186187744140625, -0.299407958984375, -0.2801971435546875, -0.260986328125, -0.2417755126953125, -0.222564697265625, -0.2033538818359375, -0.18414306640625, -0.1649322509765625, -0.145721435546875, -0.1265106201171875, -0.1072998046875, -0.0880889892578125, -0.068878173828125, -0.0496673583984375, -0.03045654296875, -0.0112457275390625, 0.007965087890625, 0.0271759033203125, 0.04638671875, 0.0655975341796875, 0.084808349609375, 0.1040191650390625, 0.12322998046875, 0.1424407958984375, 0.161651611328125, 0.1808624267578125, 0.2000732421875, 0.2192840576171875, 0.238494873046875, 0.2577056884765625, 0.27691650390625, 0.2961273193359375, 0.315338134765625, 0.3345489501953125, 0.353759765625, 0.3729705810546875, 0.392181396484375, 0.4113922119140625, 0.43060302734375, 0.4498138427734375, 0.469024658203125, 0.4882354736328125, 0.5074462890625, 0.5266571044921875, 0.545867919921875, 0.5650787353515625, 0.58428955078125, 0.6035003662109375, 0.622711181640625, 0.6419219970703125, 0.6611328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 9.0, 4.0, 3.0, 10.0, 11.0, 9.0, 13.0, 18.0, 28.0, 32.0, 32.0, 29.0, 39.0, 44.0, 46.0, 56.0, 62.0, 51.0, 50.0, 49.0, 55.0, 45.0, 39.0, 41.0, 37.0, 33.0, 28.0, 24.0, 19.0, 19.0, 15.0, 17.0, 11.0, 6.0, 5.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.07421875, -2.989471435546875, -2.90472412109375, -2.819976806640625, -2.7352294921875, -2.650482177734375, -2.56573486328125, -2.480987548828125, -2.396240234375, -2.311492919921875, -2.22674560546875, -2.141998291015625, -2.0572509765625, -1.972503662109375, -1.88775634765625, -1.803009033203125, -1.71826171875, -1.633514404296875, -1.54876708984375, -1.464019775390625, -1.3792724609375, -1.294525146484375, -1.20977783203125, -1.125030517578125, -1.040283203125, -0.955535888671875, -0.87078857421875, -0.786041259765625, -0.7012939453125, -0.616546630859375, -0.53179931640625, -0.447052001953125, -0.3623046875, -0.277557373046875, -0.19281005859375, -0.108062744140625, -0.0233154296875, 0.061431884765625, 0.14617919921875, 0.230926513671875, 0.315673828125, 0.400421142578125, 0.48516845703125, 0.569915771484375, 0.6546630859375, 0.739410400390625, 0.82415771484375, 0.908905029296875, 0.99365234375, 1.078399658203125, 1.16314697265625, 1.247894287109375, 1.3326416015625, 1.417388916015625, 1.50213623046875, 1.586883544921875, 1.671630859375, 1.756378173828125, 1.84112548828125, 1.925872802734375, 2.0106201171875, 2.095367431640625, 2.18011474609375, 2.264862060546875, 2.349609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 7.0, 11.0, 18.0, 14.0, 24.0, 41.0, 59.0, 70.0, 103.0, 151.0, 214.0, 388.0, 619.0, 1018.0, 1729.0, 3519.0, 7613.0, 18898.0, 58606.0, 264588.0, 513796.0, 121037.0, 32795.0, 11987.0, 5145.0, 2517.0, 1347.0, 820.0, 488.0, 276.0, 195.0, 129.0, 94.0, 72.0, 39.0, 25.0, 15.0, 25.0, 12.0, 15.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2139892578125, -0.20714378356933594, -0.20029830932617188, -0.1934528350830078, -0.18660736083984375, -0.1797618865966797, -0.17291641235351562, -0.16607093811035156, -0.1592254638671875, -0.15237998962402344, -0.14553451538085938, -0.1386890411376953, -0.13184356689453125, -0.12499809265136719, -0.11815261840820312, -0.11130714416503906, -0.104461669921875, -0.09761619567871094, -0.09077072143554688, -0.08392524719238281, -0.07707977294921875, -0.07023429870605469, -0.06338882446289062, -0.05654335021972656, -0.0496978759765625, -0.04285240173339844, -0.036006927490234375, -0.029161453247070312, -0.02231597900390625, -0.015470504760742188, -0.008625030517578125, -0.0017795562744140625, 0.00506591796875, 0.011911392211914062, 0.018756866455078125, 0.025602340698242188, 0.03244781494140625, 0.03929328918457031, 0.046138763427734375, 0.05298423767089844, 0.0598297119140625, 0.06667518615722656, 0.07352066040039062, 0.08036613464355469, 0.08721160888671875, 0.09405708312988281, 0.10090255737304688, 0.10774803161621094, 0.114593505859375, 0.12143898010253906, 0.12828445434570312, 0.1351299285888672, 0.14197540283203125, 0.1488208770751953, 0.15566635131835938, 0.16251182556152344, 0.1693572998046875, 0.17620277404785156, 0.18304824829101562, 0.1898937225341797, 0.19673919677734375, 0.2035846710205078, 0.21043014526367188, 0.21727561950683594, 0.22412109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 22.0, 25.0, 42.0, 63.0, 90.0, 130.0, 147.0, 127.0, 100.0, 52.0, 38.0, 32.0, 19.0, 13.0, 10.0, 17.0, 4.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020742416381835938, -0.00020189769566059113, -0.00019637122750282288, -0.00019084475934505463, -0.00018531829118728638, -0.00017979182302951813, -0.00017426535487174988, -0.00016873888671398163, -0.00016321241855621338, -0.00015768595039844513, -0.00015215948224067688, -0.00014663301408290863, -0.00014110654592514038, -0.00013558007776737213, -0.00013005360960960388, -0.00012452714145183563, -0.00011900067329406738, -0.00011347420513629913, -0.00010794773697853088, -0.00010242126882076263, -9.689480066299438e-05, -9.136833250522614e-05, -8.584186434745789e-05, -8.031539618968964e-05, -7.478892803192139e-05, -6.926245987415314e-05, -6.373599171638489e-05, -5.820952355861664e-05, -5.268305540084839e-05, -4.715658724308014e-05, -4.163011908531189e-05, -3.610365092754364e-05, -3.057718276977539e-05, -2.505071461200714e-05, -1.952424645423889e-05, -1.3997778296470642e-05, -8.471310138702393e-06, -2.944841980934143e-06, 2.5816261768341064e-06, 8.108094334602356e-06, 1.3634562492370605e-05, 1.9161030650138855e-05, 2.4687498807907104e-05, 3.0213966965675354e-05, 3.5740435123443604e-05, 4.126690328121185e-05, 4.67933714389801e-05, 5.231983959674835e-05, 5.78463077545166e-05, 6.337277591228485e-05, 6.88992440700531e-05, 7.442571222782135e-05, 7.99521803855896e-05, 8.547864854335785e-05, 9.10051167011261e-05, 9.653158485889435e-05, 0.0001020580530166626, 0.00010758452117443085, 0.0001131109893321991, 0.00011863745748996735, 0.0001241639256477356, 0.00012969039380550385, 0.0001352168619632721, 0.00014074333012104034, 0.0001462697982788086]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 13.0, 15.0, 12.0, 30.0, 33.0, 47.0, 59.0, 76.0, 109.0, 150.0, 202.0, 330.0, 503.0, 739.0, 1054.0, 1807.0, 2907.0, 4939.0, 8927.0, 18069.0, 42200.0, 119242.0, 369267.0, 311914.0, 95328.0, 35150.0, 15616.0, 7941.0, 4403.0, 2559.0, 1640.0, 998.0, 701.0, 443.0, 309.0, 226.0, 148.0, 113.0, 80.0, 71.0, 44.0, 30.0, 27.0, 23.0, 12.0, 9.0, 10.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1715087890625, -0.16613388061523438, -0.16075897216796875, -0.15538406372070312, -0.1500091552734375, -0.14463424682617188, -0.13925933837890625, -0.13388442993164062, -0.128509521484375, -0.12313461303710938, -0.11775970458984375, -0.11238479614257812, -0.1070098876953125, -0.10163497924804688, -0.09626007080078125, -0.09088516235351562, -0.08551025390625, -0.08013534545898438, -0.07476043701171875, -0.06938552856445312, -0.0640106201171875, -0.058635711669921875, -0.05326080322265625, -0.047885894775390625, -0.042510986328125, -0.037136077880859375, -0.03176116943359375, -0.026386260986328125, -0.0210113525390625, -0.015636444091796875, -0.01026153564453125, -0.004886627197265625, 0.00048828125, 0.005863189697265625, 0.01123809814453125, 0.016613006591796875, 0.0219879150390625, 0.027362823486328125, 0.03273773193359375, 0.038112640380859375, 0.043487548828125, 0.048862457275390625, 0.05423736572265625, 0.059612274169921875, 0.0649871826171875, 0.07036209106445312, 0.07573699951171875, 0.08111190795898438, 0.08648681640625, 0.09186172485351562, 0.09723663330078125, 0.10261154174804688, 0.1079864501953125, 0.11336135864257812, 0.11873626708984375, 0.12411117553710938, 0.129486083984375, 0.13486099243164062, 0.14023590087890625, 0.14561080932617188, 0.1509857177734375, 0.15636062622070312, 0.16173553466796875, 0.16711044311523438, 0.1724853515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 10.0, 22.0, 21.0, 24.0, 32.0, 41.0, 58.0, 86.0, 76.0, 83.0, 111.0, 72.0, 72.0, 52.0, 46.0, 26.0, 29.0, 20.0, 25.0, 13.0, 10.0, 4.0, 8.0, 6.0, 1.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.06111574172973633, -0.059182167053222656, -0.057248592376708984, -0.05531501770019531, -0.05338144302368164, -0.05144786834716797, -0.0495142936706543, -0.047580718994140625, -0.04564714431762695, -0.04371356964111328, -0.04177999496459961, -0.03984642028808594, -0.037912845611572266, -0.035979270935058594, -0.03404569625854492, -0.03211212158203125, -0.030178546905517578, -0.028244972229003906, -0.026311397552490234, -0.024377822875976562, -0.02244424819946289, -0.02051067352294922, -0.018577098846435547, -0.016643524169921875, -0.014709949493408203, -0.012776374816894531, -0.01084280014038086, -0.008909225463867188, -0.006975650787353516, -0.005042076110839844, -0.003108501434326172, -0.0011749267578125, 0.0007586479187011719, 0.0026922225952148438, 0.004625797271728516, 0.0065593719482421875, 0.00849294662475586, 0.010426521301269531, 0.012360095977783203, 0.014293670654296875, 0.016227245330810547, 0.01816082000732422, 0.02009439468383789, 0.022027969360351562, 0.023961544036865234, 0.025895118713378906, 0.027828693389892578, 0.02976226806640625, 0.03169584274291992, 0.033629417419433594, 0.035562992095947266, 0.03749656677246094, 0.03943014144897461, 0.04136371612548828, 0.04329729080200195, 0.045230865478515625, 0.0471644401550293, 0.04909801483154297, 0.05103158950805664, 0.05296516418457031, 0.054898738861083984, 0.056832313537597656, 0.05876588821411133, 0.060699462890625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 4.0, 8.0, 7.0, 8.0, 17.0, 24.0, 26.0, 60.0, 58.0, 80.0, 83.0, 91.0, 98.0, 80.0, 72.0, 67.0, 53.0, 37.0, 24.0, 28.0, 18.0, 14.0, 3.0, 8.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.9908307790756226, -1.9362215995788574, -1.8816124200820923, -1.8270032405853271, -1.7723939418792725, -1.7177847623825073, -1.6631755828857422, -1.608566403388977, -1.553957223892212, -1.4993480443954468, -1.4447388648986816, -1.390129566192627, -1.3355203866958618, -1.2809112071990967, -1.2263020277023315, -1.1716928482055664, -1.1170835494995117, -1.0624743700027466, -1.0078651905059814, -0.9532559514045715, -0.8986467123031616, -0.8440375328063965, -0.7894283533096313, -0.7348191738128662, -0.6802099347114563, -0.6256007552146912, -0.5709915161132812, -0.5163823366165161, -0.4617731273174286, -0.40716391801834106, -0.3525547385215759, -0.2979455292224884, -0.24333643913269043, -0.1887272298336029, -0.13411803543567657, -0.07950884103775024, -0.02489963173866272, 0.029709577560424805, 0.08431875705718994, 0.13892796635627747, 0.193537175655365, 0.24814638495445251, 0.30275559425354004, 0.3573647737503052, 0.4119739830493927, 0.4665831923484802, 0.5211923718452454, 0.5758016109466553, 0.6304107904434204, 0.6850199699401855, 0.7396292090415955, 0.7942383885383606, 0.8488476276397705, 0.9034568071365356, 0.9580659866333008, 1.012675166130066, 1.067284345626831, 1.1218935251235962, 1.1765027046203613, 1.231112003326416, 1.2857211828231812, 1.3403303623199463, 1.3949395418167114, 1.4495487213134766, 1.5041580200195312]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 5.0, 8.0, 11.0, 14.0, 14.0, 12.0, 24.0, 16.0, 28.0, 22.0, 27.0, 25.0, 31.0, 37.0, 29.0, 30.0, 44.0, 33.0, 43.0, 37.0, 50.0, 38.0, 49.0, 31.0, 31.0, 25.0, 30.0, 35.0, 24.0, 18.0, 25.0, 15.0, 23.0, 11.0, 16.0, 8.0, 11.0, 10.0, 10.0, 6.0, 8.0, 3.0, 7.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0005931854248047, -0.969087541103363, -0.9375819563865662, -0.9060763120651245, -0.8745707273483276, -0.843065083026886, -0.8115594387054443, -0.7800538539886475, -0.7485482692718506, -0.7170426249504089, -0.6855370402336121, -0.6540313959121704, -0.6225258111953735, -0.5910201668739319, -0.5595145225524902, -0.5280089378356934, -0.4965032935142517, -0.46499767899513245, -0.4334920644760132, -0.40198642015457153, -0.37048083543777466, -0.338975191116333, -0.30746957659721375, -0.2759639620780945, -0.24445834755897522, -0.21295273303985596, -0.1814471185207367, -0.14994148910045624, -0.11843587458133698, -0.08693026006221771, -0.055424630641937256, -0.023919016122817993, 0.0075865983963012695, 0.03909221664071083, 0.07059783488512039, 0.10210345685482025, 0.13360907137393951, 0.16511468589305878, 0.19662031531333923, 0.2281259298324585, 0.25963154435157776, 0.291137158870697, 0.3226427733898163, 0.35414838790893555, 0.3856540322303772, 0.4171596169471741, 0.4486652612686157, 0.480170875787735, 0.5116764903068542, 0.5431821346282959, 0.5746877193450928, 0.6061933636665344, 0.6376989483833313, 0.669204592704773, 0.7007101774215698, 0.7322158217430115, 0.7637214660644531, 0.7952271103858948, 0.8267326951026917, 0.8582383394241333, 0.8897439241409302, 0.9212495684623718, 0.9527552127838135, 0.9842607975006104, 1.0157663822174072]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 19.0, 11.0, 19.0, 28.0, 35.0, 46.0, 60.0, 67.0, 126.0, 140.0, 213.0, 284.0, 437.0, 638.0, 1016.0, 1466.0, 2525.0, 4302.0, 8760.0, 22613.0, 113992.0, 729505.0, 118474.0, 23475.0, 8687.0, 4270.0, 2582.0, 1539.0, 1036.0, 635.0, 459.0, 292.0, 198.0, 167.0, 106.0, 91.0, 63.0, 38.0, 38.0, 15.0, 19.0, 21.0, 10.0, 12.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.4052734375, -1.3620452880859375, -1.318817138671875, -1.2755889892578125, -1.23236083984375, -1.1891326904296875, -1.145904541015625, -1.1026763916015625, -1.0594482421875, -1.0162200927734375, -0.972991943359375, -0.9297637939453125, -0.88653564453125, -0.8433074951171875, -0.800079345703125, -0.7568511962890625, -0.713623046875, -0.6703948974609375, -0.627166748046875, -0.5839385986328125, -0.54071044921875, -0.4974822998046875, -0.454254150390625, -0.4110260009765625, -0.3677978515625, -0.3245697021484375, -0.281341552734375, -0.2381134033203125, -0.19488525390625, -0.1516571044921875, -0.108428955078125, -0.0652008056640625, -0.02197265625, 0.0212554931640625, 0.064483642578125, 0.1077117919921875, 0.15093994140625, 0.1941680908203125, 0.237396240234375, 0.2806243896484375, 0.3238525390625, 0.3670806884765625, 0.410308837890625, 0.4535369873046875, 0.49676513671875, 0.5399932861328125, 0.583221435546875, 0.6264495849609375, 0.669677734375, 0.7129058837890625, 0.756134033203125, 0.7993621826171875, 0.84259033203125, 0.8858184814453125, 0.929046630859375, 0.9722747802734375, 1.0155029296875, 1.0587310791015625, 1.101959228515625, 1.1451873779296875, 1.18841552734375, 1.2316436767578125, 1.274871826171875, 1.3180999755859375, 1.361328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 2.0, 8.0, 9.0, 10.0, 15.0, 22.0, 19.0, 21.0, 22.0, 20.0, 30.0, 28.0, 40.0, 33.0, 39.0, 51.0, 45.0, 40.0, 56.0, 49.0, 62.0, 40.0, 40.0, 34.0, 35.0, 22.0, 23.0, 29.0, 27.0, 23.0, 10.0, 24.0, 13.0, 9.0, 9.0, 10.0, 9.0, 4.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3828125, -2.308319091796875, -2.23382568359375, -2.159332275390625, -2.0848388671875, -2.010345458984375, -1.93585205078125, -1.861358642578125, -1.786865234375, -1.712371826171875, -1.63787841796875, -1.563385009765625, -1.4888916015625, -1.414398193359375, -1.33990478515625, -1.265411376953125, -1.19091796875, -1.116424560546875, -1.04193115234375, -0.967437744140625, -0.8929443359375, -0.818450927734375, -0.74395751953125, -0.669464111328125, -0.594970703125, -0.520477294921875, -0.44598388671875, -0.371490478515625, -0.2969970703125, -0.222503662109375, -0.14801025390625, -0.073516845703125, 0.0009765625, 0.075469970703125, 0.14996337890625, 0.224456787109375, 0.2989501953125, 0.373443603515625, 0.44793701171875, 0.522430419921875, 0.596923828125, 0.671417236328125, 0.74591064453125, 0.820404052734375, 0.8948974609375, 0.969390869140625, 1.04388427734375, 1.118377685546875, 1.19287109375, 1.267364501953125, 1.34185791015625, 1.416351318359375, 1.4908447265625, 1.565338134765625, 1.63983154296875, 1.714324951171875, 1.788818359375, 1.863311767578125, 1.93780517578125, 2.012298583984375, 2.0867919921875, 2.161285400390625, 2.23577880859375, 2.310272216796875, 2.384765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 12.0, 11.0, 12.0, 11.0, 18.0, 17.0, 22.0, 19.0, 34.0, 71.0, 79.0, 114.0, 259.0, 774.0, 6273.0, 1024550.0, 14481.0, 1014.0, 303.0, 123.0, 85.0, 46.0, 36.0, 37.0, 24.0, 20.0, 18.0, 14.0, 13.0, 8.0, 8.0, 6.0, 9.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9375, -7.7012939453125, -7.465087890625, -7.2288818359375, -6.99267578125, -6.7564697265625, -6.520263671875, -6.2840576171875, -6.0478515625, -5.8116455078125, -5.575439453125, -5.3392333984375, -5.10302734375, -4.8668212890625, -4.630615234375, -4.3944091796875, -4.158203125, -3.9219970703125, -3.685791015625, -3.4495849609375, -3.21337890625, -2.9771728515625, -2.740966796875, -2.5047607421875, -2.2685546875, -2.0323486328125, -1.796142578125, -1.5599365234375, -1.32373046875, -1.0875244140625, -0.851318359375, -0.6151123046875, -0.37890625, -0.1427001953125, 0.093505859375, 0.3297119140625, 0.56591796875, 0.8021240234375, 1.038330078125, 1.2745361328125, 1.5107421875, 1.7469482421875, 1.983154296875, 2.2193603515625, 2.45556640625, 2.6917724609375, 2.927978515625, 3.1641845703125, 3.400390625, 3.6365966796875, 3.872802734375, 4.1090087890625, 4.34521484375, 4.5814208984375, 4.817626953125, 5.0538330078125, 5.2900390625, 5.5262451171875, 5.762451171875, 5.9986572265625, 6.23486328125, 6.4710693359375, 6.707275390625, 6.9434814453125, 7.1796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 4.0, 11.0, 13.0, 11.0, 8.0, 15.0, 20.0, 15.0, 22.0, 20.0, 35.0, 40.0, 47.0, 55.0, 42.0, 43.0, 47.0, 56.0, 63.0, 47.0, 49.0, 41.0, 40.0, 37.0, 28.0, 34.0, 22.0, 17.0, 26.0, 12.0, 16.0, 10.0, 7.0, 7.0, 4.0, 8.0, 9.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.20703125, -3.116729736328125, -3.02642822265625, -2.936126708984375, -2.8458251953125, -2.755523681640625, -2.66522216796875, -2.574920654296875, -2.484619140625, -2.394317626953125, -2.30401611328125, -2.213714599609375, -2.1234130859375, -2.033111572265625, -1.94281005859375, -1.852508544921875, -1.76220703125, -1.671905517578125, -1.58160400390625, -1.491302490234375, -1.4010009765625, -1.310699462890625, -1.22039794921875, -1.130096435546875, -1.039794921875, -0.949493408203125, -0.85919189453125, -0.768890380859375, -0.6785888671875, -0.588287353515625, -0.49798583984375, -0.407684326171875, -0.3173828125, -0.227081298828125, -0.13677978515625, -0.046478271484375, 0.0438232421875, 0.134124755859375, 0.22442626953125, 0.314727783203125, 0.405029296875, 0.495330810546875, 0.58563232421875, 0.675933837890625, 0.7662353515625, 0.856536865234375, 0.94683837890625, 1.037139892578125, 1.12744140625, 1.217742919921875, 1.30804443359375, 1.398345947265625, 1.4886474609375, 1.578948974609375, 1.66925048828125, 1.759552001953125, 1.849853515625, 1.940155029296875, 2.03045654296875, 2.120758056640625, 2.2110595703125, 2.301361083984375, 2.39166259765625, 2.481964111328125, 2.572265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 13.0, 25.0, 34.0, 74.0, 246.0, 1112.0, 12556.0, 999263.0, 32899.0, 1801.0, 303.0, 103.0, 46.0, 17.0, 16.0, 12.0, 12.0, 3.0, 3.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73046875, -1.67205810546875, -1.6136474609375, -1.55523681640625, -1.496826171875, -1.43841552734375, -1.3800048828125, -1.32159423828125, -1.26318359375, -1.20477294921875, -1.1463623046875, -1.08795166015625, -1.029541015625, -0.97113037109375, -0.9127197265625, -0.85430908203125, -0.7958984375, -0.73748779296875, -0.6790771484375, -0.62066650390625, -0.562255859375, -0.50384521484375, -0.4454345703125, -0.38702392578125, -0.32861328125, -0.27020263671875, -0.2117919921875, -0.15338134765625, -0.094970703125, -0.03656005859375, 0.0218505859375, 0.08026123046875, 0.138671875, 0.19708251953125, 0.2554931640625, 0.31390380859375, 0.372314453125, 0.43072509765625, 0.4891357421875, 0.54754638671875, 0.60595703125, 0.66436767578125, 0.7227783203125, 0.78118896484375, 0.839599609375, 0.89801025390625, 0.9564208984375, 1.01483154296875, 1.0732421875, 1.13165283203125, 1.1900634765625, 1.24847412109375, 1.306884765625, 1.36529541015625, 1.4237060546875, 1.48211669921875, 1.54052734375, 1.59893798828125, 1.6573486328125, 1.71575927734375, 1.774169921875, 1.83258056640625, 1.8909912109375, 1.94940185546875, 2.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 3.0, 2.0, 12.0, 11.0, 23.0, 30.0, 51.0, 97.0, 216.0, 257.0, 130.0, 70.0, 26.0, 19.0, 11.0, 13.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.212162017822266e-05, -6.886385381221771e-05, -6.560608744621277e-05, -6.234832108020782e-05, -5.909055471420288e-05, -5.583278834819794e-05, -5.257502198219299e-05, -4.931725561618805e-05, -4.6059489250183105e-05, -4.280172288417816e-05, -3.954395651817322e-05, -3.6286190152168274e-05, -3.302842378616333e-05, -2.9770657420158386e-05, -2.6512891054153442e-05, -2.32551246881485e-05, -1.9997358322143555e-05, -1.673959195613861e-05, -1.3481825590133667e-05, -1.0224059224128723e-05, -6.966292858123779e-06, -3.7085264921188354e-06, -4.507601261138916e-07, 2.8070062398910522e-06, 6.064772605895996e-06, 9.32253897190094e-06, 1.2580305337905884e-05, 1.5838071703910828e-05, 1.909583806991577e-05, 2.2353604435920715e-05, 2.561137080192566e-05, 2.8869137167930603e-05, 3.212690353393555e-05, 3.538466989994049e-05, 3.8642436265945435e-05, 4.190020263195038e-05, 4.515796899795532e-05, 4.8415735363960266e-05, 5.167350172996521e-05, 5.4931268095970154e-05, 5.81890344619751e-05, 6.144680082798004e-05, 6.470456719398499e-05, 6.796233355998993e-05, 7.122009992599487e-05, 7.447786629199982e-05, 7.773563265800476e-05, 8.09933990240097e-05, 8.425116539001465e-05, 8.750893175601959e-05, 9.076669812202454e-05, 9.402446448802948e-05, 9.728223085403442e-05, 0.00010053999722003937, 0.00010379776358604431, 0.00010705552995204926, 0.0001103132963180542, 0.00011357106268405914, 0.00011682882905006409, 0.00012008659541606903, 0.00012334436178207397, 0.00012660212814807892, 0.00012985989451408386, 0.0001331176608800888, 0.00013637542724609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 13.0, 27.0, 25.0, 64.0, 196.0, 425.0, 1761.0, 10819.0, 376152.0, 642989.0, 13154.0, 1998.0, 526.0, 184.0, 97.0, 41.0, 17.0, 18.0, 9.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.359375, -1.3270416259765625, -1.294708251953125, -1.2623748779296875, -1.23004150390625, -1.1977081298828125, -1.165374755859375, -1.1330413818359375, -1.1007080078125, -1.0683746337890625, -1.036041259765625, -1.0037078857421875, -0.97137451171875, -0.9390411376953125, -0.906707763671875, -0.8743743896484375, -0.842041015625, -0.8097076416015625, -0.777374267578125, -0.7450408935546875, -0.71270751953125, -0.6803741455078125, -0.648040771484375, -0.6157073974609375, -0.5833740234375, -0.5510406494140625, -0.518707275390625, -0.4863739013671875, -0.45404052734375, -0.4217071533203125, -0.389373779296875, -0.3570404052734375, -0.32470703125, -0.2923736572265625, -0.260040283203125, -0.2277069091796875, -0.19537353515625, -0.1630401611328125, -0.130706787109375, -0.0983734130859375, -0.0660400390625, -0.0337066650390625, -0.001373291015625, 0.0309600830078125, 0.06329345703125, 0.0956268310546875, 0.127960205078125, 0.1602935791015625, 0.192626953125, 0.2249603271484375, 0.257293701171875, 0.2896270751953125, 0.32196044921875, 0.3542938232421875, 0.386627197265625, 0.4189605712890625, 0.4512939453125, 0.4836273193359375, 0.515960693359375, 0.5482940673828125, 0.58062744140625, 0.6129608154296875, 0.645294189453125, 0.6776275634765625, 0.7099609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 17.0, 23.0, 24.0, 20.0, 41.0, 75.0, 121.0, 230.0, 174.0, 64.0, 53.0, 40.0, 19.0, 22.0, 17.0, 14.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201171875, -0.1943645477294922, -0.18755722045898438, -0.18074989318847656, -0.17394256591796875, -0.16713523864746094, -0.16032791137695312, -0.1535205841064453, -0.1467132568359375, -0.1399059295654297, -0.13309860229492188, -0.12629127502441406, -0.11948394775390625, -0.11267662048339844, -0.10586929321289062, -0.09906196594238281, -0.092254638671875, -0.08544731140136719, -0.07863998413085938, -0.07183265686035156, -0.06502532958984375, -0.05821800231933594, -0.051410675048828125, -0.04460334777832031, -0.0377960205078125, -0.030988693237304688, -0.024181365966796875, -0.017374038696289062, -0.01056671142578125, -0.0037593841552734375, 0.003047943115234375, 0.009855270385742188, 0.01666259765625, 0.023469924926757812, 0.030277252197265625, 0.03708457946777344, 0.04389190673828125, 0.05069923400878906, 0.057506561279296875, 0.06431388854980469, 0.0711212158203125, 0.07792854309082031, 0.08473587036132812, 0.09154319763183594, 0.09835052490234375, 0.10515785217285156, 0.11196517944335938, 0.11877250671386719, 0.125579833984375, 0.1323871612548828, 0.13919448852539062, 0.14600181579589844, 0.15280914306640625, 0.15961647033691406, 0.16642379760742188, 0.1732311248779297, 0.1800384521484375, 0.1868457794189453, 0.19365310668945312, 0.20046043395996094, 0.20726776123046875, 0.21407508850097656, 0.22088241577148438, 0.2276897430419922, 0.2344970703125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 27.0, 119.0, 520.0, 285.0, 54.0, 7.0, 3.0], "bins": [-39.530670166015625, -38.8690071105957, -38.20734405517578, -37.545677185058594, -36.88401412963867, -36.22235107421875, -35.56068801879883, -34.899024963378906, -34.23735809326172, -33.5756950378418, -32.914031982421875, -32.25236511230469, -31.590702056884766, -30.929039001464844, -30.26737403869629, -29.605710983276367, -28.944047927856445, -28.282384872436523, -27.62071990966797, -26.959056854248047, -26.297391891479492, -25.63572883605957, -24.974063873291016, -24.312400817871094, -23.650737762451172, -22.98907470703125, -22.327409744262695, -21.665746688842773, -21.00408172607422, -20.342418670654297, -19.680753707885742, -19.01909065246582, -18.3574275970459, -17.695764541625977, -17.034099578857422, -16.3724365234375, -15.710771560668945, -15.049108505249023, -14.387444496154785, -13.725780487060547, -13.064115524291992, -12.402451515197754, -11.740787506103516, -11.079123497009277, -10.417459487915039, -9.755796432495117, -9.094132423400879, -8.43246841430664, -7.7708048820495605, -7.109140872955322, -6.447477340698242, -5.785813331604004, -5.124149322509766, -4.462485313415527, -3.800821542739868, -3.139157772064209, -2.4774937629699707, -1.815829873085022, -1.1541659832000732, -0.4925020933151245, 0.16916179656982422, 0.8308258056640625, 1.4924895763397217, 2.154153347015381, 2.815817356109619]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 10.0, 10.0, 13.0, 9.0, 14.0, 17.0, 27.0, 26.0, 29.0, 28.0, 30.0, 33.0, 35.0, 36.0, 40.0, 46.0, 49.0, 50.0, 50.0, 56.0, 37.0, 40.0, 52.0, 24.0, 32.0, 35.0, 18.0, 21.0, 22.0, 14.0, 22.0, 19.0, 13.0, 8.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1127829551696777, -2.9984607696533203, -2.884138822555542, -2.7698166370391846, -2.655494451522827, -2.541172504425049, -2.4268503189086914, -2.312528133392334, -2.1982059478759766, -2.083883762359619, -1.9695616960525513, -1.8552396297454834, -1.740917444229126, -1.626595377922058, -1.5122733116149902, -1.3979511260986328, -1.283629059791565, -1.169306993484497, -1.0549848079681396, -0.9406627416610718, -0.8263405561447144, -0.7120184898376465, -0.5976963639259338, -0.4833742380142212, -0.36905211210250854, -0.2547299861907959, -0.14040787518024445, -0.026085764169692993, 0.08823636174201965, 0.2025584578514099, 0.31688058376312256, 0.4312027096748352, 0.5455248355865479, 0.6598469614982605, 0.7741690874099731, 0.888491153717041, 1.0028133392333984, 1.1171354055404663, 1.2314574718475342, 1.3457796573638916, 1.460101842880249, 1.574423909187317, 1.6887460947036743, 1.8030681610107422, 1.9173903465270996, 2.031712532043457, 2.1460344791412354, 2.2603566646575928, 2.374678611755371, 2.4890007972717285, 2.603322744369507, 2.7176449298858643, 2.8319671154022217, 2.9462890625, 3.0606112480163574, 3.174933433532715, 3.2892556190490723, 3.4035778045654297, 3.517899751663208, 3.6322219371795654, 3.746544122695923, 3.860866069793701, 3.9751882553100586, 4.089510440826416, 4.203832626342773]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 11.0, 11.0, 30.0, 24.0, 35.0, 38.0, 58.0, 78.0, 118.0, 168.0, 275.0, 429.0, 733.0, 1271.0, 2220.0, 4499.0, 12473.0, 78818.0, 1121400.0, 2696247.0, 237757.0, 24338.0, 6659.0, 2946.0, 1419.0, 774.0, 455.0, 326.0, 198.0, 156.0, 98.0, 59.0, 36.0, 25.0, 22.0, 13.0, 9.0, 7.0, 12.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.796875, -3.689056396484375, -3.58123779296875, -3.473419189453125, -3.3656005859375, -3.257781982421875, -3.14996337890625, -3.042144775390625, -2.934326171875, -2.826507568359375, -2.71868896484375, -2.610870361328125, -2.5030517578125, -2.395233154296875, -2.28741455078125, -2.179595947265625, -2.07177734375, -1.963958740234375, -1.85614013671875, -1.748321533203125, -1.6405029296875, -1.532684326171875, -1.42486572265625, -1.317047119140625, -1.209228515625, -1.101409912109375, -0.99359130859375, -0.885772705078125, -0.7779541015625, -0.670135498046875, -0.56231689453125, -0.454498291015625, -0.3466796875, -0.238861083984375, -0.13104248046875, -0.023223876953125, 0.0845947265625, 0.192413330078125, 0.30023193359375, 0.408050537109375, 0.515869140625, 0.623687744140625, 0.73150634765625, 0.839324951171875, 0.9471435546875, 1.054962158203125, 1.16278076171875, 1.270599365234375, 1.37841796875, 1.486236572265625, 1.59405517578125, 1.701873779296875, 1.8096923828125, 1.917510986328125, 2.02532958984375, 2.133148193359375, 2.240966796875, 2.348785400390625, 2.45660400390625, 2.564422607421875, 2.6722412109375, 2.780059814453125, 2.88787841796875, 2.995697021484375, 3.103515625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 7.0, 7.0, 3.0, 10.0, 10.0, 8.0, 10.0, 18.0, 21.0, 23.0, 34.0, 27.0, 27.0, 26.0, 44.0, 47.0, 51.0, 50.0, 36.0, 56.0, 41.0, 50.0, 39.0, 49.0, 52.0, 33.0, 42.0, 36.0, 23.0, 20.0, 20.0, 17.0, 20.0, 6.0, 9.0, 6.0, 5.0, 3.0, 5.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4932403564453125, -1.446441650390625, -1.3996429443359375, -1.35284423828125, -1.3060455322265625, -1.259246826171875, -1.2124481201171875, -1.1656494140625, -1.1188507080078125, -1.072052001953125, -1.0252532958984375, -0.97845458984375, -0.9316558837890625, -0.884857177734375, -0.8380584716796875, -0.791259765625, -0.7444610595703125, -0.697662353515625, -0.6508636474609375, -0.60406494140625, -0.5572662353515625, -0.510467529296875, -0.4636688232421875, -0.4168701171875, -0.3700714111328125, -0.323272705078125, -0.2764739990234375, -0.22967529296875, -0.1828765869140625, -0.136077880859375, -0.0892791748046875, -0.04248046875, 0.0043182373046875, 0.051116943359375, 0.0979156494140625, 0.14471435546875, 0.1915130615234375, 0.238311767578125, 0.2851104736328125, 0.3319091796875, 0.3787078857421875, 0.425506591796875, 0.4723052978515625, 0.51910400390625, 0.5659027099609375, 0.612701416015625, 0.6595001220703125, 0.706298828125, 0.7530975341796875, 0.799896240234375, 0.8466949462890625, 0.89349365234375, 0.9402923583984375, 0.987091064453125, 1.0338897705078125, 1.0806884765625, 1.1274871826171875, 1.174285888671875, 1.2210845947265625, 1.26788330078125, 1.3146820068359375, 1.361480712890625, 1.4082794189453125, 1.455078125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 9.0, 7.0, 7.0, 13.0, 12.0, 22.0, 30.0, 61.0, 99.0, 176.0, 313.0, 717.0, 1587.0, 4443.0, 17318.0, 168149.0, 3814817.0, 162101.0, 16936.0, 4436.0, 1530.0, 725.0, 337.0, 165.0, 93.0, 62.0, 34.0, 18.0, 13.0, 15.0, 11.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.765625, -3.628662109375, -3.49169921875, -3.354736328125, -3.2177734375, -3.080810546875, -2.94384765625, -2.806884765625, -2.669921875, -2.532958984375, -2.39599609375, -2.259033203125, -2.1220703125, -1.985107421875, -1.84814453125, -1.711181640625, -1.57421875, -1.437255859375, -1.30029296875, -1.163330078125, -1.0263671875, -0.889404296875, -0.75244140625, -0.615478515625, -0.478515625, -0.341552734375, -0.20458984375, -0.067626953125, 0.0693359375, 0.206298828125, 0.34326171875, 0.480224609375, 0.6171875, 0.754150390625, 0.89111328125, 1.028076171875, 1.1650390625, 1.302001953125, 1.43896484375, 1.575927734375, 1.712890625, 1.849853515625, 1.98681640625, 2.123779296875, 2.2607421875, 2.397705078125, 2.53466796875, 2.671630859375, 2.80859375, 2.945556640625, 3.08251953125, 3.219482421875, 3.3564453125, 3.493408203125, 3.63037109375, 3.767333984375, 3.904296875, 4.041259765625, 4.17822265625, 4.315185546875, 4.4521484375, 4.589111328125, 4.72607421875, 4.863037109375, 5.0]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 4.0, 7.0, 11.0, 8.0, 18.0, 22.0, 23.0, 30.0, 61.0, 90.0, 164.0, 304.0, 486.0, 857.0, 817.0, 511.0, 252.0, 142.0, 87.0, 51.0, 28.0, 26.0, 18.0, 12.0, 11.0, 4.0, 9.0, 1.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0556640625, -1.0245361328125, -0.993408203125, -0.9622802734375, -0.93115234375, -0.9000244140625, -0.868896484375, -0.8377685546875, -0.806640625, -0.7755126953125, -0.744384765625, -0.7132568359375, -0.68212890625, -0.6510009765625, -0.619873046875, -0.5887451171875, -0.5576171875, -0.5264892578125, -0.495361328125, -0.4642333984375, -0.43310546875, -0.4019775390625, -0.370849609375, -0.3397216796875, -0.30859375, -0.2774658203125, -0.246337890625, -0.2152099609375, -0.18408203125, -0.1529541015625, -0.121826171875, -0.0906982421875, -0.0595703125, -0.0284423828125, 0.002685546875, 0.0338134765625, 0.06494140625, 0.0960693359375, 0.127197265625, 0.1583251953125, 0.189453125, 0.2205810546875, 0.251708984375, 0.2828369140625, 0.31396484375, 0.3450927734375, 0.376220703125, 0.4073486328125, 0.4384765625, 0.4696044921875, 0.500732421875, 0.5318603515625, 0.56298828125, 0.5941162109375, 0.625244140625, 0.6563720703125, 0.6875, 0.7186279296875, 0.749755859375, 0.7808837890625, 0.81201171875, 0.8431396484375, 0.874267578125, 0.9053955078125, 0.9365234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 4.0, 7.0, 8.0, 15.0, 19.0, 21.0, 43.0, 48.0, 61.0, 78.0, 85.0, 104.0, 107.0, 96.0, 76.0, 63.0, 48.0, 24.0, 23.0, 20.0, 11.0, 5.0, 9.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.513014554977417, -3.425304651260376, -3.337594747543335, -3.249885082244873, -3.162175178527832, -3.074465274810791, -2.98675537109375, -2.899045467376709, -2.811335563659668, -2.723625659942627, -2.635915756225586, -2.548205852508545, -2.460496187210083, -2.372786283493042, -2.285076379776001, -2.19736647605896, -2.109656810760498, -2.021946907043457, -1.9342371225357056, -1.8465272188186646, -1.758817434310913, -1.671107530593872, -1.583397626876831, -1.49568772315979, -1.4079779386520386, -1.3202680349349976, -1.232558250427246, -1.144848346710205, -1.057138442993164, -0.9694286584854126, -0.8817187547683716, -0.7940089106559753, -0.706298828125, -0.6185889840126038, -0.5308791399002075, -0.4431692361831665, -0.35545939207077026, -0.267749547958374, -0.180039644241333, -0.09232980012893677, -0.004619956016540527, 0.0830899029970169, 0.17079976201057434, 0.25850963592529297, 0.3462194800376892, 0.43392932415008545, 0.5216392278671265, 0.6093490719795227, 0.697058916091919, 0.7847687602043152, 0.8724786043167114, 0.9601885080337524, 1.047898292541504, 1.135608196258545, 1.223318099975586, 1.311028003692627, 1.3987377882003784, 1.4864476919174194, 1.574157476425171, 1.661867380142212, 1.749577283859253, 1.8372870683670044, 1.9249969720840454, 2.012706756591797, 2.100416660308838]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 7.0, 11.0, 15.0, 12.0, 18.0, 18.0, 26.0, 29.0, 16.0, 28.0, 29.0, 37.0, 48.0, 30.0, 48.0, 56.0, 46.0, 46.0, 45.0, 45.0, 40.0, 36.0, 52.0, 24.0, 34.0, 24.0, 33.0, 25.0, 21.0, 23.0, 16.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.542176604270935, -1.4889832735061646, -1.435789942741394, -1.3825966119766235, -1.3294031620025635, -1.276209831237793, -1.2230165004730225, -1.169823169708252, -1.1166298389434814, -1.063436508178711, -1.0102431774139404, -0.9570497870445251, -0.9038564562797546, -0.8506631255149841, -0.7974697351455688, -0.7442764043807983, -0.6910830736160278, -0.6378897428512573, -0.5846964120864868, -0.5315030217170715, -0.478309690952301, -0.4251163601875305, -0.3719229996204376, -0.3187296390533447, -0.2655363082885742, -0.21234296262264252, -0.15914961695671082, -0.10595627129077911, -0.05276292562484741, 0.0004304051399230957, 0.05362376570701599, 0.10681712627410889, 0.16001033782958984, 0.21320368349552155, 0.26639702916145325, 0.31959038972854614, 0.37278372049331665, 0.42597705125808716, 0.47917041182518005, 0.532363772392273, 0.5855571031570435, 0.638750433921814, 0.6919437646865845, 0.7451371550559998, 0.7983304858207703, 0.8515238165855408, 0.904717206954956, 0.9579105377197266, 1.011103868484497, 1.0642971992492676, 1.117490530014038, 1.1706838607788086, 1.223877191543579, 1.2770705223083496, 1.3302639722824097, 1.3834573030471802, 1.4366506338119507, 1.4898439645767212, 1.5430372953414917, 1.5962306261062622, 1.6494240760803223, 1.7026174068450928, 1.7558107376098633, 1.8090040683746338, 1.8621973991394043]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 3.0, 4.0, 8.0, 6.0, 20.0, 31.0, 30.0, 65.0, 82.0, 170.0, 354.0, 782.0, 1770.0, 4779.0, 13552.0, 44733.0, 241386.0, 604829.0, 97617.0, 24599.0, 8344.0, 3036.0, 1204.0, 568.0, 238.0, 124.0, 72.0, 28.0, 20.0, 21.0, 14.0, 6.0, 7.0, 8.0, 5.0, 5.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1376953125, -1.1024322509765625, -1.067169189453125, -1.0319061279296875, -0.99664306640625, -0.9613800048828125, -0.926116943359375, -0.8908538818359375, -0.8555908203125, -0.8203277587890625, -0.785064697265625, -0.7498016357421875, -0.71453857421875, -0.6792755126953125, -0.644012451171875, -0.6087493896484375, -0.573486328125, -0.5382232666015625, -0.502960205078125, -0.4676971435546875, -0.43243408203125, -0.3971710205078125, -0.361907958984375, -0.3266448974609375, -0.2913818359375, -0.2561187744140625, -0.220855712890625, -0.1855926513671875, -0.15032958984375, -0.1150665283203125, -0.079803466796875, -0.0445404052734375, -0.00927734375, 0.0259857177734375, 0.061248779296875, 0.0965118408203125, 0.13177490234375, 0.1670379638671875, 0.202301025390625, 0.2375640869140625, 0.2728271484375, 0.3080902099609375, 0.343353271484375, 0.3786163330078125, 0.41387939453125, 0.4491424560546875, 0.484405517578125, 0.5196685791015625, 0.554931640625, 0.5901947021484375, 0.625457763671875, 0.6607208251953125, 0.69598388671875, 0.7312469482421875, 0.766510009765625, 0.8017730712890625, 0.8370361328125, 0.8722991943359375, 0.907562255859375, 0.9428253173828125, 0.97808837890625, 1.0133514404296875, 1.048614501953125, 1.0838775634765625, 1.119140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 15.0, 16.0, 23.0, 31.0, 28.0, 39.0, 58.0, 60.0, 69.0, 67.0, 98.0, 88.0, 68.0, 75.0, 58.0, 44.0, 44.0, 37.0, 37.0, 12.0, 7.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -0.9990234375, -0.943359375, -0.8876953125, -0.83203125, -0.7763671875, -0.720703125, -0.6650390625, -0.609375, -0.5537109375, -0.498046875, -0.4423828125, -0.38671875, -0.3310546875, -0.275390625, -0.2197265625, -0.1640625, -0.1083984375, -0.052734375, 0.0029296875, 0.05859375, 0.1142578125, 0.169921875, 0.2255859375, 0.28125, 0.3369140625, 0.392578125, 0.4482421875, 0.50390625, 0.5595703125, 0.615234375, 0.6708984375, 0.7265625, 0.7822265625, 0.837890625, 0.8935546875, 0.94921875, 1.0048828125, 1.060546875, 1.1162109375, 1.171875, 1.2275390625, 1.283203125, 1.3388671875, 1.39453125, 1.4501953125, 1.505859375, 1.5615234375, 1.6171875, 1.6728515625, 1.728515625, 1.7841796875, 1.83984375, 1.8955078125, 1.951171875, 2.0068359375, 2.0625, 2.1181640625, 2.173828125, 2.2294921875, 2.28515625, 2.3408203125, 2.396484375, 2.4521484375, 2.5078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 11.0, 12.0, 9.0, 25.0, 31.0, 49.0, 48.0, 77.0, 125.0, 190.0, 241.0, 402.0, 572.0, 981.0, 1572.0, 2609.0, 4730.0, 8528.0, 16858.0, 35077.0, 81820.0, 225758.0, 386250.0, 161816.0, 62943.0, 27787.0, 13506.0, 6969.0, 3770.0, 2182.0, 1292.0, 802.0, 506.0, 309.0, 212.0, 151.0, 110.0, 59.0, 44.0, 27.0, 27.0, 12.0, 16.0, 10.0, 3.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.40283203125, -0.3903770446777344, -0.37792205810546875, -0.3654670715332031, -0.3530120849609375, -0.3405570983886719, -0.32810211181640625, -0.3156471252441406, -0.303192138671875, -0.2907371520996094, -0.27828216552734375, -0.2658271789550781, -0.2533721923828125, -0.24091720581054688, -0.22846221923828125, -0.21600723266601562, -0.20355224609375, -0.19109725952148438, -0.17864227294921875, -0.16618728637695312, -0.1537322998046875, -0.14127731323242188, -0.12882232666015625, -0.11636734008789062, -0.103912353515625, -0.09145736694335938, -0.07900238037109375, -0.06654739379882812, -0.0540924072265625, -0.041637420654296875, -0.02918243408203125, -0.016727447509765625, -0.0042724609375, 0.008182525634765625, 0.02063751220703125, 0.033092498779296875, 0.0455474853515625, 0.058002471923828125, 0.07045745849609375, 0.08291244506835938, 0.095367431640625, 0.10782241821289062, 0.12027740478515625, 0.13273239135742188, 0.1451873779296875, 0.15764236450195312, 0.17009735107421875, 0.18255233764648438, 0.19500732421875, 0.20746231079101562, 0.21991729736328125, 0.23237228393554688, 0.2448272705078125, 0.2572822570800781, 0.26973724365234375, 0.2821922302246094, 0.294647216796875, 0.3071022033691406, 0.31955718994140625, 0.3320121765136719, 0.3444671630859375, 0.3569221496582031, 0.36937713623046875, 0.3818321228027344, 0.394287109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 1.0, 5.0, 4.0, 2.0, 9.0, 15.0, 12.0, 15.0, 26.0, 31.0, 29.0, 44.0, 42.0, 56.0, 54.0, 74.0, 64.0, 70.0, 65.0, 49.0, 62.0, 54.0, 48.0, 26.0, 32.0, 31.0, 24.0, 17.0, 14.0, 5.0, 5.0, 3.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9453125, -1.870819091796875, -1.79632568359375, -1.721832275390625, -1.6473388671875, -1.572845458984375, -1.49835205078125, -1.423858642578125, -1.349365234375, -1.274871826171875, -1.20037841796875, -1.125885009765625, -1.0513916015625, -0.976898193359375, -0.90240478515625, -0.827911376953125, -0.75341796875, -0.678924560546875, -0.60443115234375, -0.529937744140625, -0.4554443359375, -0.380950927734375, -0.30645751953125, -0.231964111328125, -0.157470703125, -0.082977294921875, -0.00848388671875, 0.066009521484375, 0.1405029296875, 0.214996337890625, 0.28948974609375, 0.363983154296875, 0.4384765625, 0.512969970703125, 0.58746337890625, 0.661956787109375, 0.7364501953125, 0.810943603515625, 0.88543701171875, 0.959930419921875, 1.034423828125, 1.108917236328125, 1.18341064453125, 1.257904052734375, 1.3323974609375, 1.406890869140625, 1.48138427734375, 1.555877685546875, 1.63037109375, 1.704864501953125, 1.77935791015625, 1.853851318359375, 1.9283447265625, 2.002838134765625, 2.07733154296875, 2.151824951171875, 2.226318359375, 2.300811767578125, 2.37530517578125, 2.449798583984375, 2.5242919921875, 2.598785400390625, 2.67327880859375, 2.747772216796875, 2.822265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 10.0, 10.0, 19.0, 35.0, 34.0, 40.0, 67.0, 71.0, 120.0, 237.0, 301.0, 617.0, 945.0, 1992.0, 3941.0, 9020.0, 25878.0, 111436.0, 540507.0, 276307.0, 50463.0, 14724.0, 5651.0, 2730.0, 1381.0, 781.0, 454.0, 261.0, 161.0, 87.0, 70.0, 58.0, 34.0, 24.0, 17.0, 17.0, 17.0, 10.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.18603515625, -0.18017578125, -0.17431640625, -0.16845703125, -0.16259765625, -0.15673828125, -0.15087890625, -0.14501953125, -0.13916015625, -0.13330078125, -0.12744140625, -0.12158203125, -0.11572265625, -0.10986328125, -0.10400390625, -0.09814453125, -0.09228515625, -0.08642578125, -0.08056640625, -0.07470703125, -0.06884765625, -0.06298828125, -0.05712890625, -0.05126953125, -0.04541015625, -0.03955078125, -0.03369140625, -0.02783203125, -0.02197265625, -0.01611328125, -0.01025390625, -0.00439453125, 0.00146484375, 0.00732421875, 0.01318359375, 0.01904296875, 0.02490234375, 0.03076171875, 0.03662109375, 0.04248046875, 0.04833984375, 0.05419921875, 0.06005859375, 0.06591796875, 0.07177734375, 0.07763671875, 0.08349609375, 0.08935546875, 0.09521484375, 0.10107421875, 0.10693359375, 0.11279296875, 0.11865234375, 0.12451171875, 0.13037109375, 0.13623046875, 0.14208984375, 0.14794921875, 0.15380859375, 0.15966796875, 0.16552734375, 0.17138671875, 0.17724609375, 0.18310546875, 0.18896484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 17.0, 14.0, 18.0, 45.0, 33.0, 68.0, 122.0, 143.0, 184.0, 143.0, 65.0, 45.0, 25.0, 21.0, 13.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012826919555664062, -0.00012353435158729553, -0.00011879950761795044, -0.00011406466364860535, -0.00010932981967926025, -0.00010459497570991516, -9.986013174057007e-05, -9.512528777122498e-05, -9.039044380187988e-05, -8.565559983253479e-05, -8.09207558631897e-05, -7.61859118938446e-05, -7.145106792449951e-05, -6.671622395515442e-05, -6.198137998580933e-05, -5.7246536016464233e-05, -5.251169204711914e-05, -4.777684807777405e-05, -4.3042004108428955e-05, -3.830716013908386e-05, -3.357231616973877e-05, -2.8837472200393677e-05, -2.4102628231048584e-05, -1.936778426170349e-05, -1.4632940292358398e-05, -9.898096323013306e-06, -5.163252353668213e-06, -4.284083843231201e-07, 4.306435585021973e-06, 9.041279554367065e-06, 1.3776123523712158e-05, 1.851096749305725e-05, 2.3245811462402344e-05, 2.7980655431747437e-05, 3.271549940109253e-05, 3.745034337043762e-05, 4.2185187339782715e-05, 4.692003130912781e-05, 5.16548752784729e-05, 5.638971924781799e-05, 6.112456321716309e-05, 6.585940718650818e-05, 7.059425115585327e-05, 7.532909512519836e-05, 8.006393909454346e-05, 8.479878306388855e-05, 8.953362703323364e-05, 9.426847100257874e-05, 9.900331497192383e-05, 0.00010373815894126892, 0.00010847300291061401, 0.0001132078468799591, 0.0001179426908493042, 0.0001226775348186493, 0.00012741237878799438, 0.00013214722275733948, 0.00013688206672668457, 0.00014161691069602966, 0.00014635175466537476, 0.00015108659863471985, 0.00015582144260406494, 0.00016055628657341003, 0.00016529113054275513, 0.00017002597451210022, 0.0001747608184814453]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 9.0, 7.0, 7.0, 5.0, 14.0, 16.0, 25.0, 39.0, 48.0, 70.0, 81.0, 114.0, 189.0, 242.0, 407.0, 574.0, 972.0, 1496.0, 2537.0, 4538.0, 9016.0, 20762.0, 59538.0, 227653.0, 469539.0, 169300.0, 46539.0, 16901.0, 7653.0, 4039.0, 2308.0, 1433.0, 783.0, 514.0, 342.0, 251.0, 176.0, 125.0, 81.0, 52.0, 41.0, 32.0, 24.0, 15.0, 13.0, 8.0, 12.0, 4.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.162353515625, -0.15749168395996094, -0.15262985229492188, -0.1477680206298828, -0.14290618896484375, -0.1380443572998047, -0.13318252563476562, -0.12832069396972656, -0.1234588623046875, -0.11859703063964844, -0.11373519897460938, -0.10887336730957031, -0.10401153564453125, -0.09914970397949219, -0.09428787231445312, -0.08942604064941406, -0.084564208984375, -0.07970237731933594, -0.07484054565429688, -0.06997871398925781, -0.06511688232421875, -0.06025505065917969, -0.055393218994140625, -0.05053138732910156, -0.0456695556640625, -0.04080772399902344, -0.035945892333984375, -0.031084060668945312, -0.02622222900390625, -0.021360397338867188, -0.016498565673828125, -0.011636734008789062, -0.00677490234375, -0.0019130706787109375, 0.002948760986328125, 0.0078105926513671875, 0.01267242431640625, 0.017534255981445312, 0.022396087646484375, 0.027257919311523438, 0.0321197509765625, 0.03698158264160156, 0.041843414306640625, 0.04670524597167969, 0.05156707763671875, 0.05642890930175781, 0.061290740966796875, 0.06615257263183594, 0.071014404296875, 0.07587623596191406, 0.08073806762695312, 0.08559989929199219, 0.09046173095703125, 0.09532356262207031, 0.10018539428710938, 0.10504722595214844, 0.1099090576171875, 0.11477088928222656, 0.11963272094726562, 0.12449455261230469, 0.12935638427734375, 0.1342182159423828, 0.13908004760742188, 0.14394187927246094, 0.1488037109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 1.0, 2.0, 6.0, 7.0, 2.0, 8.0, 5.0, 18.0, 11.0, 29.0, 33.0, 59.0, 56.0, 85.0, 96.0, 106.0, 107.0, 105.0, 66.0, 41.0, 32.0, 32.0, 26.0, 14.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051055908203125, -0.049384117126464844, -0.04771232604980469, -0.04604053497314453, -0.044368743896484375, -0.04269695281982422, -0.04102516174316406, -0.039353370666503906, -0.03768157958984375, -0.036009788513183594, -0.03433799743652344, -0.03266620635986328, -0.030994415283203125, -0.02932262420654297, -0.027650833129882812, -0.025979042053222656, -0.0243072509765625, -0.022635459899902344, -0.020963668823242188, -0.01929187774658203, -0.017620086669921875, -0.01594829559326172, -0.014276504516601562, -0.012604713439941406, -0.01093292236328125, -0.009261131286621094, -0.0075893402099609375, -0.005917549133300781, -0.004245758056640625, -0.0025739669799804688, -0.0009021759033203125, 0.0007696151733398438, 0.00244140625, 0.004113197326660156, 0.0057849884033203125, 0.007456779479980469, 0.009128570556640625, 0.010800361633300781, 0.012472152709960938, 0.014143943786621094, 0.01581573486328125, 0.017487525939941406, 0.019159317016601562, 0.02083110809326172, 0.022502899169921875, 0.02417469024658203, 0.025846481323242188, 0.027518272399902344, 0.0291900634765625, 0.030861854553222656, 0.03253364562988281, 0.03420543670654297, 0.035877227783203125, 0.03754901885986328, 0.03922080993652344, 0.040892601013183594, 0.04256439208984375, 0.044236183166503906, 0.04590797424316406, 0.04757976531982422, 0.049251556396484375, 0.05092334747314453, 0.05259513854980469, 0.054266929626464844, 0.055938720703125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 3.0, 8.0, 6.0, 18.0, 13.0, 32.0, 37.0, 55.0, 74.0, 92.0, 125.0, 100.0, 118.0, 96.0, 58.0, 42.0, 33.0, 25.0, 14.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7162421941757202, -1.6597799062728882, -1.6033176183700562, -1.5468553304672241, -1.490393042564392, -1.43393075466156, -1.377468466758728, -1.321006178855896, -1.264543890953064, -1.208081603050232, -1.1516193151474, -1.0951570272445679, -1.0386947393417358, -0.9822324514389038, -0.9257701635360718, -0.8693078756332397, -0.8128455877304077, -0.7563832998275757, -0.6999210119247437, -0.6434587240219116, -0.5869964361190796, -0.5305341482162476, -0.4740718603134155, -0.4176095724105835, -0.36114728450775146, -0.30468499660491943, -0.2482227087020874, -0.19176042079925537, -0.13529813289642334, -0.07883584499359131, -0.022373557090759277, 0.034088730812072754, 0.09055089950561523, 0.14701318740844727, 0.2034754753112793, 0.25993776321411133, 0.31640005111694336, 0.3728623390197754, 0.4293246269226074, 0.48578691482543945, 0.5422492027282715, 0.5987114906311035, 0.6551737785339355, 0.7116360664367676, 0.7680983543395996, 0.8245606422424316, 0.8810229301452637, 0.9374852180480957, 0.9939475059509277, 1.0504097938537598, 1.1068720817565918, 1.1633343696594238, 1.2197966575622559, 1.276258945465088, 1.33272123336792, 1.389183521270752, 1.445645809173584, 1.502108097076416, 1.558570384979248, 1.61503267288208, 1.671494960784912, 1.7279572486877441, 1.7844195365905762, 1.8408818244934082, 1.8973441123962402]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 15.0, 16.0, 23.0, 37.0, 45.0, 39.0, 46.0, 66.0, 81.0, 89.0, 74.0, 68.0, 76.0, 65.0, 55.0, 50.0, 43.0, 26.0, 28.0, 18.0, 5.0, 5.0, 9.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.026350736618042, -0.9734401106834412, -0.9205294847488403, -0.8676189184188843, -0.8147082924842834, -0.7617976665496826, -0.7088870406150818, -0.655976414680481, -0.6030658483505249, -0.5501552224159241, -0.49724462628364563, -0.4443340003490448, -0.39142340421676636, -0.3385127782821655, -0.2856021523475647, -0.23269155621528625, -0.17978090047836304, -0.1268702894449234, -0.07395967096090317, -0.021049052476882935, 0.0318615585565567, 0.08477216958999634, 0.13768279552459717, 0.1905933916568756, 0.24350401759147644, 0.29641464352607727, 0.3493252396583557, 0.40223586559295654, 0.4551464915275574, 0.5080571174621582, 0.5609676837921143, 0.6138783097267151, 0.6667889356613159, 0.7196995615959167, 0.7726101875305176, 0.8255207538604736, 0.8784313797950745, 0.9313420057296753, 0.9842526316642761, 1.037163257598877, 1.090073823928833, 1.142984390258789, 1.1958950757980347, 1.2488056421279907, 1.3017163276672363, 1.3546268939971924, 1.4075374603271484, 1.460448145866394, 1.5133588314056396, 1.5662693977355957, 1.6191800832748413, 1.6720906496047974, 1.725001335144043, 1.777911901473999, 1.830822467803955, 1.8837331533432007, 1.9366437196731567, 1.9895542860031128, 2.0424649715423584, 2.0953755378723145, 2.1482861042022705, 2.2011966705322266, 2.2541074752807617, 2.3070180416107178, 2.359928607940674]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 1.0, 14.0, 10.0, 25.0, 25.0, 28.0, 55.0, 62.0, 94.0, 123.0, 207.0, 265.0, 345.0, 526.0, 822.0, 1146.0, 1768.0, 2706.0, 4422.0, 8017.0, 15830.0, 37824.0, 123136.0, 547042.0, 205484.0, 53515.0, 20599.0, 9617.0, 5356.0, 3164.0, 2034.0, 1326.0, 934.0, 555.0, 426.0, 323.0, 238.0, 142.0, 114.0, 75.0, 52.0, 30.0, 26.0, 17.0, 15.0, 10.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.017578125, -0.985443115234375, -0.95330810546875, -0.921173095703125, -0.8890380859375, -0.856903076171875, -0.82476806640625, -0.792633056640625, -0.760498046875, -0.728363037109375, -0.69622802734375, -0.664093017578125, -0.6319580078125, -0.599822998046875, -0.56768798828125, -0.535552978515625, -0.50341796875, -0.471282958984375, -0.43914794921875, -0.407012939453125, -0.3748779296875, -0.342742919921875, -0.31060791015625, -0.278472900390625, -0.246337890625, -0.214202880859375, -0.18206787109375, -0.149932861328125, -0.1177978515625, -0.085662841796875, -0.05352783203125, -0.021392822265625, 0.0107421875, 0.042877197265625, 0.07501220703125, 0.107147216796875, 0.1392822265625, 0.171417236328125, 0.20355224609375, 0.235687255859375, 0.267822265625, 0.299957275390625, 0.33209228515625, 0.364227294921875, 0.3963623046875, 0.428497314453125, 0.46063232421875, 0.492767333984375, 0.52490234375, 0.557037353515625, 0.58917236328125, 0.621307373046875, 0.6534423828125, 0.685577392578125, 0.71771240234375, 0.749847412109375, 0.781982421875, 0.814117431640625, 0.84625244140625, 0.878387451171875, 0.9105224609375, 0.942657470703125, 0.97479248046875, 1.006927490234375, 1.0390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 14.0, 10.0, 10.0, 22.0, 25.0, 38.0, 41.0, 43.0, 55.0, 69.0, 77.0, 79.0, 86.0, 67.0, 90.0, 67.0, 52.0, 43.0, 34.0, 29.0, 16.0, 10.0, 10.0, 5.0, 7.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.18115234375, -2.0771484375, -1.97314453125, -1.869140625, -1.76513671875, -1.6611328125, -1.55712890625, -1.453125, -1.34912109375, -1.2451171875, -1.14111328125, -1.037109375, -0.93310546875, -0.8291015625, -0.72509765625, -0.62109375, -0.51708984375, -0.4130859375, -0.30908203125, -0.205078125, -0.10107421875, 0.0029296875, 0.10693359375, 0.2109375, 0.31494140625, 0.4189453125, 0.52294921875, 0.626953125, 0.73095703125, 0.8349609375, 0.93896484375, 1.04296875, 1.14697265625, 1.2509765625, 1.35498046875, 1.458984375, 1.56298828125, 1.6669921875, 1.77099609375, 1.875, 1.97900390625, 2.0830078125, 2.18701171875, 2.291015625, 2.39501953125, 2.4990234375, 2.60302734375, 2.70703125, 2.81103515625, 2.9150390625, 3.01904296875, 3.123046875, 3.22705078125, 3.3310546875, 3.43505859375, 3.5390625, 3.64306640625, 3.7470703125, 3.85107421875, 3.955078125, 4.05908203125, 4.1630859375, 4.26708984375, 4.37109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 7.0, 11.0, 8.0, 12.0, 17.0, 18.0, 21.0, 24.0, 31.0, 40.0, 39.0, 45.0, 88.0, 119.0, 636.0, 8420.0, 994516.0, 42276.0, 1603.0, 205.0, 77.0, 52.0, 47.0, 48.0, 25.0, 35.0, 18.0, 11.0, 17.0, 17.0, 14.0, 13.0, 12.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-8.3515625, -8.10382080078125, -7.8560791015625, -7.60833740234375, -7.360595703125, -7.11285400390625, -6.8651123046875, -6.61737060546875, -6.36962890625, -6.12188720703125, -5.8741455078125, -5.62640380859375, -5.378662109375, -5.13092041015625, -4.8831787109375, -4.63543701171875, -4.3876953125, -4.13995361328125, -3.8922119140625, -3.64447021484375, -3.396728515625, -3.14898681640625, -2.9012451171875, -2.65350341796875, -2.40576171875, -2.15802001953125, -1.9102783203125, -1.66253662109375, -1.414794921875, -1.16705322265625, -0.9193115234375, -0.67156982421875, -0.423828125, -0.17608642578125, 0.0716552734375, 0.31939697265625, 0.567138671875, 0.81488037109375, 1.0626220703125, 1.31036376953125, 1.55810546875, 1.80584716796875, 2.0535888671875, 2.30133056640625, 2.549072265625, 2.79681396484375, 3.0445556640625, 3.29229736328125, 3.5400390625, 3.78778076171875, 4.0355224609375, 4.28326416015625, 4.531005859375, 4.77874755859375, 5.0264892578125, 5.27423095703125, 5.52197265625, 5.76971435546875, 6.0174560546875, 6.26519775390625, 6.512939453125, 6.76068115234375, 7.0084228515625, 7.25616455078125, 7.50390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 7.0, 12.0, 15.0, 20.0, 22.0, 25.0, 25.0, 32.0, 37.0, 31.0, 50.0, 42.0, 48.0, 46.0, 52.0, 47.0, 51.0, 41.0, 38.0, 38.0, 43.0, 31.0, 36.0, 26.0, 32.0, 22.0, 23.0, 18.0, 19.0, 15.0, 9.0, 8.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.8883056640625, -1.821533203125, -1.7547607421875, -1.68798828125, -1.6212158203125, -1.554443359375, -1.4876708984375, -1.4208984375, -1.3541259765625, -1.287353515625, -1.2205810546875, -1.15380859375, -1.0870361328125, -1.020263671875, -0.9534912109375, -0.88671875, -0.8199462890625, -0.753173828125, -0.6864013671875, -0.61962890625, -0.5528564453125, -0.486083984375, -0.4193115234375, -0.3525390625, -0.2857666015625, -0.218994140625, -0.1522216796875, -0.08544921875, -0.0186767578125, 0.048095703125, 0.1148681640625, 0.181640625, 0.2484130859375, 0.315185546875, 0.3819580078125, 0.44873046875, 0.5155029296875, 0.582275390625, 0.6490478515625, 0.7158203125, 0.7825927734375, 0.849365234375, 0.9161376953125, 0.98291015625, 1.0496826171875, 1.116455078125, 1.1832275390625, 1.25, 1.3167724609375, 1.383544921875, 1.4503173828125, 1.51708984375, 1.5838623046875, 1.650634765625, 1.7174072265625, 1.7841796875, 1.8509521484375, 1.917724609375, 1.9844970703125, 2.05126953125, 2.1180419921875, 2.184814453125, 2.2515869140625, 2.318359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 7.0, 3.0, 4.0, 19.0, 30.0, 54.0, 92.0, 172.0, 387.0, 1057.0, 4290.0, 45112.0, 964552.0, 27935.0, 3269.0, 848.0, 345.0, 157.0, 77.0, 45.0, 28.0, 22.0, 15.0, 12.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9736328125, -0.9259796142578125, -0.878326416015625, -0.8306732177734375, -0.78302001953125, -0.7353668212890625, -0.687713623046875, -0.6400604248046875, -0.5924072265625, -0.5447540283203125, -0.497100830078125, -0.4494476318359375, -0.40179443359375, -0.3541412353515625, -0.306488037109375, -0.2588348388671875, -0.211181640625, -0.1635284423828125, -0.115875244140625, -0.0682220458984375, -0.02056884765625, 0.0270843505859375, 0.074737548828125, 0.1223907470703125, 0.1700439453125, 0.2176971435546875, 0.265350341796875, 0.3130035400390625, 0.36065673828125, 0.4083099365234375, 0.455963134765625, 0.5036163330078125, 0.55126953125, 0.5989227294921875, 0.646575927734375, 0.6942291259765625, 0.74188232421875, 0.7895355224609375, 0.837188720703125, 0.8848419189453125, 0.9324951171875, 0.9801483154296875, 1.027801513671875, 1.0754547119140625, 1.12310791015625, 1.1707611083984375, 1.218414306640625, 1.2660675048828125, 1.313720703125, 1.3613739013671875, 1.409027099609375, 1.4566802978515625, 1.50433349609375, 1.5519866943359375, 1.599639892578125, 1.6472930908203125, 1.6949462890625, 1.7425994873046875, 1.790252685546875, 1.8379058837890625, 1.88555908203125, 1.9332122802734375, 1.980865478515625, 2.0285186767578125, 2.076171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 12.0, 27.0, 33.0, 75.0, 151.0, 322.0, 184.0, 88.0, 47.0, 20.0, 7.0, 9.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022733211517333984, -0.00022200308740139008, -0.0002166740596294403, -0.00021134503185749054, -0.00020601600408554077, -0.000200686976313591, -0.00019535794854164124, -0.00019002892076969147, -0.0001846998929977417, -0.00017937086522579193, -0.00017404183745384216, -0.0001687128096818924, -0.00016338378190994263, -0.00015805475413799286, -0.0001527257263660431, -0.00014739669859409332, -0.00014206767082214355, -0.0001367386430501938, -0.00013140961527824402, -0.00012608058750629425, -0.00012075155973434448, -0.00011542253196239471, -0.00011009350419044495, -0.00010476447641849518, -9.943544864654541e-05, -9.410642087459564e-05, -8.877739310264587e-05, -8.34483653306961e-05, -7.811933755874634e-05, -7.279030978679657e-05, -6.74612820148468e-05, -6.213225424289703e-05, -5.6803226470947266e-05, -5.14741986989975e-05, -4.614517092704773e-05, -4.081614315509796e-05, -3.548711538314819e-05, -3.0158087611198425e-05, -2.4829059839248657e-05, -1.950003206729889e-05, -1.4171004295349121e-05, -8.841976523399353e-06, -3.512948751449585e-06, 1.816079020500183e-06, 7.145106792449951e-06, 1.247413456439972e-05, 1.7803162336349487e-05, 2.3132190108299255e-05, 2.8461217880249023e-05, 3.379024565219879e-05, 3.911927342414856e-05, 4.444830119609833e-05, 4.9777328968048096e-05, 5.5106356739997864e-05, 6.043538451194763e-05, 6.57644122838974e-05, 7.109344005584717e-05, 7.642246782779694e-05, 8.17514955997467e-05, 8.708052337169647e-05, 9.240955114364624e-05, 9.773857891559601e-05, 0.00010306760668754578, 0.00010839663445949554, 0.00011372566223144531]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 5.0, 4.0, 13.0, 20.0, 29.0, 41.0, 86.0, 95.0, 144.0, 244.0, 495.0, 904.0, 1809.0, 4231.0, 13512.0, 101330.0, 818044.0, 86986.0, 12631.0, 4084.0, 1754.0, 853.0, 499.0, 259.0, 169.0, 94.0, 56.0, 46.0, 29.0, 24.0, 21.0, 13.0, 10.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.849609375, -0.8242263793945312, -0.7988433837890625, -0.7734603881835938, -0.748077392578125, -0.7226943969726562, -0.6973114013671875, -0.6719284057617188, -0.64654541015625, -0.6211624145507812, -0.5957794189453125, -0.5703964233398438, -0.545013427734375, -0.5196304321289062, -0.4942474365234375, -0.46886444091796875, -0.4434814453125, -0.41809844970703125, -0.3927154541015625, -0.36733245849609375, -0.341949462890625, -0.31656646728515625, -0.2911834716796875, -0.26580047607421875, -0.24041748046875, -0.21503448486328125, -0.1896514892578125, -0.16426849365234375, -0.138885498046875, -0.11350250244140625, -0.0881195068359375, -0.06273651123046875, -0.037353515625, -0.01197052001953125, 0.0134124755859375, 0.03879547119140625, 0.064178466796875, 0.08956146240234375, 0.1149444580078125, 0.14032745361328125, 0.16571044921875, 0.19109344482421875, 0.2164764404296875, 0.24185943603515625, 0.267242431640625, 0.29262542724609375, 0.3180084228515625, 0.34339141845703125, 0.3687744140625, 0.39415740966796875, 0.4195404052734375, 0.44492340087890625, 0.470306396484375, 0.49568939208984375, 0.5210723876953125, 0.5464553833007812, 0.57183837890625, 0.5972213745117188, 0.6226043701171875, 0.6479873657226562, 0.673370361328125, 0.6987533569335938, 0.7241363525390625, 0.7495193481445312, 0.77490234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 19.0, 33.0, 58.0, 118.0, 143.0, 235.0, 137.0, 101.0, 62.0, 34.0, 15.0, 12.0, 7.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4111328125, -0.39762115478515625, -0.3841094970703125, -0.37059783935546875, -0.357086181640625, -0.34357452392578125, -0.3300628662109375, -0.31655120849609375, -0.30303955078125, -0.28952789306640625, -0.2760162353515625, -0.26250457763671875, -0.248992919921875, -0.23548126220703125, -0.2219696044921875, -0.20845794677734375, -0.1949462890625, -0.18143463134765625, -0.1679229736328125, -0.15441131591796875, -0.140899658203125, -0.12738800048828125, -0.1138763427734375, -0.10036468505859375, -0.08685302734375, -0.07334136962890625, -0.0598297119140625, -0.04631805419921875, -0.032806396484375, -0.01929473876953125, -0.0057830810546875, 0.00772857666015625, 0.021240234375, 0.03475189208984375, 0.0482635498046875, 0.06177520751953125, 0.075286865234375, 0.08879852294921875, 0.1023101806640625, 0.11582183837890625, 0.12933349609375, 0.14284515380859375, 0.1563568115234375, 0.16986846923828125, 0.183380126953125, 0.19689178466796875, 0.2104034423828125, 0.22391510009765625, 0.2374267578125, 0.25093841552734375, 0.2644500732421875, 0.27796173095703125, 0.291473388671875, 0.30498504638671875, 0.3184967041015625, 0.33200836181640625, 0.34552001953125, 0.35903167724609375, 0.3725433349609375, 0.38605499267578125, 0.399566650390625, 0.41307830810546875, 0.4265899658203125, 0.44010162353515625, 0.45361328125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 20.0, 47.0, 104.0, 233.0, 313.0, 179.0, 65.0, 24.0, 17.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6970584392547607, -2.3720474243164062, -2.0470364093780518, -1.7220252752304077, -1.3970142602920532, -1.0720032453536987, -0.7469921112060547, -0.4219810962677002, -0.0969700813293457, 0.22804096341133118, 0.5530520081520081, 0.8780630826950073, 1.2030740976333618, 1.5280851125717163, 1.8530962467193604, 2.178107261657715, 2.5031182765960693, 2.828129291534424, 3.1531403064727783, 3.478151321411133, 3.8031625747680664, 4.128173351287842, 4.453184604644775, 4.778195381164551, 5.103206634521484, 5.428217887878418, 5.753228664398193, 6.078239917755127, 6.403250694274902, 6.728261947631836, 7.0532732009887695, 7.378283977508545, 7.703295707702637, 8.02830696105957, 8.353318214416504, 8.678328514099121, 9.003339767456055, 9.328351020812988, 9.653362274169922, 9.978372573852539, 10.303383827209473, 10.628395080566406, 10.95340633392334, 11.278416633605957, 11.60342788696289, 11.928439140319824, 12.253450393676758, 12.578460693359375, 12.903472900390625, 13.228484153747559, 13.553495407104492, 13.87850570678711, 14.203516960144043, 14.528528213500977, 14.85353946685791, 15.178550720214844, 15.503561019897461, 15.828572273254395, 16.153583526611328, 16.478593826293945, 16.803606033325195, 17.128616333007812, 17.45362663269043, 17.77863883972168, 18.103649139404297]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 6.0, 9.0, 6.0, 8.0, 18.0, 16.0, 15.0, 23.0, 26.0, 19.0, 39.0, 27.0, 44.0, 55.0, 53.0, 59.0, 42.0, 44.0, 51.0, 59.0, 49.0, 42.0, 47.0, 38.0, 43.0, 28.0, 22.0, 17.0, 23.0, 18.0, 7.0, 13.0, 7.0, 8.0, 4.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0049030780792236, -2.897496461868286, -2.7900896072387695, -2.682682991027832, -2.5752763748168945, -2.467869758605957, -2.3604631423950195, -2.253056287765503, -2.1456496715545654, -2.038243055343628, -1.9308363199234009, -1.8234295845031738, -1.7160229682922363, -1.6086163520812988, -1.5012096166610718, -1.3938028812408447, -1.2863962650299072, -1.1789896488189697, -1.0715829133987427, -0.9641762375831604, -0.8567695617675781, -0.7493628859519958, -0.6419562101364136, -0.5345495343208313, -0.427142858505249, -0.31973618268966675, -0.21232950687408447, -0.1049228310585022, 0.002483844757080078, 0.10989052057266235, 0.21729719638824463, 0.3247038722038269, 0.4321105480194092, 0.5395172238349915, 0.6469238996505737, 0.754330575466156, 0.8617372512817383, 0.9691439270973206, 1.0765506029129028, 1.1839573383331299, 1.2913639545440674, 1.3987705707550049, 1.506177306175232, 1.613584041595459, 1.7209906578063965, 1.828397274017334, 1.935804009437561, 2.043210744857788, 2.1506173610687256, 2.258023977279663, 2.3654308319091797, 2.472837448120117, 2.5802440643310547, 2.687650680541992, 2.7950572967529297, 2.9024641513824463, 3.009870767593384, 3.1172773838043213, 3.224684238433838, 3.3320908546447754, 3.439497470855713, 3.5469040870666504, 3.654310703277588, 3.7617175579071045, 3.869124174118042]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 11.0, 12.0, 15.0, 19.0, 24.0, 32.0, 53.0, 77.0, 85.0, 104.0, 142.0, 163.0, 217.0, 251.0, 365.0, 598.0, 906.0, 1427.0, 2432.0, 5175.0, 17227.0, 102406.0, 881280.0, 2528036.0, 563739.0, 67542.0, 11799.0, 4112.0, 2031.0, 1225.0, 758.0, 527.0, 382.0, 302.0, 185.0, 126.0, 91.0, 87.0, 63.0, 53.0, 49.0, 31.0, 24.0, 15.0, 17.0, 15.0, 15.0, 10.0, 7.0, 4.0, 1.0, 8.0, 3.0, 3.0, 3.0, 3.0], "bins": [-2.390625, -2.314483642578125, -2.23834228515625, -2.162200927734375, -2.0860595703125, -2.009918212890625, -1.93377685546875, -1.857635498046875, -1.781494140625, -1.705352783203125, -1.62921142578125, -1.553070068359375, -1.4769287109375, -1.400787353515625, -1.32464599609375, -1.248504638671875, -1.17236328125, -1.096221923828125, -1.02008056640625, -0.943939208984375, -0.8677978515625, -0.791656494140625, -0.71551513671875, -0.639373779296875, -0.563232421875, -0.487091064453125, -0.41094970703125, -0.334808349609375, -0.2586669921875, -0.182525634765625, -0.10638427734375, -0.030242919921875, 0.0458984375, 0.122039794921875, 0.19818115234375, 0.274322509765625, 0.3504638671875, 0.426605224609375, 0.50274658203125, 0.578887939453125, 0.655029296875, 0.731170654296875, 0.80731201171875, 0.883453369140625, 0.9595947265625, 1.035736083984375, 1.11187744140625, 1.188018798828125, 1.26416015625, 1.340301513671875, 1.41644287109375, 1.492584228515625, 1.5687255859375, 1.644866943359375, 1.72100830078125, 1.797149658203125, 1.873291015625, 1.949432373046875, 2.02557373046875, 2.101715087890625, 2.1778564453125, 2.253997802734375, 2.33013916015625, 2.406280517578125, 2.482421875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 5.0, 9.0, 11.0, 19.0, 10.0, 16.0, 30.0, 18.0, 18.0, 44.0, 32.0, 38.0, 37.0, 37.0, 38.0, 49.0, 57.0, 40.0, 35.0, 45.0, 52.0, 43.0, 37.0, 34.0, 40.0, 27.0, 25.0, 17.0, 21.0, 20.0, 15.0, 15.0, 11.0, 9.0, 9.0, 7.0, 4.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4345703125, -1.3902435302734375, -1.345916748046875, -1.3015899658203125, -1.25726318359375, -1.2129364013671875, -1.168609619140625, -1.1242828369140625, -1.0799560546875, -1.0356292724609375, -0.991302490234375, -0.9469757080078125, -0.90264892578125, -0.8583221435546875, -0.813995361328125, -0.7696685791015625, -0.725341796875, -0.6810150146484375, -0.636688232421875, -0.5923614501953125, -0.54803466796875, -0.5037078857421875, -0.459381103515625, -0.4150543212890625, -0.3707275390625, -0.3264007568359375, -0.282073974609375, -0.2377471923828125, -0.19342041015625, -0.1490936279296875, -0.104766845703125, -0.0604400634765625, -0.01611328125, 0.0282135009765625, 0.072540283203125, 0.1168670654296875, 0.16119384765625, 0.2055206298828125, 0.249847412109375, 0.2941741943359375, 0.3385009765625, 0.3828277587890625, 0.427154541015625, 0.4714813232421875, 0.51580810546875, 0.5601348876953125, 0.604461669921875, 0.6487884521484375, 0.693115234375, 0.7374420166015625, 0.781768798828125, 0.8260955810546875, 0.87042236328125, 0.9147491455078125, 0.959075927734375, 1.0034027099609375, 1.0477294921875, 1.0920562744140625, 1.136383056640625, 1.1807098388671875, 1.22503662109375, 1.2693634033203125, 1.313690185546875, 1.3580169677734375, 1.40234375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 8.0, 13.0, 20.0, 42.0, 52.0, 138.0, 250.0, 543.0, 1417.0, 4287.0, 18573.0, 195568.0, 3747551.0, 200162.0, 18682.0, 4402.0, 1457.0, 592.0, 240.0, 132.0, 64.0, 42.0, 16.0, 13.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.073883056640625, -3.96807861328125, -3.862274169921875, -3.7564697265625, -3.650665283203125, -3.54486083984375, -3.439056396484375, -3.333251953125, -3.227447509765625, -3.12164306640625, -3.015838623046875, -2.9100341796875, -2.804229736328125, -2.69842529296875, -2.592620849609375, -2.48681640625, -2.381011962890625, -2.27520751953125, -2.169403076171875, -2.0635986328125, -1.957794189453125, -1.85198974609375, -1.746185302734375, -1.640380859375, -1.534576416015625, -1.42877197265625, -1.322967529296875, -1.2171630859375, -1.111358642578125, -1.00555419921875, -0.899749755859375, -0.7939453125, -0.688140869140625, -0.58233642578125, -0.476531982421875, -0.3707275390625, -0.264923095703125, -0.15911865234375, -0.053314208984375, 0.052490234375, 0.158294677734375, 0.26409912109375, 0.369903564453125, 0.4757080078125, 0.581512451171875, 0.68731689453125, 0.793121337890625, 0.89892578125, 1.004730224609375, 1.11053466796875, 1.216339111328125, 1.3221435546875, 1.427947998046875, 1.53375244140625, 1.639556884765625, 1.745361328125, 1.851165771484375, 1.95697021484375, 2.062774658203125, 2.1685791015625, 2.274383544921875, 2.38018798828125, 2.485992431640625, 2.591796875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 6.0, 10.0, 14.0, 19.0, 27.0, 33.0, 54.0, 85.0, 127.0, 248.0, 438.0, 608.0, 751.0, 595.0, 397.0, 222.0, 142.0, 77.0, 65.0, 37.0, 34.0, 16.0, 9.0, 11.0, 11.0, 5.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6650390625, -0.6416778564453125, -0.618316650390625, -0.5949554443359375, -0.57159423828125, -0.5482330322265625, -0.524871826171875, -0.5015106201171875, -0.4781494140625, -0.4547882080078125, -0.431427001953125, -0.4080657958984375, -0.38470458984375, -0.3613433837890625, -0.337982177734375, -0.3146209716796875, -0.291259765625, -0.2678985595703125, -0.244537353515625, -0.2211761474609375, -0.19781494140625, -0.1744537353515625, -0.151092529296875, -0.1277313232421875, -0.1043701171875, -0.0810089111328125, -0.057647705078125, -0.0342864990234375, -0.01092529296875, 0.0124359130859375, 0.035797119140625, 0.0591583251953125, 0.08251953125, 0.1058807373046875, 0.129241943359375, 0.1526031494140625, 0.17596435546875, 0.1993255615234375, 0.222686767578125, 0.2460479736328125, 0.2694091796875, 0.2927703857421875, 0.316131591796875, 0.3394927978515625, 0.36285400390625, 0.3862152099609375, 0.409576416015625, 0.4329376220703125, 0.456298828125, 0.4796600341796875, 0.503021240234375, 0.5263824462890625, 0.54974365234375, 0.5731048583984375, 0.596466064453125, 0.6198272705078125, 0.6431884765625, 0.6665496826171875, 0.689910888671875, 0.7132720947265625, 0.73663330078125, 0.7599945068359375, 0.783355712890625, 0.8067169189453125, 0.830078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 14.0, 9.0, 15.0, 20.0, 24.0, 23.0, 31.0, 39.0, 45.0, 60.0, 64.0, 84.0, 83.0, 74.0, 100.0, 58.0, 53.0, 53.0, 28.0, 24.0, 17.0, 13.0, 11.0, 10.0, 10.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8108224868774414, -1.7480031251907349, -1.6851836442947388, -1.6223642826080322, -1.5595448017120361, -1.4967254400253296, -1.433906078338623, -1.371086597442627, -1.3082672357559204, -1.2454478740692139, -1.1826283931732178, -1.1198090314865112, -1.0569896697998047, -0.9941701889038086, -0.931350827217102, -0.8685314059257507, -0.8057119846343994, -0.7428925633430481, -0.6800731420516968, -0.6172537803649902, -0.5544343590736389, -0.4916149377822876, -0.42879554629325867, -0.36597615480422974, -0.3031567335128784, -0.2403373271226883, -0.17751792073249817, -0.11469851434230804, -0.05187910795211792, 0.010940313339233398, 0.07375970482826233, 0.13657909631729126, 0.19939851760864258, 0.2622179388999939, 0.3250373303890228, 0.38785672187805176, 0.4506761431694031, 0.5134955644607544, 0.5763149261474609, 0.6391343474388123, 0.7019537687301636, 0.7647731900215149, 0.8275926113128662, 0.8904119729995728, 0.9532313942909241, 1.0160508155822754, 1.078870177268982, 1.1416895389556885, 1.2045090198516846, 1.2673283815383911, 1.3301478624343872, 1.3929672241210938, 1.4557867050170898, 1.5186060667037964, 1.581425428390503, 1.644244909286499, 1.7070642709732056, 1.769883632659912, 1.8327031135559082, 1.8955224752426147, 1.9583418369293213, 2.0211613178253174, 2.0839807987213135, 2.1468000411987305, 2.2096195220947266]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 4.0, 8.0, 6.0, 10.0, 7.0, 13.0, 10.0, 15.0, 19.0, 10.0, 16.0, 25.0, 39.0, 22.0, 28.0, 41.0, 38.0, 44.0, 45.0, 31.0, 45.0, 38.0, 49.0, 40.0, 37.0, 29.0, 24.0, 37.0, 30.0, 33.0, 35.0, 34.0, 18.0, 16.0, 17.0, 16.0, 11.0, 10.0, 8.0, 4.0, 9.0, 7.0, 1.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.416862964630127, -1.375201940536499, -1.3335410356521606, -1.2918800115585327, -1.2502191066741943, -1.2085580825805664, -1.1668970584869385, -1.1252360343933105, -1.0835751295089722, -1.0419141054153442, -1.0002532005310059, -0.9585921764373779, -0.9169312119483948, -0.8752702474594116, -0.8336092233657837, -0.7919482588768005, -0.7502872943878174, -0.7086263298988342, -0.6669653654098511, -0.6253043413162231, -0.58364337682724, -0.5419824123382568, -0.5003213882446289, -0.45866042375564575, -0.4169994592666626, -0.37533849477767944, -0.3336775004863739, -0.29201650619506836, -0.2503555417060852, -0.20869456231594086, -0.1670335829257965, -0.12537258863449097, -0.08371162414550781, -0.042050644755363464, -0.0003896653652191162, 0.04127131402492523, 0.08293229341506958, 0.12459327280521393, 0.16625425219535828, 0.20791524648666382, 0.24957621097564697, 0.2912371754646301, 0.33289816975593567, 0.3745591640472412, 0.41622012853622437, 0.4578810930252075, 0.49954208731651306, 0.5412030816078186, 0.5828640460968018, 0.6245250105857849, 0.6661859750747681, 0.707846999168396, 0.7495079636573792, 0.7911689281463623, 0.8328299522399902, 0.8744909167289734, 0.9161518812179565, 0.9578128457069397, 0.9994738101959229, 1.0411348342895508, 1.0827958583831787, 1.124456763267517, 1.166117787361145, 1.2077786922454834, 1.2494397163391113]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 13.0, 11.0, 25.0, 33.0, 61.0, 97.0, 241.0, 380.0, 913.0, 1902.0, 4693.0, 12713.0, 54116.0, 734344.0, 201335.0, 24453.0, 7710.0, 2961.0, 1226.0, 626.0, 313.0, 164.0, 75.0, 55.0, 26.0, 22.0, 18.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.29296875, -1.254669189453125, -1.21636962890625, -1.178070068359375, -1.1397705078125, -1.101470947265625, -1.06317138671875, -1.024871826171875, -0.986572265625, -0.948272705078125, -0.90997314453125, -0.871673583984375, -0.8333740234375, -0.795074462890625, -0.75677490234375, -0.718475341796875, -0.68017578125, -0.641876220703125, -0.60357666015625, -0.565277099609375, -0.5269775390625, -0.488677978515625, -0.45037841796875, -0.412078857421875, -0.373779296875, -0.335479736328125, -0.29718017578125, -0.258880615234375, -0.2205810546875, -0.182281494140625, -0.14398193359375, -0.105682373046875, -0.0673828125, -0.029083251953125, 0.00921630859375, 0.047515869140625, 0.0858154296875, 0.124114990234375, 0.16241455078125, 0.200714111328125, 0.239013671875, 0.277313232421875, 0.31561279296875, 0.353912353515625, 0.3922119140625, 0.430511474609375, 0.46881103515625, 0.507110595703125, 0.54541015625, 0.583709716796875, 0.62200927734375, 0.660308837890625, 0.6986083984375, 0.736907958984375, 0.77520751953125, 0.813507080078125, 0.851806640625, 0.890106201171875, 0.92840576171875, 0.966705322265625, 1.0050048828125, 1.043304443359375, 1.08160400390625, 1.119903564453125, 1.158203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 10.0, 18.0, 11.0, 24.0, 23.0, 33.0, 38.0, 43.0, 60.0, 62.0, 71.0, 66.0, 79.0, 69.0, 50.0, 43.0, 58.0, 35.0, 54.0, 37.0, 28.0, 18.0, 11.0, 13.0, 10.0, 6.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8438644409179688, -0.8044281005859375, -0.7649917602539062, -0.725555419921875, -0.6861190795898438, -0.6466827392578125, -0.6072463989257812, -0.56781005859375, -0.5283737182617188, -0.4889373779296875, -0.44950103759765625, -0.410064697265625, -0.37062835693359375, -0.3311920166015625, -0.29175567626953125, -0.2523193359375, -0.21288299560546875, -0.1734466552734375, -0.13401031494140625, -0.094573974609375, -0.05513763427734375, -0.0157012939453125, 0.02373504638671875, 0.06317138671875, 0.10260772705078125, 0.1420440673828125, 0.18148040771484375, 0.220916748046875, 0.26035308837890625, 0.2997894287109375, 0.33922576904296875, 0.378662109375, 0.41809844970703125, 0.4575347900390625, 0.49697113037109375, 0.536407470703125, 0.5758438110351562, 0.6152801513671875, 0.6547164916992188, 0.69415283203125, 0.7335891723632812, 0.7730255126953125, 0.8124618530273438, 0.851898193359375, 0.8913345336914062, 0.9307708740234375, 0.9702072143554688, 1.0096435546875, 1.0490798950195312, 1.0885162353515625, 1.1279525756835938, 1.167388916015625, 1.2068252563476562, 1.2462615966796875, 1.2856979370117188, 1.32513427734375, 1.3645706176757812, 1.4040069580078125, 1.4434432983398438, 1.482879638671875, 1.5223159790039062, 1.5617523193359375, 1.6011886596679688, 1.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 8.0, 3.0, 6.0, 6.0, 17.0, 20.0, 25.0, 41.0, 65.0, 90.0, 126.0, 201.0, 286.0, 406.0, 656.0, 979.0, 1589.0, 2768.0, 4835.0, 8822.0, 16944.0, 35915.0, 90356.0, 267321.0, 372340.0, 143313.0, 51979.0, 23015.0, 11303.0, 6115.0, 3442.0, 2003.0, 1187.0, 791.0, 511.0, 317.0, 219.0, 165.0, 116.0, 79.0, 63.0, 32.0, 23.0, 22.0, 12.0, 7.0, 10.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.31982421875, -0.3107414245605469, -0.30165863037109375, -0.2925758361816406, -0.2834930419921875, -0.2744102478027344, -0.26532745361328125, -0.2562446594238281, -0.247161865234375, -0.23807907104492188, -0.22899627685546875, -0.21991348266601562, -0.2108306884765625, -0.20174789428710938, -0.19266510009765625, -0.18358230590820312, -0.17449951171875, -0.16541671752929688, -0.15633392333984375, -0.14725112915039062, -0.1381683349609375, -0.12908554077148438, -0.12000274658203125, -0.11091995239257812, -0.101837158203125, -0.09275436401367188, -0.08367156982421875, -0.07458877563476562, -0.0655059814453125, -0.056423187255859375, -0.04734039306640625, -0.038257598876953125, -0.0291748046875, -0.020092010498046875, -0.01100921630859375, -0.001926422119140625, 0.0071563720703125, 0.016239166259765625, 0.02532196044921875, 0.034404754638671875, 0.043487548828125, 0.052570343017578125, 0.06165313720703125, 0.07073593139648438, 0.0798187255859375, 0.08890151977539062, 0.09798431396484375, 0.10706710815429688, 0.11614990234375, 0.12523269653320312, 0.13431549072265625, 0.14339828491210938, 0.1524810791015625, 0.16156387329101562, 0.17064666748046875, 0.17972946166992188, 0.188812255859375, 0.19789505004882812, 0.20697784423828125, 0.21606063842773438, 0.2251434326171875, 0.23422622680664062, 0.24330902099609375, 0.2523918151855469, 0.261474609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 9.0, 10.0, 15.0, 8.0, 21.0, 24.0, 30.0, 34.0, 39.0, 41.0, 57.0, 53.0, 38.0, 49.0, 55.0, 63.0, 64.0, 48.0, 39.0, 40.0, 47.0, 44.0, 27.0, 31.0, 31.0, 14.0, 9.0, 9.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5795440673828125, -1.519439697265625, -1.4593353271484375, -1.39923095703125, -1.3391265869140625, -1.279022216796875, -1.2189178466796875, -1.1588134765625, -1.0987091064453125, -1.038604736328125, -0.9785003662109375, -0.91839599609375, -0.8582916259765625, -0.798187255859375, -0.7380828857421875, -0.677978515625, -0.6178741455078125, -0.557769775390625, -0.4976654052734375, -0.43756103515625, -0.3774566650390625, -0.317352294921875, -0.2572479248046875, -0.1971435546875, -0.1370391845703125, -0.076934814453125, -0.0168304443359375, 0.04327392578125, 0.1033782958984375, 0.163482666015625, 0.2235870361328125, 0.28369140625, 0.3437957763671875, 0.403900146484375, 0.4640045166015625, 0.52410888671875, 0.5842132568359375, 0.644317626953125, 0.7044219970703125, 0.7645263671875, 0.8246307373046875, 0.884735107421875, 0.9448394775390625, 1.00494384765625, 1.0650482177734375, 1.125152587890625, 1.1852569580078125, 1.245361328125, 1.3054656982421875, 1.365570068359375, 1.4256744384765625, 1.48577880859375, 1.5458831787109375, 1.605987548828125, 1.6660919189453125, 1.7261962890625, 1.7863006591796875, 1.846405029296875, 1.9065093994140625, 1.96661376953125, 2.0267181396484375, 2.086822509765625, 2.1469268798828125, 2.20703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 4.0, 6.0, 13.0, 18.0, 28.0, 42.0, 47.0, 70.0, 88.0, 167.0, 283.0, 439.0, 672.0, 1180.0, 2137.0, 3860.0, 7794.0, 16823.0, 41834.0, 124473.0, 361771.0, 319869.0, 102729.0, 34988.0, 14394.0, 6708.0, 3397.0, 1899.0, 1089.0, 663.0, 405.0, 203.0, 156.0, 102.0, 59.0, 41.0, 38.0, 20.0, 9.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.07716560363769531, -0.07449722290039062, -0.07182884216308594, -0.06916046142578125, -0.06649208068847656, -0.06382369995117188, -0.06115531921386719, -0.0584869384765625, -0.05581855773925781, -0.053150177001953125, -0.05048179626464844, -0.04781341552734375, -0.04514503479003906, -0.042476654052734375, -0.03980827331542969, -0.037139892578125, -0.03447151184082031, -0.031803131103515625, -0.029134750366210938, -0.02646636962890625, -0.023797988891601562, -0.021129608154296875, -0.018461227416992188, -0.0157928466796875, -0.013124465942382812, -0.010456085205078125, -0.0077877044677734375, -0.00511932373046875, -0.0024509429931640625, 0.000217437744140625, 0.0028858184814453125, 0.00555419921875, 0.008222579956054688, 0.010890960693359375, 0.013559341430664062, 0.01622772216796875, 0.018896102905273438, 0.021564483642578125, 0.024232864379882812, 0.0269012451171875, 0.029569625854492188, 0.032238006591796875, 0.03490638732910156, 0.03757476806640625, 0.04024314880371094, 0.042911529541015625, 0.04557991027832031, 0.048248291015625, 0.05091667175292969, 0.053585052490234375, 0.05625343322753906, 0.05892181396484375, 0.06159019470214844, 0.06425857543945312, 0.06692695617675781, 0.0695953369140625, 0.07226371765136719, 0.07493209838867188, 0.07760047912597656, 0.08026885986328125, 0.08293724060058594, 0.08560562133789062, 0.08827400207519531, 0.0909423828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 17.0, 15.0, 18.0, 29.0, 51.0, 65.0, 92.0, 114.0, 128.0, 105.0, 95.0, 65.0, 41.0, 30.0, 29.0, 19.0, 12.0, 12.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.176399230957031e-05, -6.942637264728546e-05, -6.708875298500061e-05, -6.475113332271576e-05, -6.241351366043091e-05, -6.007589399814606e-05, -5.7738274335861206e-05, -5.5400654673576355e-05, -5.3063035011291504e-05, -5.072541534900665e-05, -4.83877956867218e-05, -4.605017602443695e-05, -4.37125563621521e-05, -4.137493669986725e-05, -3.90373170375824e-05, -3.6699697375297546e-05, -3.4362077713012695e-05, -3.2024458050727844e-05, -2.9686838388442993e-05, -2.7349218726158142e-05, -2.501159906387329e-05, -2.267397940158844e-05, -2.033635973930359e-05, -1.7998740077018738e-05, -1.5661120414733887e-05, -1.3323500752449036e-05, -1.0985881090164185e-05, -8.648261427879333e-06, -6.310641765594482e-06, -3.973022103309631e-06, -1.6354024410247803e-06, 7.022172212600708e-07, 3.039836883544922e-06, 5.377456545829773e-06, 7.715076208114624e-06, 1.0052695870399475e-05, 1.2390315532684326e-05, 1.4727935194969177e-05, 1.706555485725403e-05, 1.940317451953888e-05, 2.174079418182373e-05, 2.407841384410858e-05, 2.6416033506393433e-05, 2.8753653168678284e-05, 3.1091272830963135e-05, 3.3428892493247986e-05, 3.576651215553284e-05, 3.810413181781769e-05, 4.044175148010254e-05, 4.277937114238739e-05, 4.511699080467224e-05, 4.745461046695709e-05, 4.979223012924194e-05, 5.2129849791526794e-05, 5.4467469453811646e-05, 5.6805089116096497e-05, 5.914270877838135e-05, 6.14803284406662e-05, 6.381794810295105e-05, 6.61555677652359e-05, 6.849318742752075e-05, 7.08308070898056e-05, 7.316842675209045e-05, 7.55060464143753e-05, 7.784366607666016e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 8.0, 4.0, 12.0, 13.0, 19.0, 25.0, 30.0, 68.0, 80.0, 131.0, 194.0, 342.0, 624.0, 1171.0, 2258.0, 4635.0, 10312.0, 27167.0, 92578.0, 389316.0, 382450.0, 90793.0, 26763.0, 10218.0, 4579.0, 2146.0, 1090.0, 623.0, 336.0, 204.0, 119.0, 72.0, 59.0, 29.0, 29.0, 19.0, 12.0, 12.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12103271484375, -0.1171274185180664, -0.11322212219238281, -0.10931682586669922, -0.10541152954101562, -0.10150623321533203, -0.09760093688964844, -0.09369564056396484, -0.08979034423828125, -0.08588504791259766, -0.08197975158691406, -0.07807445526123047, -0.07416915893554688, -0.07026386260986328, -0.06635856628417969, -0.062453269958496094, -0.0585479736328125, -0.054642677307128906, -0.05073738098144531, -0.04683208465576172, -0.042926788330078125, -0.03902149200439453, -0.03511619567871094, -0.031210899353027344, -0.02730560302734375, -0.023400306701660156, -0.019495010375976562, -0.015589714050292969, -0.011684417724609375, -0.007779121398925781, -0.0038738250732421875, 3.147125244140625e-05, 0.003936767578125, 0.007842063903808594, 0.011747360229492188, 0.01565265655517578, 0.019557952880859375, 0.02346324920654297, 0.027368545532226562, 0.031273841857910156, 0.03517913818359375, 0.039084434509277344, 0.04298973083496094, 0.04689502716064453, 0.050800323486328125, 0.05470561981201172, 0.05861091613769531, 0.0625162124633789, 0.0664215087890625, 0.0703268051147461, 0.07423210144042969, 0.07813739776611328, 0.08204269409179688, 0.08594799041748047, 0.08985328674316406, 0.09375858306884766, 0.09766387939453125, 0.10156917572021484, 0.10547447204589844, 0.10937976837158203, 0.11328506469726562, 0.11719036102294922, 0.12109565734863281, 0.1250009536743164, 0.12890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 8.0, 2.0, 8.0, 9.0, 16.0, 7.0, 12.0, 10.0, 18.0, 24.0, 30.0, 33.0, 52.0, 35.0, 49.0, 43.0, 55.0, 63.0, 63.0, 53.0, 54.0, 59.0, 47.0, 38.0, 27.0, 33.0, 23.0, 26.0, 12.0, 14.0, 7.0, 16.0, 11.0, 10.0, 2.0, 7.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.025909423828125, -0.025172948837280273, -0.024436473846435547, -0.02369999885559082, -0.022963523864746094, -0.022227048873901367, -0.02149057388305664, -0.020754098892211914, -0.020017623901367188, -0.01928114891052246, -0.018544673919677734, -0.017808198928833008, -0.01707172393798828, -0.016335248947143555, -0.015598773956298828, -0.014862298965454102, -0.014125823974609375, -0.013389348983764648, -0.012652873992919922, -0.011916399002075195, -0.011179924011230469, -0.010443449020385742, -0.009706974029541016, -0.008970499038696289, -0.008234024047851562, -0.007497549057006836, -0.006761074066162109, -0.006024599075317383, -0.005288124084472656, -0.00455164909362793, -0.003815174102783203, -0.0030786991119384766, -0.00234222412109375, -0.0016057491302490234, -0.0008692741394042969, -0.0001327991485595703, 0.0006036758422851562, 0.0013401508331298828, 0.0020766258239746094, 0.002813100814819336, 0.0035495758056640625, 0.004286050796508789, 0.005022525787353516, 0.005759000778198242, 0.006495475769042969, 0.007231950759887695, 0.007968425750732422, 0.008704900741577148, 0.009441375732421875, 0.010177850723266602, 0.010914325714111328, 0.011650800704956055, 0.012387275695800781, 0.013123750686645508, 0.013860225677490234, 0.014596700668334961, 0.015333175659179688, 0.016069650650024414, 0.01680612564086914, 0.017542600631713867, 0.018279075622558594, 0.01901555061340332, 0.019752025604248047, 0.020488500595092773, 0.0212249755859375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 13.0, 15.0, 28.0, 44.0, 51.0, 92.0, 95.0, 124.0, 127.0, 111.0, 96.0, 58.0, 39.0, 26.0, 22.0, 16.0, 3.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1636282205581665, -1.111046314239502, -1.058464527130127, -1.0058826208114624, -0.9533007144927979, -0.9007188677787781, -0.8481370210647583, -0.7955551147460938, -0.742973268032074, -0.6903914213180542, -0.6378095149993896, -0.5852276682853699, -0.5326458215713501, -0.48006391525268555, -0.42748206853866577, -0.3749001920223236, -0.32231831550598145, -0.2697364389896393, -0.2171545773744583, -0.16457271575927734, -0.11199083924293518, -0.05940896272659302, -0.006827116012573242, 0.04575476050376892, 0.09833663702011108, 0.15091851353645325, 0.20350037515163422, 0.2560822367668152, 0.30866411328315735, 0.3612459897994995, 0.4138278365135193, 0.46640971302986145, 0.5189917087554932, 0.5715735554695129, 0.6241554617881775, 0.6767373085021973, 0.7293192148208618, 0.7819010615348816, 0.8344829082489014, 0.8870648145675659, 0.9396466612815857, 0.9922285079956055, 1.04481041431427, 1.0973923206329346, 1.1499741077423096, 1.2025560140609741, 1.2551379203796387, 1.3077197074890137, 1.3603016138076782, 1.4128835201263428, 1.4654653072357178, 1.5180472135543823, 1.5706291198730469, 1.6232109069824219, 1.6757928133010864, 1.728374719619751, 1.780956506729126, 1.8335384130477905, 1.8861202001571655, 1.93870210647583, 1.9912840127944946, 2.043865919113159, 2.096447706222534, 2.149029493331909, 2.2016115188598633]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 12.0, 17.0, 25.0, 15.0, 27.0, 53.0, 53.0, 73.0, 80.0, 86.0, 93.0, 83.0, 68.0, 79.0, 64.0, 59.0, 29.0, 37.0, 8.0, 13.0, 14.0, 9.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8270987868309021, -0.7772533893585205, -0.7274079322814941, -0.6775625348091125, -0.627717137336731, -0.5778717398643494, -0.5280263423919678, -0.4781808853149414, -0.4283354878425598, -0.3784900903701782, -0.32864466309547424, -0.27879923582077026, -0.22895383834838867, -0.1791084259748459, -0.1292630136013031, -0.07941758632659912, -0.02957218885421753, 0.020273223519325256, 0.07011863589286804, 0.11996404826641083, 0.1698094606399536, 0.2196548730134964, 0.2695002853870392, 0.31934571266174316, 0.36919111013412476, 0.41903650760650635, 0.4688819348812103, 0.5187273621559143, 0.5685727596282959, 0.6184181571006775, 0.6682635545730591, 0.7181090116500854, 0.7679543495178223, 0.8177997469902039, 0.8676451444625854, 0.9174906015396118, 0.9673359990119934, 1.017181396484375, 1.0670268535614014, 1.1168723106384277, 1.1667176485061646, 1.216563105583191, 1.2664084434509277, 1.316253900527954, 1.3660993576049805, 1.4159446954727173, 1.4657901525497437, 1.5156354904174805, 1.5654809474945068, 1.6153264045715332, 1.66517174243927, 1.7150171995162964, 1.7648625373840332, 1.8147079944610596, 1.864553451538086, 1.9143989086151123, 1.9642442464828491, 2.014089584350586, 2.0639350414276123, 2.1137804985046387, 2.163625955581665, 2.2134714126586914, 2.2633166313171387, 2.313162088394165, 2.3630075454711914]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 8.0, 15.0, 37.0, 33.0, 64.0, 63.0, 100.0, 175.0, 236.0, 476.0, 746.0, 1351.0, 2576.0, 5525.0, 15953.0, 80616.0, 709161.0, 190723.0, 25710.0, 7759.0, 3280.0, 1562.0, 897.0, 512.0, 333.0, 193.0, 133.0, 105.0, 62.0, 43.0, 27.0, 19.0, 9.0, 16.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7099609375, -1.655975341796875, -1.60198974609375, -1.548004150390625, -1.4940185546875, -1.440032958984375, -1.38604736328125, -1.332061767578125, -1.278076171875, -1.224090576171875, -1.17010498046875, -1.116119384765625, -1.0621337890625, -1.008148193359375, -0.95416259765625, -0.900177001953125, -0.84619140625, -0.792205810546875, -0.73822021484375, -0.684234619140625, -0.6302490234375, -0.576263427734375, -0.52227783203125, -0.468292236328125, -0.414306640625, -0.360321044921875, -0.30633544921875, -0.252349853515625, -0.1983642578125, -0.144378662109375, -0.09039306640625, -0.036407470703125, 0.017578125, 0.071563720703125, 0.12554931640625, 0.179534912109375, 0.2335205078125, 0.287506103515625, 0.34149169921875, 0.395477294921875, 0.449462890625, 0.503448486328125, 0.55743408203125, 0.611419677734375, 0.6654052734375, 0.719390869140625, 0.77337646484375, 0.827362060546875, 0.88134765625, 0.935333251953125, 0.98931884765625, 1.043304443359375, 1.0972900390625, 1.151275634765625, 1.20526123046875, 1.259246826171875, 1.313232421875, 1.367218017578125, 1.42120361328125, 1.475189208984375, 1.5291748046875, 1.583160400390625, 1.63714599609375, 1.691131591796875, 1.7451171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 12.0, 14.0, 16.0, 15.0, 23.0, 24.0, 32.0, 57.0, 61.0, 48.0, 61.0, 71.0, 69.0, 54.0, 63.0, 56.0, 64.0, 48.0, 41.0, 41.0, 21.0, 22.0, 23.0, 11.0, 13.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.734375, -1.66424560546875, -1.5941162109375, -1.52398681640625, -1.453857421875, -1.38372802734375, -1.3135986328125, -1.24346923828125, -1.17333984375, -1.10321044921875, -1.0330810546875, -0.96295166015625, -0.892822265625, -0.82269287109375, -0.7525634765625, -0.68243408203125, -0.6123046875, -0.54217529296875, -0.4720458984375, -0.40191650390625, -0.331787109375, -0.26165771484375, -0.1915283203125, -0.12139892578125, -0.05126953125, 0.01885986328125, 0.0889892578125, 0.15911865234375, 0.229248046875, 0.29937744140625, 0.3695068359375, 0.43963623046875, 0.509765625, 0.57989501953125, 0.6500244140625, 0.72015380859375, 0.790283203125, 0.86041259765625, 0.9305419921875, 1.00067138671875, 1.07080078125, 1.14093017578125, 1.2110595703125, 1.28118896484375, 1.351318359375, 1.42144775390625, 1.4915771484375, 1.56170654296875, 1.6318359375, 1.70196533203125, 1.7720947265625, 1.84222412109375, 1.912353515625, 1.98248291015625, 2.0526123046875, 2.12274169921875, 2.19287109375, 2.26300048828125, 2.3331298828125, 2.40325927734375, 2.473388671875, 2.54351806640625, 2.6136474609375, 2.68377685546875, 2.75390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 11.0, 8.0, 14.0, 11.0, 16.0, 19.0, 12.0, 20.0, 23.0, 28.0, 30.0, 34.0, 47.0, 64.0, 77.0, 165.0, 593.0, 3780.0, 105108.0, 926682.0, 9995.0, 1109.0, 224.0, 106.0, 54.0, 37.0, 46.0, 34.0, 27.0, 25.0, 31.0, 17.0, 17.0, 16.0, 13.0, 11.0, 10.0, 5.0, 4.0, 5.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.24609375, -4.09552001953125, -3.9449462890625, -3.79437255859375, -3.643798828125, -3.49322509765625, -3.3426513671875, -3.19207763671875, -3.04150390625, -2.89093017578125, -2.7403564453125, -2.58978271484375, -2.439208984375, -2.28863525390625, -2.1380615234375, -1.98748779296875, -1.8369140625, -1.68634033203125, -1.5357666015625, -1.38519287109375, -1.234619140625, -1.08404541015625, -0.9334716796875, -0.78289794921875, -0.63232421875, -0.48175048828125, -0.3311767578125, -0.18060302734375, -0.030029296875, 0.12054443359375, 0.2711181640625, 0.42169189453125, 0.572265625, 0.72283935546875, 0.8734130859375, 1.02398681640625, 1.174560546875, 1.32513427734375, 1.4757080078125, 1.62628173828125, 1.77685546875, 1.92742919921875, 2.0780029296875, 2.22857666015625, 2.379150390625, 2.52972412109375, 2.6802978515625, 2.83087158203125, 2.9814453125, 3.13201904296875, 3.2825927734375, 3.43316650390625, 3.583740234375, 3.73431396484375, 3.8848876953125, 4.03546142578125, 4.18603515625, 4.33660888671875, 4.4871826171875, 4.63775634765625, 4.788330078125, 4.93890380859375, 5.0894775390625, 5.24005126953125, 5.390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 13.0, 7.0, 12.0, 15.0, 18.0, 21.0, 15.0, 16.0, 24.0, 29.0, 35.0, 23.0, 33.0, 35.0, 49.0, 34.0, 34.0, 54.0, 39.0, 54.0, 44.0, 44.0, 46.0, 25.0, 35.0, 29.0, 27.0, 34.0, 24.0, 21.0, 21.0, 26.0, 11.0, 10.0, 10.0, 8.0, 6.0, 4.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.68359375, -1.6319580078125, -1.580322265625, -1.5286865234375, -1.47705078125, -1.4254150390625, -1.373779296875, -1.3221435546875, -1.2705078125, -1.2188720703125, -1.167236328125, -1.1156005859375, -1.06396484375, -1.0123291015625, -0.960693359375, -0.9090576171875, -0.857421875, -0.8057861328125, -0.754150390625, -0.7025146484375, -0.65087890625, -0.5992431640625, -0.547607421875, -0.4959716796875, -0.4443359375, -0.3927001953125, -0.341064453125, -0.2894287109375, -0.23779296875, -0.1861572265625, -0.134521484375, -0.0828857421875, -0.03125, 0.0203857421875, 0.072021484375, 0.1236572265625, 0.17529296875, 0.2269287109375, 0.278564453125, 0.3302001953125, 0.3818359375, 0.4334716796875, 0.485107421875, 0.5367431640625, 0.58837890625, 0.6400146484375, 0.691650390625, 0.7432861328125, 0.794921875, 0.8465576171875, 0.898193359375, 0.9498291015625, 1.00146484375, 1.0531005859375, 1.104736328125, 1.1563720703125, 1.2080078125, 1.2596435546875, 1.311279296875, 1.3629150390625, 1.41455078125, 1.4661865234375, 1.517822265625, 1.5694580078125, 1.62109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 6.0, 3.0, 11.0, 22.0, 33.0, 35.0, 51.0, 95.0, 247.0, 493.0, 1152.0, 3497.0, 18253.0, 537929.0, 464536.0, 16715.0, 3413.0, 1100.0, 468.0, 219.0, 109.0, 62.0, 39.0, 31.0, 15.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48431396484375, -0.4622802734375, -0.44024658203125, -0.418212890625, -0.39617919921875, -0.3741455078125, -0.35211181640625, -0.330078125, -0.30804443359375, -0.2860107421875, -0.26397705078125, -0.241943359375, -0.21990966796875, -0.1978759765625, -0.17584228515625, -0.15380859375, -0.13177490234375, -0.1097412109375, -0.08770751953125, -0.065673828125, -0.04364013671875, -0.0216064453125, 0.00042724609375, 0.0224609375, 0.04449462890625, 0.0665283203125, 0.08856201171875, 0.110595703125, 0.13262939453125, 0.1546630859375, 0.17669677734375, 0.19873046875, 0.22076416015625, 0.2427978515625, 0.26483154296875, 0.286865234375, 0.30889892578125, 0.3309326171875, 0.35296630859375, 0.375, 0.39703369140625, 0.4190673828125, 0.44110107421875, 0.463134765625, 0.48516845703125, 0.5072021484375, 0.52923583984375, 0.55126953125, 0.57330322265625, 0.5953369140625, 0.61737060546875, 0.639404296875, 0.66143798828125, 0.6834716796875, 0.70550537109375, 0.7275390625, 0.74957275390625, 0.7716064453125, 0.79364013671875, 0.815673828125, 0.83770751953125, 0.8597412109375, 0.88177490234375, 0.90380859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 12.0, 6.0, 20.0, 26.0, 46.0, 89.0, 126.0, 191.0, 198.0, 114.0, 70.0, 33.0, 19.0, 16.0, 6.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00012129545211791992, -0.00011854059994220734, -0.00011578574776649475, -0.00011303089559078217, -0.00011027604341506958, -0.000107521191239357, -0.00010476633906364441, -0.00010201148688793182, -9.925663471221924e-05, -9.650178253650665e-05, -9.374693036079407e-05, -9.099207818508148e-05, -8.82372260093689e-05, -8.548237383365631e-05, -8.272752165794373e-05, -7.997266948223114e-05, -7.721781730651855e-05, -7.446296513080597e-05, -7.170811295509338e-05, -6.89532607793808e-05, -6.619840860366821e-05, -6.344355642795563e-05, -6.068870425224304e-05, -5.7933852076530457e-05, -5.517899990081787e-05, -5.2424147725105286e-05, -4.96692955493927e-05, -4.6914443373680115e-05, -4.415959119796753e-05, -4.1404739022254944e-05, -3.864988684654236e-05, -3.589503467082977e-05, -3.314018249511719e-05, -3.0385330319404602e-05, -2.7630478143692017e-05, -2.487562596797943e-05, -2.2120773792266846e-05, -1.936592161655426e-05, -1.6611069440841675e-05, -1.385621726512909e-05, -1.1101365089416504e-05, -8.346512913703918e-06, -5.591660737991333e-06, -2.8368085622787476e-06, -8.195638656616211e-08, 2.6728957891464233e-06, 5.427747964859009e-06, 8.182600140571594e-06, 1.093745231628418e-05, 1.3692304491996765e-05, 1.644715666770935e-05, 1.9202008843421936e-05, 2.195686101913452e-05, 2.4711713194847107e-05, 2.7466565370559692e-05, 3.0221417546272278e-05, 3.297626972198486e-05, 3.573112189769745e-05, 3.8485974073410034e-05, 4.124082624912262e-05, 4.3995678424835205e-05, 4.675053060054779e-05, 4.9505382776260376e-05, 5.226023495197296e-05, 5.501508712768555e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 4.0, 17.0, 6.0, 11.0, 22.0, 39.0, 72.0, 92.0, 192.0, 333.0, 694.0, 1582.0, 3878.0, 12771.0, 79289.0, 786494.0, 137611.0, 17149.0, 4731.0, 1823.0, 841.0, 381.0, 192.0, 106.0, 65.0, 45.0, 27.0, 15.0, 18.0, 13.0, 10.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5030288696289062, -0.4860382080078125, -0.46904754638671875, -0.452056884765625, -0.43506622314453125, -0.4180755615234375, -0.40108489990234375, -0.38409423828125, -0.36710357666015625, -0.3501129150390625, -0.33312225341796875, -0.316131591796875, -0.29914093017578125, -0.2821502685546875, -0.26515960693359375, -0.2481689453125, -0.23117828369140625, -0.2141876220703125, -0.19719696044921875, -0.180206298828125, -0.16321563720703125, -0.1462249755859375, -0.12923431396484375, -0.11224365234375, -0.09525299072265625, -0.0782623291015625, -0.06127166748046875, -0.044281005859375, -0.02729034423828125, -0.0102996826171875, 0.00669097900390625, 0.023681640625, 0.04067230224609375, 0.0576629638671875, 0.07465362548828125, 0.091644287109375, 0.10863494873046875, 0.1256256103515625, 0.14261627197265625, 0.15960693359375, 0.17659759521484375, 0.1935882568359375, 0.21057891845703125, 0.227569580078125, 0.24456024169921875, 0.2615509033203125, 0.27854156494140625, 0.2955322265625, 0.31252288818359375, 0.3295135498046875, 0.34650421142578125, 0.363494873046875, 0.38048553466796875, 0.3974761962890625, 0.41446685791015625, 0.43145751953125, 0.44844818115234375, 0.4654388427734375, 0.48242950439453125, 0.499420166015625, 0.5164108276367188, 0.5334014892578125, 0.5503921508789062, 0.5673828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 10.0, 7.0, 8.0, 21.0, 25.0, 35.0, 35.0, 66.0, 85.0, 119.0, 135.0, 127.0, 96.0, 63.0, 41.0, 35.0, 20.0, 13.0, 12.0, 4.0, 9.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1953125, -0.1896800994873047, -0.18404769897460938, -0.17841529846191406, -0.17278289794921875, -0.16715049743652344, -0.16151809692382812, -0.1558856964111328, -0.1502532958984375, -0.1446208953857422, -0.13898849487304688, -0.13335609436035156, -0.12772369384765625, -0.12209129333496094, -0.11645889282226562, -0.11082649230957031, -0.105194091796875, -0.09956169128417969, -0.09392929077148438, -0.08829689025878906, -0.08266448974609375, -0.07703208923339844, -0.07139968872070312, -0.06576728820800781, -0.0601348876953125, -0.05450248718261719, -0.048870086669921875, -0.04323768615722656, -0.03760528564453125, -0.03197288513183594, -0.026340484619140625, -0.020708084106445312, -0.01507568359375, -0.009443283081054688, -0.003810882568359375, 0.0018215179443359375, 0.00745391845703125, 0.013086318969726562, 0.018718719482421875, 0.024351119995117188, 0.0299835205078125, 0.03561592102050781, 0.041248321533203125, 0.04688072204589844, 0.05251312255859375, 0.05814552307128906, 0.06377792358398438, 0.06941032409667969, 0.075042724609375, 0.08067512512207031, 0.08630752563476562, 0.09193992614746094, 0.09757232666015625, 0.10320472717285156, 0.10883712768554688, 0.11446952819824219, 0.1201019287109375, 0.1257343292236328, 0.13136672973632812, 0.13699913024902344, 0.14263153076171875, 0.14826393127441406, 0.15389633178710938, 0.1595287322998047, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 16.0, 11.0, 13.0, 25.0, 16.0, 34.0, 49.0, 62.0, 85.0, 81.0, 98.0, 102.0, 106.0, 72.0, 54.0, 44.0, 37.0, 29.0, 19.0, 6.0, 7.0, 5.0, 5.0, 6.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2271065711975098, -2.1438546180725098, -2.060602903366089, -1.9773510694503784, -1.894099235534668, -1.810847282409668, -1.7275954484939575, -1.644343614578247, -1.5610917806625366, -1.4778399467468262, -1.3945881128311157, -1.3113362789154053, -1.2280843257904053, -1.1448326110839844, -1.0615806579589844, -0.9783288240432739, -0.8950769901275635, -0.811825156211853, -0.7285733222961426, -0.6453214287757874, -0.5620695948600769, -0.47881776094436646, -0.3955658972263336, -0.3123140335083008, -0.22906219959259033, -0.1458103507757187, -0.06255850195884705, 0.020693346858024597, 0.10394519567489624, 0.1871970295906067, 0.2704488933086395, 0.35370075702667236, 0.4369525909423828, 0.5202044248580933, 0.6034562587738037, 0.6867081522941589, 0.7699599862098694, 0.8532118201255798, 0.9364637136459351, 1.0197155475616455, 1.102967381477356, 1.1862192153930664, 1.2694710493087769, 1.3527228832244873, 1.4359748363494873, 1.5192265510559082, 1.6024785041809082, 1.6857303380966187, 1.768982172012329, 1.8522340059280396, 1.93548583984375, 2.01873779296875, 2.101989507675171, 2.185241460800171, 2.268493175506592, 2.351745128631592, 2.434997081756592, 2.518249034881592, 2.6015007495880127, 2.6847527027130127, 2.7680044174194336, 2.8512563705444336, 2.9345080852508545, 3.0177600383758545, 3.1010117530822754]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 9.0, 12.0, 22.0, 21.0, 14.0, 26.0, 23.0, 32.0, 32.0, 39.0, 48.0, 34.0, 47.0, 39.0, 64.0, 41.0, 62.0, 49.0, 37.0, 35.0, 33.0, 35.0, 28.0, 36.0, 25.0, 26.0, 20.0, 19.0, 20.0, 7.0, 8.0, 12.0, 6.0, 1.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.779217481613159, -2.685767650604248, -2.592317819595337, -2.498867988586426, -2.4054181575775146, -2.3119683265686035, -2.2185182571411133, -2.125068426132202, -2.031618595123291, -1.9381687641143799, -1.8447189331054688, -1.7512691020965576, -1.657819151878357, -1.5643693208694458, -1.4709194898605347, -1.377469539642334, -1.2840198278427124, -1.1905699968338013, -1.0971201658248901, -1.0036702156066895, -0.9102203845977783, -0.8167705535888672, -0.723320722579956, -0.6298708319664001, -0.536421000957489, -0.4429711401462555, -0.349521279335022, -0.25607144832611084, -0.16262158751487732, -0.0691717267036438, 0.024278104305267334, 0.11772799491882324, 0.21117782592773438, 0.3046276867389679, 0.3980775475502014, 0.49152737855911255, 0.5849772691726685, 0.6784271001815796, 0.7718769311904907, 0.8653268218040466, 0.9587766528129578, 1.0522265434265137, 1.1456763744354248, 1.239126205444336, 1.332576036453247, 1.4260258674621582, 1.5194756984710693, 1.61292564868927, 1.7063754796981812, 1.7998253107070923, 1.8932751417160034, 1.986725091934204, 2.0801749229431152, 2.1736247539520264, 2.2670745849609375, 2.3605244159698486, 2.4539742469787598, 2.547424077987671, 2.640873908996582, 2.734323740005493, 2.8277735710144043, 2.9212236404418945, 3.0146732330322266, 3.108123302459717, 3.201573133468628]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 6.0, 11.0, 16.0, 35.0, 42.0, 82.0, 105.0, 204.0, 446.0, 940.0, 3120.0, 22146.0, 1122835.0, 2969094.0, 67752.0, 5163.0, 1281.0, 514.0, 221.0, 120.0, 58.0, 36.0, 15.0, 16.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66015625, -5.534820556640625, -5.40948486328125, -5.284149169921875, -5.1588134765625, -5.033477783203125, -4.90814208984375, -4.782806396484375, -4.657470703125, -4.532135009765625, -4.40679931640625, -4.281463623046875, -4.1561279296875, -4.030792236328125, -3.90545654296875, -3.780120849609375, -3.65478515625, -3.529449462890625, -3.40411376953125, -3.278778076171875, -3.1534423828125, -3.028106689453125, -2.90277099609375, -2.777435302734375, -2.652099609375, -2.526763916015625, -2.40142822265625, -2.276092529296875, -2.1507568359375, -2.025421142578125, -1.90008544921875, -1.774749755859375, -1.6494140625, -1.524078369140625, -1.39874267578125, -1.273406982421875, -1.1480712890625, -1.022735595703125, -0.89739990234375, -0.772064208984375, -0.646728515625, -0.521392822265625, -0.39605712890625, -0.270721435546875, -0.1453857421875, -0.020050048828125, 0.10528564453125, 0.230621337890625, 0.35595703125, 0.481292724609375, 0.60662841796875, 0.731964111328125, 0.8572998046875, 0.982635498046875, 1.10797119140625, 1.233306884765625, 1.358642578125, 1.483978271484375, 1.60931396484375, 1.734649658203125, 1.8599853515625, 1.985321044921875, 2.11065673828125, 2.235992431640625, 2.361328125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 2.0, 6.0, 8.0, 7.0, 14.0, 15.0, 20.0, 24.0, 17.0, 21.0, 28.0, 41.0, 46.0, 54.0, 44.0, 51.0, 57.0, 64.0, 43.0, 41.0, 46.0, 60.0, 49.0, 35.0, 38.0, 30.0, 24.0, 19.0, 24.0, 16.0, 11.0, 8.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.421875, -1.3794708251953125, -1.337066650390625, -1.2946624755859375, -1.25225830078125, -1.2098541259765625, -1.167449951171875, -1.1250457763671875, -1.0826416015625, -1.0402374267578125, -0.997833251953125, -0.9554290771484375, -0.91302490234375, -0.8706207275390625, -0.828216552734375, -0.7858123779296875, -0.743408203125, -0.7010040283203125, -0.658599853515625, -0.6161956787109375, -0.57379150390625, -0.5313873291015625, -0.488983154296875, -0.4465789794921875, -0.4041748046875, -0.3617706298828125, -0.319366455078125, -0.2769622802734375, -0.23455810546875, -0.1921539306640625, -0.149749755859375, -0.1073455810546875, -0.06494140625, -0.0225372314453125, 0.019866943359375, 0.0622711181640625, 0.10467529296875, 0.1470794677734375, 0.189483642578125, 0.2318878173828125, 0.2742919921875, 0.3166961669921875, 0.359100341796875, 0.4015045166015625, 0.44390869140625, 0.4863128662109375, 0.528717041015625, 0.5711212158203125, 0.613525390625, 0.6559295654296875, 0.698333740234375, 0.7407379150390625, 0.78314208984375, 0.8255462646484375, 0.867950439453125, 0.9103546142578125, 0.9527587890625, 0.9951629638671875, 1.037567138671875, 1.0799713134765625, 1.12237548828125, 1.1647796630859375, 1.207183837890625, 1.2495880126953125, 1.2919921875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 11.0, 18.0, 25.0, 31.0, 37.0, 64.0, 96.0, 170.0, 307.0, 893.0, 3514.0, 33618.0, 3730756.0, 411355.0, 10470.0, 1757.0, 535.0, 253.0, 126.0, 76.0, 49.0, 37.0, 15.0, 13.0, 15.0, 7.0, 8.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.29071044921875, -4.1673583984375, -4.04400634765625, -3.920654296875, -3.79730224609375, -3.6739501953125, -3.55059814453125, -3.42724609375, -3.30389404296875, -3.1805419921875, -3.05718994140625, -2.933837890625, -2.81048583984375, -2.6871337890625, -2.56378173828125, -2.4404296875, -2.31707763671875, -2.1937255859375, -2.07037353515625, -1.947021484375, -1.82366943359375, -1.7003173828125, -1.57696533203125, -1.45361328125, -1.33026123046875, -1.2069091796875, -1.08355712890625, -0.960205078125, -0.83685302734375, -0.7135009765625, -0.59014892578125, -0.466796875, -0.34344482421875, -0.2200927734375, -0.09674072265625, 0.026611328125, 0.14996337890625, 0.2733154296875, 0.39666748046875, 0.52001953125, 0.64337158203125, 0.7667236328125, 0.89007568359375, 1.013427734375, 1.13677978515625, 1.2601318359375, 1.38348388671875, 1.5068359375, 1.63018798828125, 1.7535400390625, 1.87689208984375, 2.000244140625, 2.12359619140625, 2.2469482421875, 2.37030029296875, 2.49365234375, 2.61700439453125, 2.7403564453125, 2.86370849609375, 2.987060546875, 3.11041259765625, 3.2337646484375, 3.35711669921875, 3.48046875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 12.0, 24.0, 56.0, 111.0, 233.0, 649.0, 1215.0, 979.0, 427.0, 178.0, 91.0, 34.0, 24.0, 9.0, 11.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.623779296875, -0.59228515625, -0.560791015625, -0.529296875, -0.497802734375, -0.46630859375, -0.434814453125, -0.4033203125, -0.371826171875, -0.34033203125, -0.308837890625, -0.27734375, -0.245849609375, -0.21435546875, -0.182861328125, -0.1513671875, -0.119873046875, -0.08837890625, -0.056884765625, -0.025390625, 0.006103515625, 0.03759765625, 0.069091796875, 0.1005859375, 0.132080078125, 0.16357421875, 0.195068359375, 0.2265625, 0.258056640625, 0.28955078125, 0.321044921875, 0.3525390625, 0.384033203125, 0.41552734375, 0.447021484375, 0.478515625, 0.510009765625, 0.54150390625, 0.572998046875, 0.6044921875, 0.635986328125, 0.66748046875, 0.698974609375, 0.73046875, 0.761962890625, 0.79345703125, 0.824951171875, 0.8564453125, 0.887939453125, 0.91943359375, 0.950927734375, 0.982421875, 1.013916015625, 1.04541015625, 1.076904296875, 1.1083984375, 1.139892578125, 1.17138671875, 1.202880859375, 1.234375, 1.265869140625, 1.29736328125, 1.328857421875, 1.3603515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 10.0, 15.0, 16.0, 20.0, 25.0, 38.0, 31.0, 43.0, 65.0, 69.0, 79.0, 82.0, 94.0, 68.0, 66.0, 65.0, 50.0, 33.0, 22.0, 20.0, 19.0, 8.0, 7.0, 11.0, 5.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7913415431976318, -1.7379173040390015, -1.684493064880371, -1.6310687065124512, -1.5776444673538208, -1.5242202281951904, -1.47079598903656, -1.4173717498779297, -1.3639473915100098, -1.3105231523513794, -1.257098913192749, -1.203674554824829, -1.1502503156661987, -1.0968260765075684, -1.043401837348938, -0.9899775385856628, -0.9365532994270325, -0.8831290602684021, -0.829704761505127, -0.7762805223464966, -0.7228562235832214, -0.6694319844245911, -0.6160076856613159, -0.5625834465026855, -0.5091592073440552, -0.4557349383831024, -0.40231066942214966, -0.3488864302635193, -0.29546213150024414, -0.24203789234161377, -0.188613623380661, -0.13518935441970825, -0.0817650556564331, -0.028340790420770645, 0.025083474814891815, 0.07850773632526398, 0.13193200528621674, 0.1853562593460083, 0.23878052830696106, 0.2922047972679138, 0.3456290662288666, 0.39905333518981934, 0.4524776041507721, 0.5059018731117249, 0.5593261122703552, 0.6127504110336304, 0.6661746501922607, 0.7195988893508911, 0.7730231881141663, 0.8264474272727966, 0.8798717260360718, 0.9332959651947021, 0.9867202639579773, 1.040144443511963, 1.0935688018798828, 1.1469930410385132, 1.2004172801971436, 1.253841519355774, 1.3072657585144043, 1.3606901168823242, 1.4141143560409546, 1.467538595199585, 1.5209628343582153, 1.5743870735168457, 1.6278114318847656]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 4.0, 9.0, 12.0, 10.0, 19.0, 17.0, 10.0, 29.0, 17.0, 22.0, 24.0, 28.0, 32.0, 32.0, 33.0, 37.0, 42.0, 55.0, 52.0, 38.0, 51.0, 39.0, 49.0, 38.0, 33.0, 38.0, 28.0, 30.0, 27.0, 32.0, 24.0, 18.0, 16.0, 6.0, 12.0, 9.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1734586954116821, -1.1348876953125, -1.0963165760040283, -1.0577454566955566, -1.0191744565963745, -0.9806033968925476, -0.9420323371887207, -0.9034612774848938, -0.8648902177810669, -0.82631915807724, -0.7877480983734131, -0.7491770386695862, -0.7106059789657593, -0.6720349192619324, -0.6334638595581055, -0.5948927998542786, -0.5563217401504517, -0.5177506804466248, -0.47917962074279785, -0.44060856103897095, -0.40203750133514404, -0.36346644163131714, -0.32489538192749023, -0.28632432222366333, -0.24775326251983643, -0.20918220281600952, -0.17061114311218262, -0.1320400834083557, -0.09346902370452881, -0.054897964000701904, -0.016326904296875, 0.022244155406951904, 0.06081533432006836, 0.09938639402389526, 0.13795745372772217, 0.17652851343154907, 0.21509957313537598, 0.2536706328392029, 0.2922416925430298, 0.3308127522468567, 0.3693838119506836, 0.4079548716545105, 0.4465259313583374, 0.4850969910621643, 0.5236680507659912, 0.5622391104698181, 0.600810170173645, 0.6393812298774719, 0.6779522895812988, 0.7165233492851257, 0.7550944089889526, 0.7936654686927795, 0.8322365283966064, 0.8708075881004333, 0.9093786478042603, 0.9479497075080872, 0.9865207672119141, 1.0250918865203857, 1.0636628866195679, 1.10223388671875, 1.1408050060272217, 1.1793761253356934, 1.2179471254348755, 1.2565181255340576, 1.2950892448425293]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 11.0, 12.0, 25.0, 13.0, 25.0, 46.0, 66.0, 90.0, 171.0, 290.0, 489.0, 901.0, 1556.0, 3001.0, 6200.0, 13426.0, 32023.0, 80648.0, 219038.0, 369870.0, 195340.0, 72270.0, 28589.0, 12493.0, 5739.0, 2806.0, 1425.0, 789.0, 435.0, 273.0, 156.0, 99.0, 69.0, 58.0, 30.0, 23.0, 8.0, 7.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1812744140625, -0.17531967163085938, -0.16936492919921875, -0.16341018676757812, -0.1574554443359375, -0.15150070190429688, -0.14554595947265625, -0.13959121704101562, -0.133636474609375, -0.12768173217773438, -0.12172698974609375, -0.11577224731445312, -0.1098175048828125, -0.10386276245117188, -0.09790802001953125, -0.09195327758789062, -0.08599853515625, -0.08004379272460938, -0.07408905029296875, -0.06813430786132812, -0.0621795654296875, -0.056224822998046875, -0.05027008056640625, -0.044315338134765625, -0.038360595703125, -0.032405853271484375, -0.02645111083984375, -0.020496368408203125, -0.0145416259765625, -0.008586883544921875, -0.00263214111328125, 0.003322601318359375, 0.00927734375, 0.015232086181640625, 0.02118682861328125, 0.027141571044921875, 0.0330963134765625, 0.039051055908203125, 0.04500579833984375, 0.050960540771484375, 0.056915283203125, 0.06287002563476562, 0.06882476806640625, 0.07477951049804688, 0.0807342529296875, 0.08668899536132812, 0.09264373779296875, 0.09859848022460938, 0.10455322265625, 0.11050796508789062, 0.11646270751953125, 0.12241744995117188, 0.1283721923828125, 0.13432693481445312, 0.14028167724609375, 0.14623641967773438, 0.152191162109375, 0.15814590454101562, 0.16410064697265625, 0.17005538940429688, 0.1760101318359375, 0.18196487426757812, 0.18791961669921875, 0.19387435913085938, 0.1998291015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 15.0, 10.0, 15.0, 14.0, 17.0, 29.0, 28.0, 30.0, 21.0, 35.0, 41.0, 44.0, 42.0, 36.0, 49.0, 60.0, 49.0, 54.0, 45.0, 53.0, 38.0, 32.0, 30.0, 26.0, 37.0, 23.0, 28.0, 13.0, 15.0, 14.0, 5.0, 5.0, 7.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7978515625, -0.7707443237304688, -0.7436370849609375, -0.7165298461914062, -0.689422607421875, -0.6623153686523438, -0.6352081298828125, -0.6081008911132812, -0.58099365234375, -0.5538864135742188, -0.5267791748046875, -0.49967193603515625, -0.472564697265625, -0.44545745849609375, -0.4183502197265625, -0.39124298095703125, -0.3641357421875, -0.33702850341796875, -0.3099212646484375, -0.28281402587890625, -0.255706787109375, -0.22859954833984375, -0.2014923095703125, -0.17438507080078125, -0.14727783203125, -0.12017059326171875, -0.0930633544921875, -0.06595611572265625, -0.038848876953125, -0.01174163818359375, 0.0153656005859375, 0.04247283935546875, 0.069580078125, 0.09668731689453125, 0.1237945556640625, 0.15090179443359375, 0.178009033203125, 0.20511627197265625, 0.2322235107421875, 0.25933074951171875, 0.28643798828125, 0.31354522705078125, 0.3406524658203125, 0.36775970458984375, 0.394866943359375, 0.42197418212890625, 0.4490814208984375, 0.47618865966796875, 0.5032958984375, 0.5304031372070312, 0.5575103759765625, 0.5846176147460938, 0.611724853515625, 0.6388320922851562, 0.6659393310546875, 0.6930465698242188, 0.72015380859375, 0.7472610473632812, 0.7743682861328125, 0.8014755249023438, 0.828582763671875, 0.8556900024414062, 0.8827972412109375, 0.9099044799804688, 0.93701171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 9.0, 13.0, 15.0, 20.0, 39.0, 59.0, 64.0, 96.0, 149.0, 268.0, 387.0, 676.0, 1217.0, 2180.0, 4355.0, 9050.0, 20123.0, 45847.0, 113247.0, 260336.0, 315118.0, 159519.0, 64608.0, 27087.0, 11961.0, 5618.0, 2838.0, 1500.0, 791.0, 499.0, 282.0, 201.0, 133.0, 69.0, 66.0, 33.0, 25.0, 19.0, 10.0, 12.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.1487598419189453, -0.14383316040039062, -0.13890647888183594, -0.13397979736328125, -0.12905311584472656, -0.12412643432617188, -0.11919975280761719, -0.1142730712890625, -0.10934638977050781, -0.10441970825195312, -0.09949302673339844, -0.09456634521484375, -0.08963966369628906, -0.08471298217773438, -0.07978630065917969, -0.074859619140625, -0.06993293762207031, -0.06500625610351562, -0.06007957458496094, -0.05515289306640625, -0.05022621154785156, -0.045299530029296875, -0.04037284851074219, -0.0354461669921875, -0.030519485473632812, -0.025592803955078125, -0.020666122436523438, -0.01573944091796875, -0.010812759399414062, -0.005886077880859375, -0.0009593963623046875, 0.00396728515625, 0.008893966674804688, 0.013820648193359375, 0.018747329711914062, 0.02367401123046875, 0.028600692749023438, 0.033527374267578125, 0.03845405578613281, 0.0433807373046875, 0.04830741882324219, 0.053234100341796875, 0.05816078186035156, 0.06308746337890625, 0.06801414489746094, 0.07294082641601562, 0.07786750793457031, 0.082794189453125, 0.08772087097167969, 0.09264755249023438, 0.09757423400878906, 0.10250091552734375, 0.10742759704589844, 0.11235427856445312, 0.11728096008300781, 0.1222076416015625, 0.1271343231201172, 0.13206100463867188, 0.13698768615722656, 0.14191436767578125, 0.14684104919433594, 0.15176773071289062, 0.1566944122314453, 0.16162109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 15.0, 13.0, 15.0, 27.0, 29.0, 42.0, 24.0, 38.0, 48.0, 43.0, 58.0, 64.0, 61.0, 54.0, 53.0, 61.0, 58.0, 47.0, 44.0, 30.0, 24.0, 22.0, 25.0, 16.0, 20.0, 13.0, 6.0, 14.0, 8.0, 5.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.875396728515625, -1.81719970703125, -1.759002685546875, -1.7008056640625, -1.642608642578125, -1.58441162109375, -1.526214599609375, -1.468017578125, -1.409820556640625, -1.35162353515625, -1.293426513671875, -1.2352294921875, -1.177032470703125, -1.11883544921875, -1.060638427734375, -1.00244140625, -0.944244384765625, -0.88604736328125, -0.827850341796875, -0.7696533203125, -0.711456298828125, -0.65325927734375, -0.595062255859375, -0.536865234375, -0.478668212890625, -0.42047119140625, -0.362274169921875, -0.3040771484375, -0.245880126953125, -0.18768310546875, -0.129486083984375, -0.0712890625, -0.013092041015625, 0.04510498046875, 0.103302001953125, 0.1614990234375, 0.219696044921875, 0.27789306640625, 0.336090087890625, 0.394287109375, 0.452484130859375, 0.51068115234375, 0.568878173828125, 0.6270751953125, 0.685272216796875, 0.74346923828125, 0.801666259765625, 0.85986328125, 0.918060302734375, 0.97625732421875, 1.034454345703125, 1.0926513671875, 1.150848388671875, 1.20904541015625, 1.267242431640625, 1.325439453125, 1.383636474609375, 1.44183349609375, 1.500030517578125, 1.5582275390625, 1.616424560546875, 1.67462158203125, 1.732818603515625, 1.791015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 7.0, 12.0, 22.0, 40.0, 54.0, 60.0, 110.0, 166.0, 260.0, 499.0, 941.0, 1729.0, 3774.0, 8849.0, 23578.0, 73514.0, 242579.0, 417381.0, 186681.0, 55700.0, 18755.0, 7208.0, 3199.0, 1503.0, 766.0, 448.0, 250.0, 149.0, 101.0, 60.0, 41.0, 30.0, 19.0, 14.0, 13.0, 4.0, 5.0, 5.0, 1.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06231689453125, -0.06033134460449219, -0.058345794677734375, -0.05636024475097656, -0.05437469482421875, -0.05238914489746094, -0.050403594970703125, -0.04841804504394531, -0.0464324951171875, -0.04444694519042969, -0.042461395263671875, -0.04047584533691406, -0.03849029541015625, -0.03650474548339844, -0.034519195556640625, -0.03253364562988281, -0.030548095703125, -0.028562545776367188, -0.026576995849609375, -0.024591445922851562, -0.02260589599609375, -0.020620346069335938, -0.018634796142578125, -0.016649246215820312, -0.0146636962890625, -0.012678146362304688, -0.010692596435546875, -0.008707046508789062, -0.00672149658203125, -0.0047359466552734375, -0.002750396728515625, -0.0007648468017578125, 0.001220703125, 0.0032062530517578125, 0.005191802978515625, 0.0071773529052734375, 0.00916290283203125, 0.011148452758789062, 0.013134002685546875, 0.015119552612304688, 0.0171051025390625, 0.019090652465820312, 0.021076202392578125, 0.023061752319335938, 0.02504730224609375, 0.027032852172851562, 0.029018402099609375, 0.031003952026367188, 0.032989501953125, 0.03497505187988281, 0.036960601806640625, 0.03894615173339844, 0.04093170166015625, 0.04291725158691406, 0.044902801513671875, 0.04688835144042969, 0.0488739013671875, 0.05085945129394531, 0.052845001220703125, 0.05483055114746094, 0.05681610107421875, 0.05880165100097656, 0.060787200927734375, 0.06277275085449219, 0.06475830078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 2.0, 6.0, 7.0, 12.0, 14.0, 16.0, 24.0, 31.0, 48.0, 54.0, 55.0, 75.0, 86.0, 91.0, 96.0, 76.0, 82.0, 61.0, 30.0, 41.0, 14.0, 14.0, 7.0, 9.0, 12.0, 5.0, 6.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8252601623535156e-05, -2.7004629373550415e-05, -2.5756657123565674e-05, -2.4508684873580933e-05, -2.326071262359619e-05, -2.201274037361145e-05, -2.076476812362671e-05, -1.9516795873641968e-05, -1.8268823623657227e-05, -1.7020851373672485e-05, -1.5772879123687744e-05, -1.4524906873703003e-05, -1.3276934623718262e-05, -1.202896237373352e-05, -1.078099012374878e-05, -9.533017873764038e-06, -8.285045623779297e-06, -7.037073373794556e-06, -5.7891011238098145e-06, -4.541128873825073e-06, -3.293156623840332e-06, -2.045184373855591e-06, -7.972121238708496e-07, 4.507601261138916e-07, 1.6987323760986328e-06, 2.946704626083374e-06, 4.194676876068115e-06, 5.4426491260528564e-06, 6.690621376037598e-06, 7.938593626022339e-06, 9.18656587600708e-06, 1.0434538125991821e-05, 1.1682510375976562e-05, 1.2930482625961304e-05, 1.4178454875946045e-05, 1.5426427125930786e-05, 1.6674399375915527e-05, 1.792237162590027e-05, 1.917034387588501e-05, 2.041831612586975e-05, 2.1666288375854492e-05, 2.2914260625839233e-05, 2.4162232875823975e-05, 2.5410205125808716e-05, 2.6658177375793457e-05, 2.7906149625778198e-05, 2.915412187576294e-05, 3.040209412574768e-05, 3.165006637573242e-05, 3.289803862571716e-05, 3.4146010875701904e-05, 3.5393983125686646e-05, 3.664195537567139e-05, 3.788992762565613e-05, 3.913789987564087e-05, 4.038587212562561e-05, 4.163384437561035e-05, 4.288181662559509e-05, 4.4129788875579834e-05, 4.5377761125564575e-05, 4.6625733375549316e-05, 4.787370562553406e-05, 4.91216778755188e-05, 5.036965012550354e-05, 5.161762237548828e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 7.0, 14.0, 29.0, 36.0, 60.0, 99.0, 164.0, 272.0, 459.0, 1032.0, 2122.0, 5023.0, 13332.0, 38877.0, 126587.0, 364841.0, 332903.0, 109368.0, 33380.0, 11505.0, 4493.0, 1859.0, 894.0, 483.0, 280.0, 173.0, 78.0, 39.0, 25.0, 31.0, 14.0, 16.0, 7.0, 10.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061553955078125, -0.05942678451538086, -0.05729961395263672, -0.05517244338989258, -0.05304527282714844, -0.0509181022644043, -0.048790931701660156, -0.046663761138916016, -0.044536590576171875, -0.042409420013427734, -0.040282249450683594, -0.03815507888793945, -0.03602790832519531, -0.03390073776245117, -0.03177356719970703, -0.02964639663696289, -0.02751922607421875, -0.02539205551147461, -0.02326488494873047, -0.021137714385986328, -0.019010543823242188, -0.016883373260498047, -0.014756202697753906, -0.012629032135009766, -0.010501861572265625, -0.008374691009521484, -0.006247520446777344, -0.004120349884033203, -0.0019931793212890625, 0.00013399124145507812, 0.0022611618041992188, 0.004388332366943359, 0.0065155029296875, 0.00864267349243164, 0.010769844055175781, 0.012897014617919922, 0.015024185180664062, 0.017151355743408203, 0.019278526306152344, 0.021405696868896484, 0.023532867431640625, 0.025660037994384766, 0.027787208557128906, 0.029914379119873047, 0.03204154968261719, 0.03416872024536133, 0.03629589080810547, 0.03842306137084961, 0.04055023193359375, 0.04267740249633789, 0.04480457305908203, 0.04693174362182617, 0.04905891418457031, 0.05118608474731445, 0.053313255310058594, 0.055440425872802734, 0.057567596435546875, 0.059694766998291016, 0.061821937561035156, 0.0639491081237793, 0.06607627868652344, 0.06820344924926758, 0.07033061981201172, 0.07245779037475586, 0.0745849609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 12.0, 15.0, 11.0, 12.0, 23.0, 23.0, 18.0, 29.0, 40.0, 44.0, 51.0, 55.0, 42.0, 66.0, 57.0, 54.0, 66.0, 58.0, 54.0, 54.0, 40.0, 37.0, 26.0, 24.0, 18.0, 14.0, 17.0, 4.0, 13.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0203094482421875, -0.019755244255065918, -0.019201040267944336, -0.018646836280822754, -0.018092632293701172, -0.01753842830657959, -0.016984224319458008, -0.016430020332336426, -0.015875816345214844, -0.015321612358093262, -0.01476740837097168, -0.014213204383850098, -0.013659000396728516, -0.013104796409606934, -0.012550592422485352, -0.01199638843536377, -0.011442184448242188, -0.010887980461120605, -0.010333776473999023, -0.009779572486877441, -0.00922536849975586, -0.008671164512634277, -0.008116960525512695, -0.007562756538391113, -0.007008552551269531, -0.006454348564147949, -0.005900144577026367, -0.005345940589904785, -0.004791736602783203, -0.004237532615661621, -0.003683328628540039, -0.003129124641418457, -0.002574920654296875, -0.002020716667175293, -0.001466512680053711, -0.0009123086929321289, -0.0003581047058105469, 0.00019609928131103516, 0.0007503032684326172, 0.0013045072555541992, 0.0018587112426757812, 0.0024129152297973633, 0.0029671192169189453, 0.0035213232040405273, 0.004075527191162109, 0.004629731178283691, 0.0051839351654052734, 0.0057381391525268555, 0.0062923431396484375, 0.0068465471267700195, 0.0074007511138916016, 0.007954955101013184, 0.008509159088134766, 0.009063363075256348, 0.00961756706237793, 0.010171771049499512, 0.010725975036621094, 0.011280179023742676, 0.011834383010864258, 0.01238858699798584, 0.012942790985107422, 0.013496994972229004, 0.014051198959350586, 0.014605402946472168, 0.01515960693359375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 11.0, 9.0, 19.0, 25.0, 21.0, 46.0, 58.0, 68.0, 94.0, 104.0, 115.0, 118.0, 85.0, 65.0, 45.0, 28.0, 23.0, 11.0, 16.0, 5.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3488291501998901, -1.305383563041687, -1.2619378566741943, -1.2184922695159912, -1.1750465631484985, -1.1316009759902954, -1.0881552696228027, -1.0447096824645996, -1.0012640953063965, -0.9578184485435486, -0.9143728017807007, -0.8709272146224976, -0.8274815082550049, -0.7840359210968018, -0.7405902743339539, -0.697144627571106, -0.6536989212036133, -0.6102532744407654, -0.5668076276779175, -0.5233620405197144, -0.47991636395454407, -0.43647071719169617, -0.39302510023117065, -0.34957945346832275, -0.30613380670547485, -0.26268815994262695, -0.21924252808094025, -0.17579689621925354, -0.13235124945640564, -0.08890560269355774, -0.04545998573303223, -0.002014338970184326, 0.041431307792663574, 0.08487694710493088, 0.12832258641719818, 0.1717682182788849, 0.2152138650417328, 0.2586595118045807, 0.3021051287651062, 0.3455507755279541, 0.388996422290802, 0.4324420690536499, 0.4758877158164978, 0.5193333625793457, 0.5627789497375488, 0.6062246561050415, 0.6496702432632446, 0.6931158900260925, 0.7365615367889404, 0.7800071835517883, 0.8234528303146362, 0.8668984174728394, 0.910344123840332, 0.9537897109985352, 0.9972353577613831, 1.040681004524231, 1.0841267108917236, 1.1275722980499268, 1.1710180044174194, 1.2144635915756226, 1.2579092979431152, 1.3013548851013184, 1.3448004722595215, 1.3882461786270142, 1.4316917657852173]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 6.0, 3.0, 9.0, 13.0, 14.0, 20.0, 10.0, 19.0, 23.0, 31.0, 24.0, 25.0, 30.0, 38.0, 38.0, 38.0, 58.0, 61.0, 49.0, 53.0, 48.0, 50.0, 41.0, 40.0, 40.0, 28.0, 31.0, 33.0, 32.0, 20.0, 14.0, 16.0, 10.0, 8.0, 4.0, 2.0, 5.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7549246549606323, -0.7283146977424622, -0.701704740524292, -0.675094723701477, -0.6484847664833069, -0.6218748092651367, -0.5952647924423218, -0.5686548352241516, -0.5420448780059814, -0.5154349207878113, -0.4888249337673187, -0.46221494674682617, -0.435604989528656, -0.40899503231048584, -0.3823850452899933, -0.35577505826950073, -0.32916510105133057, -0.3025551438331604, -0.27594515681266785, -0.2493351846933365, -0.22272521257400513, -0.19611524045467377, -0.1695052683353424, -0.14289529621601105, -0.11628532409667969, -0.08967535197734833, -0.06306537985801697, -0.03645540773868561, -0.009845435619354248, 0.016764536499977112, 0.04337450861930847, 0.06998448073863983, 0.09659439325332642, 0.12320436537265778, 0.14981433749198914, 0.1764243096113205, 0.20303428173065186, 0.22964425384998322, 0.2562542259693146, 0.28286421298980713, 0.3094741702079773, 0.33608412742614746, 0.36269411444664, 0.38930410146713257, 0.41591405868530273, 0.4425240159034729, 0.46913400292396545, 0.495743989944458, 0.5223539471626282, 0.5489639043807983, 0.5755739212036133, 0.6021838784217834, 0.6287938356399536, 0.6554037928581238, 0.682013750076294, 0.7086237668991089, 0.735233724117279, 0.7618436813354492, 0.7884536981582642, 0.8150636553764343, 0.8416736125946045, 0.8682835698127747, 0.8948935270309448, 0.9215035438537598, 0.9481135010719299]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 9.0, 5.0, 11.0, 10.0, 12.0, 30.0, 41.0, 62.0, 100.0, 221.0, 426.0, 1008.0, 3341.0, 18429.0, 329275.0, 656255.0, 32156.0, 4736.0, 1306.0, 553.0, 238.0, 128.0, 65.0, 41.0, 35.0, 15.0, 12.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.952484130859375, -1.88543701171875, -1.818389892578125, -1.7513427734375, -1.684295654296875, -1.61724853515625, -1.550201416015625, -1.483154296875, -1.416107177734375, -1.34906005859375, -1.282012939453125, -1.2149658203125, -1.147918701171875, -1.08087158203125, -1.013824462890625, -0.94677734375, -0.879730224609375, -0.81268310546875, -0.745635986328125, -0.6785888671875, -0.611541748046875, -0.54449462890625, -0.477447509765625, -0.410400390625, -0.343353271484375, -0.27630615234375, -0.209259033203125, -0.1422119140625, -0.075164794921875, -0.00811767578125, 0.058929443359375, 0.1259765625, 0.193023681640625, 0.26007080078125, 0.327117919921875, 0.3941650390625, 0.461212158203125, 0.52825927734375, 0.595306396484375, 0.662353515625, 0.729400634765625, 0.79644775390625, 0.863494873046875, 0.9305419921875, 0.997589111328125, 1.06463623046875, 1.131683349609375, 1.19873046875, 1.265777587890625, 1.33282470703125, 1.399871826171875, 1.4669189453125, 1.533966064453125, 1.60101318359375, 1.668060302734375, 1.735107421875, 1.802154541015625, 1.86920166015625, 1.936248779296875, 2.0032958984375, 2.070343017578125, 2.13739013671875, 2.204437255859375, 2.271484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 9.0, 14.0, 22.0, 35.0, 44.0, 50.0, 67.0, 98.0, 100.0, 116.0, 101.0, 98.0, 66.0, 60.0, 49.0, 22.0, 24.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.5217437744140625, -1.415557861328125, -1.3093719482421875, -1.20318603515625, -1.0970001220703125, -0.990814208984375, -0.8846282958984375, -0.7784423828125, -0.6722564697265625, -0.566070556640625, -0.4598846435546875, -0.35369873046875, -0.2475128173828125, -0.141326904296875, -0.0351409912109375, 0.071044921875, 0.1772308349609375, 0.283416748046875, 0.3896026611328125, 0.49578857421875, 0.6019744873046875, 0.708160400390625, 0.8143463134765625, 0.9205322265625, 1.0267181396484375, 1.132904052734375, 1.2390899658203125, 1.34527587890625, 1.4514617919921875, 1.557647705078125, 1.6638336181640625, 1.77001953125, 1.8762054443359375, 1.982391357421875, 2.0885772705078125, 2.19476318359375, 2.3009490966796875, 2.407135009765625, 2.5133209228515625, 2.6195068359375, 2.7256927490234375, 2.831878662109375, 2.9380645751953125, 3.04425048828125, 3.1504364013671875, 3.256622314453125, 3.3628082275390625, 3.468994140625, 3.5751800537109375, 3.681365966796875, 3.7875518798828125, 3.89373779296875, 3.9999237060546875, 4.106109619140625, 4.2122955322265625, 4.3184814453125, 4.4246673583984375, 4.530853271484375, 4.6370391845703125, 4.74322509765625, 4.8494110107421875, 4.955596923828125, 5.0617828369140625, 5.16796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 6.0, 4.0, 12.0, 7.0, 9.0, 18.0, 19.0, 34.0, 24.0, 62.0, 64.0, 75.0, 100.0, 173.0, 338.0, 924.0, 3654.0, 47879.0, 953721.0, 36531.0, 3147.0, 806.0, 313.0, 169.0, 117.0, 94.0, 59.0, 54.0, 31.0, 29.0, 14.0, 15.0, 10.0, 9.0, 8.0, 5.0, 7.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.37890625, -2.29229736328125, -2.2056884765625, -2.11907958984375, -2.032470703125, -1.94586181640625, -1.8592529296875, -1.77264404296875, -1.68603515625, -1.59942626953125, -1.5128173828125, -1.42620849609375, -1.339599609375, -1.25299072265625, -1.1663818359375, -1.07977294921875, -0.9931640625, -0.90655517578125, -0.8199462890625, -0.73333740234375, -0.646728515625, -0.56011962890625, -0.4735107421875, -0.38690185546875, -0.30029296875, -0.21368408203125, -0.1270751953125, -0.04046630859375, 0.046142578125, 0.13275146484375, 0.2193603515625, 0.30596923828125, 0.392578125, 0.47918701171875, 0.5657958984375, 0.65240478515625, 0.739013671875, 0.82562255859375, 0.9122314453125, 0.99884033203125, 1.08544921875, 1.17205810546875, 1.2586669921875, 1.34527587890625, 1.431884765625, 1.51849365234375, 1.6051025390625, 1.69171142578125, 1.7783203125, 1.86492919921875, 1.9515380859375, 2.03814697265625, 2.124755859375, 2.21136474609375, 2.2979736328125, 2.38458251953125, 2.47119140625, 2.55780029296875, 2.6444091796875, 2.73101806640625, 2.817626953125, 2.90423583984375, 2.9908447265625, 3.07745361328125, 3.1640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 7.0, 10.0, 11.0, 14.0, 15.0, 9.0, 15.0, 14.0, 16.0, 33.0, 25.0, 24.0, 29.0, 33.0, 41.0, 37.0, 38.0, 41.0, 46.0, 44.0, 35.0, 37.0, 40.0, 39.0, 43.0, 36.0, 31.0, 24.0, 31.0, 17.0, 26.0, 18.0, 19.0, 13.0, 19.0, 13.0, 7.0, 6.0, 5.0, 4.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.533203125, -1.489593505859375, -1.44598388671875, -1.402374267578125, -1.3587646484375, -1.315155029296875, -1.27154541015625, -1.227935791015625, -1.184326171875, -1.140716552734375, -1.09710693359375, -1.053497314453125, -1.0098876953125, -0.966278076171875, -0.92266845703125, -0.879058837890625, -0.83544921875, -0.791839599609375, -0.74822998046875, -0.704620361328125, -0.6610107421875, -0.617401123046875, -0.57379150390625, -0.530181884765625, -0.486572265625, -0.442962646484375, -0.39935302734375, -0.355743408203125, -0.3121337890625, -0.268524169921875, -0.22491455078125, -0.181304931640625, -0.1376953125, -0.094085693359375, -0.05047607421875, -0.006866455078125, 0.0367431640625, 0.080352783203125, 0.12396240234375, 0.167572021484375, 0.211181640625, 0.254791259765625, 0.29840087890625, 0.342010498046875, 0.3856201171875, 0.429229736328125, 0.47283935546875, 0.516448974609375, 0.56005859375, 0.603668212890625, 0.64727783203125, 0.690887451171875, 0.7344970703125, 0.778106689453125, 0.82171630859375, 0.865325927734375, 0.908935546875, 0.952545166015625, 0.99615478515625, 1.039764404296875, 1.0833740234375, 1.126983642578125, 1.17059326171875, 1.214202880859375, 1.2578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 6.0, 14.0, 20.0, 31.0, 59.0, 64.0, 137.0, 250.0, 518.0, 1064.0, 3280.0, 18147.0, 816157.0, 195840.0, 9105.0, 2143.0, 812.0, 365.0, 198.0, 112.0, 80.0, 44.0, 31.0, 19.0, 14.0, 10.0, 5.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0384368896484375, -1.003631591796875, -0.9688262939453125, -0.93402099609375, -0.8992156982421875, -0.864410400390625, -0.8296051025390625, -0.7947998046875, -0.7599945068359375, -0.725189208984375, -0.6903839111328125, -0.65557861328125, -0.6207733154296875, -0.585968017578125, -0.5511627197265625, -0.516357421875, -0.4815521240234375, -0.446746826171875, -0.4119415283203125, -0.37713623046875, -0.3423309326171875, -0.307525634765625, -0.2727203369140625, -0.2379150390625, -0.2031097412109375, -0.168304443359375, -0.1334991455078125, -0.09869384765625, -0.0638885498046875, -0.029083251953125, 0.0057220458984375, 0.04052734375, 0.0753326416015625, 0.110137939453125, 0.1449432373046875, 0.17974853515625, 0.2145538330078125, 0.249359130859375, 0.2841644287109375, 0.3189697265625, 0.3537750244140625, 0.388580322265625, 0.4233856201171875, 0.45819091796875, 0.4929962158203125, 0.527801513671875, 0.5626068115234375, 0.597412109375, 0.6322174072265625, 0.667022705078125, 0.7018280029296875, 0.73663330078125, 0.7714385986328125, 0.806243896484375, 0.8410491943359375, 0.8758544921875, 0.9106597900390625, 0.945465087890625, 0.9802703857421875, 1.01507568359375, 1.0498809814453125, 1.084686279296875, 1.1194915771484375, 1.154296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 10.0, 11.0, 21.0, 22.0, 43.0, 66.0, 119.0, 235.0, 206.0, 108.0, 58.0, 31.0, 18.0, 16.0, 13.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.296966552734375e-05, -7.933378219604492e-05, -7.56978988647461e-05, -7.206201553344727e-05, -6.842613220214844e-05, -6.479024887084961e-05, -6.115436553955078e-05, -5.751848220825195e-05, -5.3882598876953125e-05, -5.02467155456543e-05, -4.661083221435547e-05, -4.297494888305664e-05, -3.933906555175781e-05, -3.5703182220458984e-05, -3.2067298889160156e-05, -2.8431415557861328e-05, -2.47955322265625e-05, -2.1159648895263672e-05, -1.7523765563964844e-05, -1.3887882232666016e-05, -1.0251998901367188e-05, -6.616115570068359e-06, -2.9802322387695312e-06, 6.556510925292969e-07, 4.291534423828125e-06, 7.927417755126953e-06, 1.1563301086425781e-05, 1.519918441772461e-05, 1.8835067749023438e-05, 2.2470951080322266e-05, 2.6106834411621094e-05, 2.9742717742919922e-05, 3.337860107421875e-05, 3.701448440551758e-05, 4.0650367736816406e-05, 4.4286251068115234e-05, 4.792213439941406e-05, 5.155801773071289e-05, 5.519390106201172e-05, 5.882978439331055e-05, 6.246566772460938e-05, 6.61015510559082e-05, 6.973743438720703e-05, 7.337331771850586e-05, 7.700920104980469e-05, 8.064508438110352e-05, 8.428096771240234e-05, 8.791685104370117e-05, 9.1552734375e-05, 9.518861770629883e-05, 9.882450103759766e-05, 0.00010246038436889648, 0.00010609626770019531, 0.00010973215103149414, 0.00011336803436279297, 0.0001170039176940918, 0.00012063980102539062, 0.00012427568435668945, 0.00012791156768798828, 0.0001315474510192871, 0.00013518333435058594, 0.00013881921768188477, 0.0001424551010131836, 0.00014609098434448242, 0.00014972686767578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 14.0, 16.0, 30.0, 43.0, 73.0, 87.0, 160.0, 314.0, 556.0, 1075.0, 2239.0, 5790.0, 35311.0, 910913.0, 78781.0, 7666.0, 2708.0, 1298.0, 652.0, 345.0, 209.0, 89.0, 71.0, 33.0, 21.0, 15.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1728515625, -1.13897705078125, -1.1051025390625, -1.07122802734375, -1.037353515625, -1.00347900390625, -0.9696044921875, -0.93572998046875, -0.90185546875, -0.86798095703125, -0.8341064453125, -0.80023193359375, -0.766357421875, -0.73248291015625, -0.6986083984375, -0.66473388671875, -0.630859375, -0.59698486328125, -0.5631103515625, -0.52923583984375, -0.495361328125, -0.46148681640625, -0.4276123046875, -0.39373779296875, -0.35986328125, -0.32598876953125, -0.2921142578125, -0.25823974609375, -0.224365234375, -0.19049072265625, -0.1566162109375, -0.12274169921875, -0.0888671875, -0.05499267578125, -0.0211181640625, 0.01275634765625, 0.046630859375, 0.08050537109375, 0.1143798828125, 0.14825439453125, 0.18212890625, 0.21600341796875, 0.2498779296875, 0.28375244140625, 0.317626953125, 0.35150146484375, 0.3853759765625, 0.41925048828125, 0.453125, 0.48699951171875, 0.5208740234375, 0.55474853515625, 0.588623046875, 0.62249755859375, 0.6563720703125, 0.69024658203125, 0.72412109375, 0.75799560546875, 0.7918701171875, 0.82574462890625, 0.859619140625, 0.89349365234375, 0.9273681640625, 0.96124267578125, 0.9951171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 7.0, 3.0, 16.0, 18.0, 37.0, 51.0, 111.0, 186.0, 261.0, 123.0, 85.0, 32.0, 22.0, 13.0, 11.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3423042297363281, -0.33060455322265625, -0.3189048767089844, -0.3072052001953125, -0.2955055236816406, -0.28380584716796875, -0.2721061706542969, -0.260406494140625, -0.24870681762695312, -0.23700714111328125, -0.22530746459960938, -0.2136077880859375, -0.20190811157226562, -0.19020843505859375, -0.17850875854492188, -0.16680908203125, -0.15510940551757812, -0.14340972900390625, -0.13171005249023438, -0.1200103759765625, -0.10831069946289062, -0.09661102294921875, -0.08491134643554688, -0.073211669921875, -0.061511993408203125, -0.04981231689453125, -0.038112640380859375, -0.0264129638671875, -0.014713287353515625, -0.00301361083984375, 0.008686065673828125, 0.0203857421875, 0.032085418701171875, 0.04378509521484375, 0.055484771728515625, 0.0671844482421875, 0.07888412475585938, 0.09058380126953125, 0.10228347778320312, 0.113983154296875, 0.12568283081054688, 0.13738250732421875, 0.14908218383789062, 0.1607818603515625, 0.17248153686523438, 0.18418121337890625, 0.19588088989257812, 0.20758056640625, 0.21928024291992188, 0.23097991943359375, 0.24267959594726562, 0.2543792724609375, 0.2660789489746094, 0.27777862548828125, 0.2894783020019531, 0.301177978515625, 0.3128776550292969, 0.32457733154296875, 0.3362770080566406, 0.3479766845703125, 0.3596763610839844, 0.37137603759765625, 0.3830757141113281, 0.394775390625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 0.0, 6.0, 7.0, 19.0, 28.0, 42.0, 91.0, 149.0, 220.0, 166.0, 131.0, 66.0, 33.0, 23.0, 15.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.153860569000244, -1.9843436479568481, -1.8148267269134521, -1.6453098058700562, -1.4757928848266602, -1.3062759637832642, -1.1367590427398682, -0.9672421216964722, -0.7977252006530762, -0.6282082796096802, -0.4586913585662842, -0.2891744375228882, -0.11965751647949219, 0.04985940456390381, 0.2193763256072998, 0.3888932466506958, 0.5584101676940918, 0.7279270887374878, 0.8974440097808838, 1.0669609308242798, 1.2364778518676758, 1.4059947729110718, 1.5755116939544678, 1.7450286149978638, 1.9145455360412598, 2.0840625762939453, 2.2535793781280518, 2.423096179962158, 2.5926132202148438, 2.7621302604675293, 2.9316470623016357, 3.101163864135742, 3.2706804275512695, 3.440197467803955, 3.6097142696380615, 3.779231071472168, 3.9487481117248535, 4.118265151977539, 4.287781715393066, 4.457298755645752, 4.6268157958984375, 4.796332836151123, 4.965849876403809, 5.135366439819336, 5.3048834800720215, 5.474400520324707, 5.643917083740234, 5.81343412399292, 5.9829511642456055, 6.152468204498291, 6.321985244750977, 6.491501808166504, 6.6610188484191895, 6.830535888671875, 7.000052452087402, 7.169569492340088, 7.339086532592773, 7.508603572845459, 7.6781206130981445, 7.847637176513672, 8.017154693603516, 8.186671257019043, 8.35618782043457, 8.525705337524414, 8.695221900939941]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 9.0, 13.0, 12.0, 10.0, 16.0, 19.0, 26.0, 19.0, 33.0, 45.0, 52.0, 66.0, 52.0, 74.0, 53.0, 58.0, 56.0, 61.0, 53.0, 52.0, 40.0, 40.0, 30.0, 26.0, 24.0, 22.0, 18.0, 8.0, 3.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6188249588012695, -2.5003929138183594, -2.3819611072540283, -2.263529062271118, -2.145097017288208, -2.026665210723877, -1.9082331657409668, -1.7898011207580566, -1.6713690757751465, -1.5529371500015259, -1.4345051050186157, -1.3160731792449951, -1.197641134262085, -1.0792092084884644, -0.960777223110199, -0.8423452377319336, -0.723913311958313, -0.6054813265800476, -0.4870493412017822, -0.36861738562583923, -0.25018540024757385, -0.13175344467163086, -0.013321459293365479, 0.1051105260848999, 0.22354251146316528, 0.34197449684143066, 0.46040648221969604, 0.5788384675979614, 0.697270393371582, 0.8157023787498474, 0.9341343641281128, 1.0525662899017334, 1.1709983348846436, 1.2894302606582642, 1.4078623056411743, 1.526294231414795, 1.644726276397705, 1.7631582021713257, 1.8815901279449463, 2.0000221729278564, 2.1184542179107666, 2.2368862628936768, 2.355318069458008, 2.473750114440918, 2.592182159423828, 2.7106142044067383, 2.8290460109710693, 2.9474780559539795, 3.0659098625183105, 3.1843419075012207, 3.3027737140655518, 3.421205759048462, 3.539637804031372, 3.658069610595703, 3.7765016555786133, 3.8949337005615234, 4.013365745544434, 4.131797790527344, 4.250229835510254, 4.368661880493164, 4.487093448638916, 4.605525493621826, 4.723957538604736, 4.8423895835876465, 4.960821628570557]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 9.0, 9.0, 21.0, 31.0, 49.0, 75.0, 118.0, 302.0, 764.0, 3711.0, 294453.0, 3875978.0, 16500.0, 1461.0, 427.0, 149.0, 100.0, 41.0, 31.0, 17.0, 12.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.86492919921875, -4.6556396484375, -4.44635009765625, -4.237060546875, -4.02777099609375, -3.8184814453125, -3.60919189453125, -3.39990234375, -3.19061279296875, -2.9813232421875, -2.77203369140625, -2.562744140625, -2.35345458984375, -2.1441650390625, -1.93487548828125, -1.7255859375, -1.51629638671875, -1.3070068359375, -1.09771728515625, -0.888427734375, -0.67913818359375, -0.4698486328125, -0.26055908203125, -0.05126953125, 0.15802001953125, 0.3673095703125, 0.57659912109375, 0.785888671875, 0.99517822265625, 1.2044677734375, 1.41375732421875, 1.623046875, 1.83233642578125, 2.0416259765625, 2.25091552734375, 2.460205078125, 2.66949462890625, 2.8787841796875, 3.08807373046875, 3.29736328125, 3.50665283203125, 3.7159423828125, 3.92523193359375, 4.134521484375, 4.34381103515625, 4.5531005859375, 4.76239013671875, 4.9716796875, 5.18096923828125, 5.3902587890625, 5.59954833984375, 5.808837890625, 6.01812744140625, 6.2274169921875, 6.43670654296875, 6.64599609375, 6.85528564453125, 7.0645751953125, 7.27386474609375, 7.483154296875, 7.69244384765625, 7.9017333984375, 8.11102294921875, 8.3203125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 11.0, 7.0, 5.0, 9.0, 12.0, 19.0, 21.0, 22.0, 28.0, 22.0, 38.0, 48.0, 44.0, 37.0, 48.0, 46.0, 54.0, 55.0, 54.0, 64.0, 39.0, 47.0, 44.0, 32.0, 35.0, 29.0, 18.0, 24.0, 21.0, 11.0, 14.0, 6.0, 11.0, 3.0, 7.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.365234375, -1.3252105712890625, -1.285186767578125, -1.2451629638671875, -1.20513916015625, -1.1651153564453125, -1.125091552734375, -1.0850677490234375, -1.0450439453125, -1.0050201416015625, -0.964996337890625, -0.9249725341796875, -0.88494873046875, -0.8449249267578125, -0.804901123046875, -0.7648773193359375, -0.724853515625, -0.6848297119140625, -0.644805908203125, -0.6047821044921875, -0.56475830078125, -0.5247344970703125, -0.484710693359375, -0.4446868896484375, -0.4046630859375, -0.3646392822265625, -0.324615478515625, -0.2845916748046875, -0.24456787109375, -0.2045440673828125, -0.164520263671875, -0.1244964599609375, -0.08447265625, -0.0444488525390625, -0.004425048828125, 0.0355987548828125, 0.07562255859375, 0.1156463623046875, 0.155670166015625, 0.1956939697265625, 0.2357177734375, 0.2757415771484375, 0.315765380859375, 0.3557891845703125, 0.39581298828125, 0.4358367919921875, 0.475860595703125, 0.5158843994140625, 0.555908203125, 0.5959320068359375, 0.635955810546875, 0.6759796142578125, 0.71600341796875, 0.7560272216796875, 0.796051025390625, 0.8360748291015625, 0.8760986328125, 0.9161224365234375, 0.956146240234375, 0.9961700439453125, 1.03619384765625, 1.0762176513671875, 1.116241455078125, 1.1562652587890625, 1.1962890625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 7.0, 12.0, 31.0, 75.0, 151.0, 337.0, 1037.0, 3354.0, 24171.0, 3665836.0, 485726.0, 10296.0, 2104.0, 662.0, 268.0, 95.0, 57.0, 30.0, 15.0, 9.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -2.99163818359375, -2.8660888671875, -2.74053955078125, -2.614990234375, -2.48944091796875, -2.3638916015625, -2.23834228515625, -2.11279296875, -1.98724365234375, -1.8616943359375, -1.73614501953125, -1.610595703125, -1.48504638671875, -1.3594970703125, -1.23394775390625, -1.1083984375, -0.98284912109375, -0.8572998046875, -0.73175048828125, -0.606201171875, -0.48065185546875, -0.3551025390625, -0.22955322265625, -0.10400390625, 0.02154541015625, 0.1470947265625, 0.27264404296875, 0.398193359375, 0.52374267578125, 0.6492919921875, 0.77484130859375, 0.900390625, 1.02593994140625, 1.1514892578125, 1.27703857421875, 1.402587890625, 1.52813720703125, 1.6536865234375, 1.77923583984375, 1.90478515625, 2.03033447265625, 2.1558837890625, 2.28143310546875, 2.406982421875, 2.53253173828125, 2.6580810546875, 2.78363037109375, 2.9091796875, 3.03472900390625, 3.1602783203125, 3.28582763671875, 3.411376953125, 3.53692626953125, 3.6624755859375, 3.78802490234375, 3.91357421875, 4.03912353515625, 4.1646728515625, 4.29022216796875, 4.415771484375, 4.54132080078125, 4.6668701171875, 4.79241943359375, 4.91796875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 13.0, 29.0, 43.0, 75.0, 140.0, 264.0, 516.0, 1021.0, 938.0, 497.0, 232.0, 121.0, 69.0, 38.0, 16.0, 10.0, 15.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84228515625, -0.8188247680664062, -0.7953643798828125, -0.7719039916992188, -0.748443603515625, -0.7249832153320312, -0.7015228271484375, -0.6780624389648438, -0.65460205078125, -0.6311416625976562, -0.6076812744140625, -0.5842208862304688, -0.560760498046875, -0.5373001098632812, -0.5138397216796875, -0.49037933349609375, -0.4669189453125, -0.44345855712890625, -0.4199981689453125, -0.39653778076171875, -0.373077392578125, -0.34961700439453125, -0.3261566162109375, -0.30269622802734375, -0.27923583984375, -0.25577545166015625, -0.2323150634765625, -0.20885467529296875, -0.185394287109375, -0.16193389892578125, -0.1384735107421875, -0.11501312255859375, -0.091552734375, -0.06809234619140625, -0.0446319580078125, -0.02117156982421875, 0.002288818359375, 0.02574920654296875, 0.0492095947265625, 0.07266998291015625, 0.09613037109375, 0.11959075927734375, 0.1430511474609375, 0.16651153564453125, 0.189971923828125, 0.21343231201171875, 0.2368927001953125, 0.26035308837890625, 0.2838134765625, 0.30727386474609375, 0.3307342529296875, 0.35419464111328125, 0.377655029296875, 0.40111541748046875, 0.4245758056640625, 0.44803619384765625, 0.47149658203125, 0.49495697021484375, 0.5184173583984375, 0.5418777465820312, 0.565338134765625, 0.5887985229492188, 0.6122589111328125, 0.6357192993164062, 0.6591796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 7.0, 11.0, 4.0, 9.0, 7.0, 20.0, 22.0, 38.0, 20.0, 53.0, 59.0, 84.0, 85.0, 110.0, 95.0, 80.0, 73.0, 61.0, 38.0, 36.0, 17.0, 17.0, 15.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8231909275054932, -1.763755202293396, -1.7043195962905884, -1.6448838710784912, -1.5854482650756836, -1.5260125398635864, -1.4665768146514893, -1.4071412086486816, -1.347705602645874, -1.2882698774337769, -1.2288342714309692, -1.169398546218872, -1.1099629402160645, -1.0505272150039673, -0.9910915493965149, -0.9316558837890625, -0.8722201585769653, -0.8127844929695129, -0.7533488273620605, -0.6939131021499634, -0.6344774961471558, -0.5750417709350586, -0.5156061053276062, -0.4561704397201538, -0.3967347741127014, -0.337299108505249, -0.27786344289779663, -0.21842774748802185, -0.15899208188056946, -0.09955641627311707, -0.040120720863342285, 0.019314944744110107, 0.0787506103515625, 0.1381862759590149, 0.19762195646762848, 0.25705763697624207, 0.31649330258369446, 0.37592896819114685, 0.43536466360092163, 0.494800329208374, 0.5542359948158264, 0.6136716604232788, 0.6731073260307312, 0.7325429916381836, 0.7919787168502808, 0.8514143228530884, 0.9108500480651855, 0.9702857136726379, 1.0297213792800903, 1.0891571044921875, 1.1485927104949951, 1.2080284357070923, 1.2674640417099, 1.326899766921997, 1.3863353729248047, 1.4457710981369019, 1.505206823348999, 1.5646425485610962, 1.6240781545639038, 1.683513879776001, 1.7429494857788086, 1.8023852109909058, 1.861820936203003, 1.9212565422058105, 1.9806921482086182]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 10.0, 4.0, 9.0, 17.0, 19.0, 13.0, 13.0, 24.0, 16.0, 23.0, 32.0, 28.0, 34.0, 34.0, 49.0, 50.0, 40.0, 47.0, 44.0, 48.0, 35.0, 52.0, 38.0, 26.0, 45.0, 29.0, 28.0, 26.0, 27.0, 24.0, 18.0, 17.0, 12.0, 10.0, 9.0, 6.0, 9.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.2771055698394775, -1.2403209209442139, -1.2035361528396606, -1.166751503944397, -1.1299667358398438, -1.09318208694458, -1.0563974380493164, -1.0196127891540527, -0.9828280210494995, -0.9460433125495911, -0.9092586040496826, -0.872473955154419, -0.8356892466545105, -0.798904538154602, -0.7621198892593384, -0.7253351807594299, -0.6885504722595215, -0.651765763759613, -0.6149810552597046, -0.5781964063644409, -0.5414116978645325, -0.504626989364624, -0.46784231066703796, -0.4310576319694519, -0.39427292346954346, -0.357488214969635, -0.32070353627204895, -0.2839188575744629, -0.24713414907455444, -0.2103494554758072, -0.17356476187705994, -0.13678008317947388, -0.09999525547027588, -0.06321056187152863, -0.026425868272781372, 0.010358825325965881, 0.047143518924713135, 0.08392821252346039, 0.12071290612220764, 0.1574975848197937, 0.19428229331970215, 0.2310669869184494, 0.26785168051719666, 0.3046363592147827, 0.34142106771469116, 0.3782057762145996, 0.41499045491218567, 0.45177513360977173, 0.4885598421096802, 0.5253445506095886, 0.5621292591094971, 0.5989139080047607, 0.6356986165046692, 0.6724833250045776, 0.7092679738998413, 0.7460526823997498, 0.7828373908996582, 0.8196220993995667, 0.8564068078994751, 0.8931914567947388, 0.9299761652946472, 0.9667608737945557, 1.0035455226898193, 1.040330171585083, 1.0771149396896362]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 10.0, 7.0, 16.0, 52.0, 123.0, 344.0, 1461.0, 10214.0, 154159.0, 833900.0, 42747.0, 4411.0, 740.0, 207.0, 81.0, 29.0, 16.0, 3.0, 12.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.590850830078125, -0.56549072265625, -0.540130615234375, -0.5147705078125, -0.489410400390625, -0.46405029296875, -0.438690185546875, -0.413330078125, -0.387969970703125, -0.36260986328125, -0.337249755859375, -0.3118896484375, -0.286529541015625, -0.26116943359375, -0.235809326171875, -0.21044921875, -0.185089111328125, -0.15972900390625, -0.134368896484375, -0.1090087890625, -0.083648681640625, -0.05828857421875, -0.032928466796875, -0.007568359375, 0.017791748046875, 0.04315185546875, 0.068511962890625, 0.0938720703125, 0.119232177734375, 0.14459228515625, 0.169952392578125, 0.1953125, 0.220672607421875, 0.24603271484375, 0.271392822265625, 0.2967529296875, 0.322113037109375, 0.34747314453125, 0.372833251953125, 0.398193359375, 0.423553466796875, 0.44891357421875, 0.474273681640625, 0.4996337890625, 0.524993896484375, 0.55035400390625, 0.575714111328125, 0.60107421875, 0.626434326171875, 0.65179443359375, 0.677154541015625, 0.7025146484375, 0.727874755859375, 0.75323486328125, 0.778594970703125, 0.803955078125, 0.829315185546875, 0.85467529296875, 0.880035400390625, 0.9053955078125, 0.930755615234375, 0.95611572265625, 0.981475830078125, 1.0068359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 8.0, 12.0, 15.0, 13.0, 16.0, 19.0, 29.0, 29.0, 36.0, 44.0, 60.0, 59.0, 58.0, 67.0, 74.0, 69.0, 71.0, 44.0, 60.0, 43.0, 34.0, 37.0, 17.0, 22.0, 9.0, 9.0, 11.0, 8.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.8831634521484375, -0.846405029296875, -0.8096466064453125, -0.77288818359375, -0.7361297607421875, -0.699371337890625, -0.6626129150390625, -0.6258544921875, -0.5890960693359375, -0.552337646484375, -0.5155792236328125, -0.47882080078125, -0.4420623779296875, -0.405303955078125, -0.3685455322265625, -0.331787109375, -0.2950286865234375, -0.258270263671875, -0.2215118408203125, -0.18475341796875, -0.1479949951171875, -0.111236572265625, -0.0744781494140625, -0.0377197265625, -0.0009613037109375, 0.035797119140625, 0.0725555419921875, 0.10931396484375, 0.1460723876953125, 0.182830810546875, 0.2195892333984375, 0.25634765625, 0.2931060791015625, 0.329864501953125, 0.3666229248046875, 0.40338134765625, 0.4401397705078125, 0.476898193359375, 0.5136566162109375, 0.5504150390625, 0.5871734619140625, 0.623931884765625, 0.6606903076171875, 0.69744873046875, 0.7342071533203125, 0.770965576171875, 0.8077239990234375, 0.844482421875, 0.8812408447265625, 0.917999267578125, 0.9547576904296875, 0.99151611328125, 1.0282745361328125, 1.065032958984375, 1.1017913818359375, 1.1385498046875, 1.1753082275390625, 1.212066650390625, 1.2488250732421875, 1.28558349609375, 1.3223419189453125, 1.359100341796875, 1.3958587646484375, 1.4326171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 10.0, 13.0, 16.0, 19.0, 35.0, 61.0, 105.0, 154.0, 261.0, 488.0, 882.0, 1728.0, 3423.0, 7999.0, 19785.0, 57524.0, 208773.0, 462509.0, 195696.0, 55228.0, 19196.0, 7630.0, 3332.0, 1646.0, 853.0, 470.0, 266.0, 150.0, 114.0, 65.0, 46.0, 19.0, 19.0, 16.0, 9.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213623046875, -0.20611953735351562, -0.19861602783203125, -0.19111251831054688, -0.1836090087890625, -0.17610549926757812, -0.16860198974609375, -0.16109848022460938, -0.153594970703125, -0.14609146118164062, -0.13858795166015625, -0.13108444213867188, -0.1235809326171875, -0.11607742309570312, -0.10857391357421875, -0.10107040405273438, -0.09356689453125, -0.08606338500976562, -0.07855987548828125, -0.07105636596679688, -0.0635528564453125, -0.056049346923828125, -0.04854583740234375, -0.041042327880859375, -0.033538818359375, -0.026035308837890625, -0.01853179931640625, -0.011028289794921875, -0.0035247802734375, 0.003978729248046875, 0.01148223876953125, 0.018985748291015625, 0.0264892578125, 0.033992767333984375, 0.04149627685546875, 0.048999786376953125, 0.0565032958984375, 0.06400680541992188, 0.07151031494140625, 0.07901382446289062, 0.086517333984375, 0.09402084350585938, 0.10152435302734375, 0.10902786254882812, 0.1165313720703125, 0.12403488159179688, 0.13153839111328125, 0.13904190063476562, 0.14654541015625, 0.15404891967773438, 0.16155242919921875, 0.16905593872070312, 0.1765594482421875, 0.18406295776367188, 0.19156646728515625, 0.19906997680664062, 0.206573486328125, 0.21407699584960938, 0.22158050537109375, 0.22908401489257812, 0.2365875244140625, 0.24409103393554688, 0.25159454345703125, 0.2590980529785156, 0.2666015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 9.0, 9.0, 10.0, 10.0, 14.0, 15.0, 14.0, 20.0, 22.0, 30.0, 20.0, 41.0, 35.0, 45.0, 32.0, 55.0, 53.0, 45.0, 45.0, 43.0, 41.0, 41.0, 45.0, 37.0, 44.0, 38.0, 34.0, 27.0, 16.0, 17.0, 11.0, 14.0, 9.0, 3.0, 7.0, 10.0, 5.0, 11.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7841796875, -1.7292938232421875, -1.674407958984375, -1.6195220947265625, -1.56463623046875, -1.5097503662109375, -1.454864501953125, -1.3999786376953125, -1.3450927734375, -1.2902069091796875, -1.235321044921875, -1.1804351806640625, -1.12554931640625, -1.0706634521484375, -1.015777587890625, -0.9608917236328125, -0.906005859375, -0.8511199951171875, -0.796234130859375, -0.7413482666015625, -0.68646240234375, -0.6315765380859375, -0.576690673828125, -0.5218048095703125, -0.4669189453125, -0.4120330810546875, -0.357147216796875, -0.3022613525390625, -0.24737548828125, -0.1924896240234375, -0.137603759765625, -0.0827178955078125, -0.02783203125, 0.0270538330078125, 0.081939697265625, 0.1368255615234375, 0.19171142578125, 0.2465972900390625, 0.301483154296875, 0.3563690185546875, 0.4112548828125, 0.4661407470703125, 0.521026611328125, 0.5759124755859375, 0.63079833984375, 0.6856842041015625, 0.740570068359375, 0.7954559326171875, 0.850341796875, 0.9052276611328125, 0.960113525390625, 1.0149993896484375, 1.06988525390625, 1.1247711181640625, 1.179656982421875, 1.2345428466796875, 1.2894287109375, 1.3443145751953125, 1.399200439453125, 1.4540863037109375, 1.50897216796875, 1.5638580322265625, 1.618743896484375, 1.6736297607421875, 1.728515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 7.0, 11.0, 12.0, 20.0, 21.0, 26.0, 42.0, 52.0, 84.0, 114.0, 181.0, 265.0, 438.0, 730.0, 1195.0, 2106.0, 3950.0, 7817.0, 17386.0, 45553.0, 141797.0, 386624.0, 290643.0, 91811.0, 31343.0, 12809.0, 5993.0, 3160.0, 1720.0, 922.0, 623.0, 387.0, 228.0, 155.0, 95.0, 66.0, 50.0, 35.0, 23.0, 19.0, 15.0, 11.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06341552734375, -0.06135749816894531, -0.059299468994140625, -0.05724143981933594, -0.05518341064453125, -0.05312538146972656, -0.051067352294921875, -0.04900932312011719, -0.0469512939453125, -0.04489326477050781, -0.042835235595703125, -0.04077720642089844, -0.03871917724609375, -0.03666114807128906, -0.034603118896484375, -0.03254508972167969, -0.030487060546875, -0.028429031372070312, -0.026371002197265625, -0.024312973022460938, -0.02225494384765625, -0.020196914672851562, -0.018138885498046875, -0.016080856323242188, -0.0140228271484375, -0.011964797973632812, -0.009906768798828125, -0.007848739624023438, -0.00579071044921875, -0.0037326812744140625, -0.001674652099609375, 0.0003833770751953125, 0.00244140625, 0.0044994354248046875, 0.006557464599609375, 0.008615493774414062, 0.01067352294921875, 0.012731552124023438, 0.014789581298828125, 0.016847610473632812, 0.0189056396484375, 0.020963668823242188, 0.023021697998046875, 0.025079727172851562, 0.02713775634765625, 0.029195785522460938, 0.031253814697265625, 0.03331184387207031, 0.035369873046875, 0.03742790222167969, 0.039485931396484375, 0.04154396057128906, 0.04360198974609375, 0.04566001892089844, 0.047718048095703125, 0.04977607727050781, 0.0518341064453125, 0.05389213562011719, 0.055950164794921875, 0.05800819396972656, 0.06006622314453125, 0.06212425231933594, 0.06418228149414062, 0.06624031066894531, 0.06829833984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 17.0, 30.0, 25.0, 33.0, 57.0, 73.0, 81.0, 104.0, 94.0, 108.0, 90.0, 78.0, 53.0, 31.0, 24.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.882978439331055e-05, -5.7256780564785004e-05, -5.568377673625946e-05, -5.411077290773392e-05, -5.2537769079208374e-05, -5.096476525068283e-05, -4.939176142215729e-05, -4.7818757593631744e-05, -4.62457537651062e-05, -4.467274993658066e-05, -4.3099746108055115e-05, -4.152674227952957e-05, -3.995373845100403e-05, -3.8380734622478485e-05, -3.680773079395294e-05, -3.52347269654274e-05, -3.3661723136901855e-05, -3.208871930837631e-05, -3.051571547985077e-05, -2.8942711651325226e-05, -2.7369707822799683e-05, -2.579670399427414e-05, -2.4223700165748596e-05, -2.2650696337223053e-05, -2.107769250869751e-05, -1.9504688680171967e-05, -1.7931684851646423e-05, -1.635868102312088e-05, -1.4785677194595337e-05, -1.3212673366069794e-05, -1.163966953754425e-05, -1.0066665709018707e-05, -8.493661880493164e-06, -6.920658051967621e-06, -5.347654223442078e-06, -3.7746503949165344e-06, -2.201646566390991e-06, -6.28642737865448e-07, 9.443610906600952e-07, 2.5173649191856384e-06, 4.090368747711182e-06, 5.663372576236725e-06, 7.236376404762268e-06, 8.809380233287811e-06, 1.0382384061813354e-05, 1.1955387890338898e-05, 1.3528391718864441e-05, 1.5101395547389984e-05, 1.6674399375915527e-05, 1.824740320444107e-05, 1.9820407032966614e-05, 2.1393410861492157e-05, 2.29664146900177e-05, 2.4539418518543243e-05, 2.6112422347068787e-05, 2.768542617559433e-05, 2.9258430004119873e-05, 3.0831433832645416e-05, 3.240443766117096e-05, 3.39774414896965e-05, 3.5550445318222046e-05, 3.712344914674759e-05, 3.869645297527313e-05, 4.0269456803798676e-05, 4.184246063232422e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 14.0, 17.0, 23.0, 40.0, 39.0, 92.0, 147.0, 211.0, 363.0, 634.0, 1285.0, 2530.0, 5310.0, 12624.0, 34264.0, 115310.0, 353939.0, 350609.0, 113800.0, 34078.0, 12510.0, 5406.0, 2471.0, 1221.0, 715.0, 335.0, 185.0, 122.0, 83.0, 44.0, 34.0, 22.0, 13.0, 16.0, 12.0, 6.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.08294677734375, -0.0807638168334961, -0.07858085632324219, -0.07639789581298828, -0.07421493530273438, -0.07203197479248047, -0.06984901428222656, -0.06766605377197266, -0.06548309326171875, -0.06330013275146484, -0.06111717224121094, -0.05893421173095703, -0.056751251220703125, -0.05456829071044922, -0.05238533020019531, -0.050202369689941406, -0.0480194091796875, -0.045836448669433594, -0.04365348815917969, -0.04147052764892578, -0.039287567138671875, -0.03710460662841797, -0.03492164611816406, -0.032738685607910156, -0.03055572509765625, -0.028372764587402344, -0.026189804077148438, -0.02400684356689453, -0.021823883056640625, -0.01964092254638672, -0.017457962036132812, -0.015275001525878906, -0.013092041015625, -0.010909080505371094, -0.008726119995117188, -0.006543159484863281, -0.004360198974609375, -0.0021772384643554688, 5.7220458984375e-06, 0.0021886825561523438, 0.00437164306640625, 0.006554603576660156, 0.008737564086914062, 0.010920524597167969, 0.013103485107421875, 0.015286445617675781, 0.017469406127929688, 0.019652366638183594, 0.0218353271484375, 0.024018287658691406, 0.026201248168945312, 0.02838420867919922, 0.030567169189453125, 0.03275012969970703, 0.03493309020996094, 0.037116050720214844, 0.03929901123046875, 0.041481971740722656, 0.04366493225097656, 0.04584789276123047, 0.048030853271484375, 0.05021381378173828, 0.05239677429199219, 0.054579734802246094, 0.0567626953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 6.0, 8.0, 11.0, 10.0, 10.0, 20.0, 21.0, 26.0, 30.0, 43.0, 35.0, 62.0, 53.0, 75.0, 56.0, 58.0, 63.0, 49.0, 58.0, 50.0, 48.0, 31.0, 32.0, 21.0, 25.0, 21.0, 9.0, 14.0, 7.0, 5.0, 6.0, 7.0, 5.0, 1.0, 3.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0168914794921875, -0.016341686248779297, -0.015791893005371094, -0.01524209976196289, -0.014692306518554688, -0.014142513275146484, -0.013592720031738281, -0.013042926788330078, -0.012493133544921875, -0.011943340301513672, -0.011393547058105469, -0.010843753814697266, -0.010293960571289062, -0.00974416732788086, -0.009194374084472656, -0.008644580841064453, -0.00809478759765625, -0.007544994354248047, -0.006995201110839844, -0.006445407867431641, -0.0058956146240234375, -0.005345821380615234, -0.004796028137207031, -0.004246234893798828, -0.003696441650390625, -0.003146648406982422, -0.0025968551635742188, -0.0020470619201660156, -0.0014972686767578125, -0.0009474754333496094, -0.00039768218994140625, 0.00015211105346679688, 0.000701904296875, 0.0012516975402832031, 0.0018014907836914062, 0.0023512840270996094, 0.0029010772705078125, 0.0034508705139160156, 0.004000663757324219, 0.004550457000732422, 0.005100250244140625, 0.005650043487548828, 0.006199836730957031, 0.006749629974365234, 0.0072994232177734375, 0.00784921646118164, 0.008399009704589844, 0.008948802947998047, 0.00949859619140625, 0.010048389434814453, 0.010598182678222656, 0.01114797592163086, 0.011697769165039062, 0.012247562408447266, 0.012797355651855469, 0.013347148895263672, 0.013896942138671875, 0.014446735382080078, 0.014996528625488281, 0.015546321868896484, 0.016096115112304688, 0.01664590835571289, 0.017195701599121094, 0.017745494842529297, 0.0182952880859375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 16.0, 21.0, 33.0, 78.0, 162.0, 287.0, 222.0, 107.0, 45.0, 24.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4738221168518066, -1.3661812543869019, -1.258540391921997, -1.1508996486663818, -1.043258786201477, -0.9356179237365723, -0.8279771208763123, -0.7203363180160522, -0.6126954555511475, -0.5050545930862427, -0.39741379022598267, -0.28977295756340027, -0.18213212490081787, -0.07449126243591309, 0.033149540424346924, 0.14079034328460693, 0.24843120574951172, 0.3560720384120941, 0.4637128710746765, 0.5713536739349365, 0.6789945363998413, 0.7866353988647461, 0.8942762017250061, 1.0019170045852661, 1.109557867050171, 1.2171987295150757, 1.3248395919799805, 1.4324803352355957, 1.5401211977005005, 1.6477620601654053, 1.7554028034210205, 1.8630436658859253, 1.97068452835083, 2.0783252716064453, 2.1859662532806396, 2.293606996536255, 2.401247978210449, 2.5088887214660645, 2.6165294647216797, 2.724170207977295, 2.8318111896514893, 2.9394519329071045, 3.047092914581299, 3.154733657836914, 3.2623744010925293, 3.3700153827667236, 3.477656126022339, 3.585297107696533, 3.6929378509521484, 3.8005785942077637, 3.908219575881958, 4.015860557556152, 4.123501300811768, 4.231142044067383, 4.338782787322998, 4.446423530578613, 4.554064750671387, 4.661705493927002, 4.769346237182617, 4.876987457275391, 4.984628200531006, 5.092268943786621, 5.199909687042236, 5.307550430297852, 5.415191173553467]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 7.0, 3.0, 11.0, 13.0, 10.0, 25.0, 17.0, 26.0, 18.0, 39.0, 37.0, 42.0, 66.0, 63.0, 58.0, 67.0, 69.0, 59.0, 62.0, 47.0, 45.0, 43.0, 38.0, 35.0, 21.0, 21.0, 16.0, 9.0, 8.0, 9.0, 5.0, 2.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8897004723548889, -0.8552725315093994, -0.8208446502685547, -0.7864167094230652, -0.7519888281822205, -0.717560887336731, -0.6831330060958862, -0.6487050652503967, -0.6142771244049072, -0.5798491835594177, -0.545421302318573, -0.5109933614730835, -0.47656548023223877, -0.44213753938674927, -0.40770962834358215, -0.37328171730041504, -0.3388538360595703, -0.3044259250164032, -0.2699980139732361, -0.23557008802890778, -0.20114217698574066, -0.16671426594257355, -0.13228633999824524, -0.09785842895507812, -0.06343051791191101, -0.029002603143453598, 0.005425311625003815, 0.039853230118751526, 0.07428114116191864, 0.10870905220508575, 0.14313697814941406, 0.17756488919258118, 0.21199274063110352, 0.24642065167427063, 0.28084856271743774, 0.31527650356292725, 0.349704384803772, 0.3841323256492615, 0.4185602366924286, 0.4529881477355957, 0.4874160587787628, 0.5218439698219299, 0.5562719106674194, 0.5906997919082642, 0.6251277327537537, 0.6595556139945984, 0.6939835548400879, 0.7284114360809326, 0.7628393769264221, 0.7972673177719116, 0.8316951990127563, 0.8661231398582458, 0.9005510210990906, 0.9349789619445801, 0.9694068431854248, 1.0038347244262695, 1.0382627248764038, 1.0726906061172485, 1.1071186065673828, 1.1415464878082275, 1.1759743690490723, 1.210402250289917, 1.2448302507400513, 1.279258131980896, 1.3136860132217407]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 6.0, 9.0, 13.0, 37.0, 51.0, 140.0, 364.0, 1147.0, 6624.0, 712731.0, 320721.0, 5155.0, 960.0, 313.0, 142.0, 63.0, 30.0, 17.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.98828125, -5.84881591796875, -5.7093505859375, -5.56988525390625, -5.430419921875, -5.29095458984375, -5.1514892578125, -5.01202392578125, -4.87255859375, -4.73309326171875, -4.5936279296875, -4.45416259765625, -4.314697265625, -4.17523193359375, -4.0357666015625, -3.89630126953125, -3.7568359375, -3.61737060546875, -3.4779052734375, -3.33843994140625, -3.198974609375, -3.05950927734375, -2.9200439453125, -2.78057861328125, -2.64111328125, -2.50164794921875, -2.3621826171875, -2.22271728515625, -2.083251953125, -1.94378662109375, -1.8043212890625, -1.66485595703125, -1.525390625, -1.38592529296875, -1.2464599609375, -1.10699462890625, -0.967529296875, -0.82806396484375, -0.6885986328125, -0.54913330078125, -0.40966796875, -0.27020263671875, -0.1307373046875, 0.00872802734375, 0.148193359375, 0.28765869140625, 0.4271240234375, 0.56658935546875, 0.7060546875, 0.84552001953125, 0.9849853515625, 1.12445068359375, 1.263916015625, 1.40338134765625, 1.5428466796875, 1.68231201171875, 1.82177734375, 1.96124267578125, 2.1007080078125, 2.24017333984375, 2.379638671875, 2.51910400390625, 2.6585693359375, 2.79803466796875, 2.9375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 13.0, 20.0, 30.0, 39.0, 65.0, 86.0, 114.0, 115.0, 124.0, 123.0, 95.0, 57.0, 39.0, 26.0, 23.0, 18.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.748046875, -1.623748779296875, -1.49945068359375, -1.375152587890625, -1.2508544921875, -1.126556396484375, -1.00225830078125, -0.877960205078125, -0.753662109375, -0.629364013671875, -0.50506591796875, -0.380767822265625, -0.2564697265625, -0.132171630859375, -0.00787353515625, 0.116424560546875, 0.24072265625, 0.365020751953125, 0.48931884765625, 0.613616943359375, 0.7379150390625, 0.862213134765625, 0.98651123046875, 1.110809326171875, 1.235107421875, 1.359405517578125, 1.48370361328125, 1.608001708984375, 1.7322998046875, 1.856597900390625, 1.98089599609375, 2.105194091796875, 2.2294921875, 2.353790283203125, 2.47808837890625, 2.602386474609375, 2.7266845703125, 2.850982666015625, 2.97528076171875, 3.099578857421875, 3.223876953125, 3.348175048828125, 3.47247314453125, 3.596771240234375, 3.7210693359375, 3.845367431640625, 3.96966552734375, 4.093963623046875, 4.21826171875, 4.342559814453125, 4.46685791015625, 4.591156005859375, 4.7154541015625, 4.839752197265625, 4.96405029296875, 5.088348388671875, 5.212646484375, 5.336944580078125, 5.46124267578125, 5.585540771484375, 5.7098388671875, 5.834136962890625, 5.95843505859375, 6.082733154296875, 6.20703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 14.0, 28.0, 56.0, 144.0, 337.0, 1191.0, 7145.0, 994972.0, 41430.0, 2263.0, 557.0, 207.0, 97.0, 38.0, 27.0, 8.0, 11.0, 5.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.33843994140625, -5.1846923828125, -5.03094482421875, -4.877197265625, -4.72344970703125, -4.5697021484375, -4.41595458984375, -4.26220703125, -4.10845947265625, -3.9547119140625, -3.80096435546875, -3.647216796875, -3.49346923828125, -3.3397216796875, -3.18597412109375, -3.0322265625, -2.87847900390625, -2.7247314453125, -2.57098388671875, -2.417236328125, -2.26348876953125, -2.1097412109375, -1.95599365234375, -1.80224609375, -1.64849853515625, -1.4947509765625, -1.34100341796875, -1.187255859375, -1.03350830078125, -0.8797607421875, -0.72601318359375, -0.572265625, -0.41851806640625, -0.2647705078125, -0.11102294921875, 0.042724609375, 0.19647216796875, 0.3502197265625, 0.50396728515625, 0.65771484375, 0.81146240234375, 0.9652099609375, 1.11895751953125, 1.272705078125, 1.42645263671875, 1.5802001953125, 1.73394775390625, 1.8876953125, 2.04144287109375, 2.1951904296875, 2.34893798828125, 2.502685546875, 2.65643310546875, 2.8101806640625, 2.96392822265625, 3.11767578125, 3.27142333984375, 3.4251708984375, 3.57891845703125, 3.732666015625, 3.88641357421875, 4.0401611328125, 4.19390869140625, 4.34765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 3.0, 12.0, 9.0, 18.0, 17.0, 17.0, 18.0, 25.0, 36.0, 33.0, 26.0, 43.0, 45.0, 54.0, 58.0, 50.0, 49.0, 61.0, 47.0, 46.0, 33.0, 39.0, 35.0, 22.0, 30.0, 26.0, 22.0, 27.0, 12.0, 23.0, 12.0, 19.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.93939208984375, -1.8787841796875, -1.81817626953125, -1.757568359375, -1.69696044921875, -1.6363525390625, -1.57574462890625, -1.51513671875, -1.45452880859375, -1.3939208984375, -1.33331298828125, -1.272705078125, -1.21209716796875, -1.1514892578125, -1.09088134765625, -1.0302734375, -0.96966552734375, -0.9090576171875, -0.84844970703125, -0.787841796875, -0.72723388671875, -0.6666259765625, -0.60601806640625, -0.54541015625, -0.48480224609375, -0.4241943359375, -0.36358642578125, -0.302978515625, -0.24237060546875, -0.1817626953125, -0.12115478515625, -0.060546875, 6.103515625e-05, 0.0606689453125, 0.12127685546875, 0.181884765625, 0.24249267578125, 0.3031005859375, 0.36370849609375, 0.42431640625, 0.48492431640625, 0.5455322265625, 0.60614013671875, 0.666748046875, 0.72735595703125, 0.7879638671875, 0.84857177734375, 0.9091796875, 0.96978759765625, 1.0303955078125, 1.09100341796875, 1.151611328125, 1.21221923828125, 1.2728271484375, 1.33343505859375, 1.39404296875, 1.45465087890625, 1.5152587890625, 1.57586669921875, 1.636474609375, 1.69708251953125, 1.7576904296875, 1.81829833984375, 1.87890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 9.0, 11.0, 17.0, 20.0, 48.0, 91.0, 216.0, 848.0, 9849.0, 984756.0, 50500.0, 1647.0, 312.0, 134.0, 44.0, 20.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90966796875, -0.8609695434570312, -0.8122711181640625, -0.7635726928710938, -0.714874267578125, -0.6661758422851562, -0.6174774169921875, -0.5687789916992188, -0.52008056640625, -0.47138214111328125, -0.4226837158203125, -0.37398529052734375, -0.325286865234375, -0.27658843994140625, -0.2278900146484375, -0.17919158935546875, -0.1304931640625, -0.08179473876953125, -0.0330963134765625, 0.01560211181640625, 0.064300537109375, 0.11299896240234375, 0.1616973876953125, 0.21039581298828125, 0.25909423828125, 0.30779266357421875, 0.3564910888671875, 0.40518951416015625, 0.453887939453125, 0.5025863647460938, 0.5512847900390625, 0.5999832153320312, 0.648681640625, 0.6973800659179688, 0.7460784912109375, 0.7947769165039062, 0.843475341796875, 0.8921737670898438, 0.9408721923828125, 0.9895706176757812, 1.03826904296875, 1.0869674682617188, 1.1356658935546875, 1.1843643188476562, 1.233062744140625, 1.2817611694335938, 1.3304595947265625, 1.3791580200195312, 1.4278564453125, 1.4765548706054688, 1.5252532958984375, 1.5739517211914062, 1.622650146484375, 1.6713485717773438, 1.7200469970703125, 1.7687454223632812, 1.81744384765625, 1.8661422729492188, 1.9148406982421875, 1.9635391235351562, 2.012237548828125, 2.0609359741210938, 2.1096343994140625, 2.1583328247070312, 2.20703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 8.0, 10.0, 15.0, 23.0, 37.0, 51.0, 77.0, 110.0, 131.0, 147.0, 121.0, 90.0, 65.0, 35.0, 26.0, 15.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.872415542602539e-05, -6.586965173482895e-05, -6.301514804363251e-05, -6.0160644352436066e-05, -5.7306140661239624e-05, -5.445163697004318e-05, -5.159713327884674e-05, -4.87426295876503e-05, -4.588812589645386e-05, -4.3033622205257416e-05, -4.0179118514060974e-05, -3.732461482286453e-05, -3.447011113166809e-05, -3.161560744047165e-05, -2.8761103749275208e-05, -2.5906600058078766e-05, -2.3052096366882324e-05, -2.0197592675685883e-05, -1.734308898448944e-05, -1.4488585293293e-05, -1.1634081602096558e-05, -8.779577910900116e-06, -5.925074219703674e-06, -3.0705705285072327e-06, -2.1606683731079102e-07, 2.6384368538856506e-06, 5.492940545082092e-06, 8.347444236278534e-06, 1.1201947927474976e-05, 1.4056451618671417e-05, 1.691095530986786e-05, 1.97654590010643e-05, 2.2619962692260742e-05, 2.5474466383457184e-05, 2.8328970074653625e-05, 3.118347376585007e-05, 3.403797745704651e-05, 3.689248114824295e-05, 3.974698483943939e-05, 4.2601488530635834e-05, 4.5455992221832275e-05, 4.831049591302872e-05, 5.116499960422516e-05, 5.40195032954216e-05, 5.687400698661804e-05, 5.9728510677814484e-05, 6.258301436901093e-05, 6.543751806020737e-05, 6.829202175140381e-05, 7.114652544260025e-05, 7.400102913379669e-05, 7.685553282499313e-05, 7.971003651618958e-05, 8.256454020738602e-05, 8.541904389858246e-05, 8.82735475897789e-05, 9.112805128097534e-05, 9.398255497217178e-05, 9.683705866336823e-05, 9.969156235456467e-05, 0.00010254606604576111, 0.00010540056973695755, 0.00010825507342815399, 0.00011110957711935043, 0.00011396408081054688]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 9.0, 18.0, 15.0, 26.0, 91.0, 253.0, 925.0, 9201.0, 983904.0, 51539.0, 1944.0, 391.0, 131.0, 58.0, 24.0, 12.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.69268798828125, -1.6392822265625, -1.58587646484375, -1.532470703125, -1.47906494140625, -1.4256591796875, -1.37225341796875, -1.31884765625, -1.26544189453125, -1.2120361328125, -1.15863037109375, -1.105224609375, -1.05181884765625, -0.9984130859375, -0.94500732421875, -0.8916015625, -0.83819580078125, -0.7847900390625, -0.73138427734375, -0.677978515625, -0.62457275390625, -0.5711669921875, -0.51776123046875, -0.46435546875, -0.41094970703125, -0.3575439453125, -0.30413818359375, -0.250732421875, -0.19732666015625, -0.1439208984375, -0.09051513671875, -0.037109375, 0.01629638671875, 0.0697021484375, 0.12310791015625, 0.176513671875, 0.22991943359375, 0.2833251953125, 0.33673095703125, 0.39013671875, 0.44354248046875, 0.4969482421875, 0.55035400390625, 0.603759765625, 0.65716552734375, 0.7105712890625, 0.76397705078125, 0.8173828125, 0.87078857421875, 0.9241943359375, 0.97760009765625, 1.031005859375, 1.08441162109375, 1.1378173828125, 1.19122314453125, 1.24462890625, 1.29803466796875, 1.3514404296875, 1.40484619140625, 1.458251953125, 1.51165771484375, 1.5650634765625, 1.61846923828125, 1.671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 10.0, 6.0, 22.0, 47.0, 89.0, 203.0, 254.0, 193.0, 94.0, 40.0, 18.0, 14.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430908203125, -0.41674041748046875, -0.4025726318359375, -0.38840484619140625, -0.374237060546875, -0.36006927490234375, -0.3459014892578125, -0.33173370361328125, -0.31756591796875, -0.30339813232421875, -0.2892303466796875, -0.27506256103515625, -0.260894775390625, -0.24672698974609375, -0.2325592041015625, -0.21839141845703125, -0.2042236328125, -0.19005584716796875, -0.1758880615234375, -0.16172027587890625, -0.147552490234375, -0.13338470458984375, -0.1192169189453125, -0.10504913330078125, -0.09088134765625, -0.07671356201171875, -0.0625457763671875, -0.04837799072265625, -0.034210205078125, -0.02004241943359375, -0.0058746337890625, 0.00829315185546875, 0.0224609375, 0.03662872314453125, 0.0507965087890625, 0.06496429443359375, 0.079132080078125, 0.09329986572265625, 0.1074676513671875, 0.12163543701171875, 0.13580322265625, 0.14997100830078125, 0.1641387939453125, 0.17830657958984375, 0.192474365234375, 0.20664215087890625, 0.2208099365234375, 0.23497772216796875, 0.2491455078125, 0.26331329345703125, 0.2774810791015625, 0.29164886474609375, 0.305816650390625, 0.31998443603515625, 0.3341522216796875, 0.34832000732421875, 0.36248779296875, 0.37665557861328125, 0.3908233642578125, 0.40499114990234375, 0.419158935546875, 0.43332672119140625, 0.4474945068359375, 0.46166229248046875, 0.475830078125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 9.0, 6.0, 12.0, 16.0, 12.0, 16.0, 21.0, 37.0, 55.0, 45.0, 84.0, 106.0, 94.0, 132.0, 84.0, 69.0, 53.0, 45.0, 25.0, 24.0, 10.0, 11.0, 6.0, 10.0, 8.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.9204657077789307, -2.8390283584594727, -2.7575907707214355, -2.6761534214019775, -2.5947160720825195, -2.5132784843444824, -2.4318411350250244, -2.3504037857055664, -2.2689661979675293, -2.1875288486480713, -2.106091260910034, -2.024653911590576, -1.9432165622711182, -1.8617790937423706, -1.780341625213623, -1.698904275894165, -1.617466926574707, -1.5360294580459595, -1.4545921087265015, -1.373154640197754, -1.291717290878296, -1.2102798223495483, -1.1288423538208008, -1.0474050045013428, -0.9659675359725952, -0.8845301270484924, -0.8030927181243896, -0.7216552495956421, -0.6402178406715393, -0.5587804317474365, -0.47734299302101135, -0.3959055542945862, -0.3144681453704834, -0.23303072154521942, -0.15159329771995544, -0.07015587389469147, 0.01128154993057251, 0.09271895885467529, 0.17415639758110046, 0.25559383630752563, 0.3370312452316284, 0.4184686541557312, 0.49990609288215637, 0.5813435316085815, 0.6627809405326843, 0.7442183494567871, 0.8256558179855347, 0.9070932269096375, 0.9885306358337402, 1.0699681043624878, 1.1514054536819458, 1.2328429222106934, 1.3142802715301514, 1.395717740058899, 1.4771552085876465, 1.5585925579071045, 1.640030026435852, 1.7214674949645996, 1.8029048442840576, 1.8843423128128052, 1.9657797813415527, 2.0472171306610107, 2.1286544799804688, 2.210092067718506, 2.291529417037964]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 6.0, 9.0, 18.0, 25.0, 18.0, 30.0, 29.0, 46.0, 35.0, 45.0, 68.0, 59.0, 73.0, 57.0, 65.0, 76.0, 59.0, 46.0, 37.0, 48.0, 37.0, 30.0, 29.0, 16.0, 14.0, 13.0, 7.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8982648849487305, -2.756880521774292, -2.6154961585998535, -2.474111795425415, -2.3327274322509766, -2.191343307495117, -2.0499589443206787, -1.9085745811462402, -1.7671902179718018, -1.6258058547973633, -1.4844214916229248, -1.3430372476577759, -1.2016528844833374, -1.060268521308899, -0.9188842177391052, -0.7774999141693115, -0.636115550994873, -0.49473121762275696, -0.35334688425064087, -0.21196255087852478, -0.07057821750640869, 0.07080614566802979, 0.2121904492378235, 0.3535747528076172, 0.49495911598205566, 0.6363434791564941, 0.7777277827262878, 0.9191120862960815, 1.06049644947052, 1.2018808126449585, 1.3432650566101074, 1.484649419784546, 1.6260337829589844, 1.7674181461334229, 1.9088025093078613, 2.0501868724823, 2.1915712356567383, 2.3329553604125977, 2.474339723587036, 2.6157240867614746, 2.757108449935913, 2.8984928131103516, 3.03987717628479, 3.1812615394592285, 3.322645664215088, 3.4640302658081055, 3.605414390563965, 3.7467987537384033, 3.888183116912842, 4.029567241668701, 4.170951843261719, 4.312335968017578, 4.453720569610596, 4.595104694366455, 4.736489295959473, 4.877873420715332, 5.019257545471191, 5.160641670227051, 5.302026271820068, 5.443410396575928, 5.584794998168945, 5.726179122924805, 5.867563724517822, 6.008947849273682, 6.150332450866699]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 6.0, 11.0, 11.0, 14.0, 21.0, 30.0, 39.0, 64.0, 75.0, 129.0, 201.0, 327.0, 610.0, 1390.0, 3614.0, 17932.0, 284192.0, 3446205.0, 405749.0, 24892.0, 4715.0, 2051.0, 919.0, 448.0, 229.0, 131.0, 81.0, 56.0, 37.0, 26.0, 20.0, 11.0, 9.0, 9.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.310546875, -2.2296142578125, -2.148681640625, -2.0677490234375, -1.98681640625, -1.9058837890625, -1.824951171875, -1.7440185546875, -1.6630859375, -1.5821533203125, -1.501220703125, -1.4202880859375, -1.33935546875, -1.2584228515625, -1.177490234375, -1.0965576171875, -1.015625, -0.9346923828125, -0.853759765625, -0.7728271484375, -0.69189453125, -0.6109619140625, -0.530029296875, -0.4490966796875, -0.3681640625, -0.2872314453125, -0.206298828125, -0.1253662109375, -0.04443359375, 0.0364990234375, 0.117431640625, 0.1983642578125, 0.279296875, 0.3602294921875, 0.441162109375, 0.5220947265625, 0.60302734375, 0.6839599609375, 0.764892578125, 0.8458251953125, 0.9267578125, 1.0076904296875, 1.088623046875, 1.1695556640625, 1.25048828125, 1.3314208984375, 1.412353515625, 1.4932861328125, 1.57421875, 1.6551513671875, 1.736083984375, 1.8170166015625, 1.89794921875, 1.9788818359375, 2.059814453125, 2.1407470703125, 2.2216796875, 2.3026123046875, 2.383544921875, 2.4644775390625, 2.54541015625, 2.6263427734375, 2.707275390625, 2.7882080078125, 2.869140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 24.0, 27.0, 32.0, 51.0, 52.0, 70.0, 105.0, 95.0, 81.0, 89.0, 74.0, 73.0, 73.0, 43.0, 24.0, 21.0, 12.0, 17.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0], "bins": [-3.060546875, -2.997100830078125, -2.93365478515625, -2.870208740234375, -2.8067626953125, -2.743316650390625, -2.67987060546875, -2.616424560546875, -2.552978515625, -2.489532470703125, -2.42608642578125, -2.362640380859375, -2.2991943359375, -2.235748291015625, -2.17230224609375, -2.108856201171875, -2.04541015625, -1.981964111328125, -1.91851806640625, -1.855072021484375, -1.7916259765625, -1.728179931640625, -1.66473388671875, -1.601287841796875, -1.537841796875, -1.474395751953125, -1.41094970703125, -1.347503662109375, -1.2840576171875, -1.220611572265625, -1.15716552734375, -1.093719482421875, -1.0302734375, -0.966827392578125, -0.90338134765625, -0.839935302734375, -0.7764892578125, -0.713043212890625, -0.64959716796875, -0.586151123046875, -0.522705078125, -0.459259033203125, -0.39581298828125, -0.332366943359375, -0.2689208984375, -0.205474853515625, -0.14202880859375, -0.078582763671875, -0.01513671875, 0.048309326171875, 0.11175537109375, 0.175201416015625, 0.2386474609375, 0.302093505859375, 0.36553955078125, 0.428985595703125, 0.492431640625, 0.555877685546875, 0.61932373046875, 0.682769775390625, 0.7462158203125, 0.809661865234375, 0.87310791015625, 0.936553955078125, 1.0]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 10.0, 9.0, 17.0, 14.0, 37.0, 57.0, 84.0, 128.0, 184.0, 327.0, 519.0, 1027.0, 1998.0, 4324.0, 11990.0, 47906.0, 482787.0, 3345498.0, 247675.0, 33016.0, 9348.0, 3577.0, 1669.0, 854.0, 454.0, 256.0, 203.0, 95.0, 63.0, 46.0, 34.0, 20.0, 19.0, 8.0, 6.0, 2.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5546875, -1.506683349609375, -1.45867919921875, -1.410675048828125, -1.3626708984375, -1.314666748046875, -1.26666259765625, -1.218658447265625, -1.170654296875, -1.122650146484375, -1.07464599609375, -1.026641845703125, -0.9786376953125, -0.930633544921875, -0.88262939453125, -0.834625244140625, -0.78662109375, -0.738616943359375, -0.69061279296875, -0.642608642578125, -0.5946044921875, -0.546600341796875, -0.49859619140625, -0.450592041015625, -0.402587890625, -0.354583740234375, -0.30657958984375, -0.258575439453125, -0.2105712890625, -0.162567138671875, -0.11456298828125, -0.066558837890625, -0.0185546875, 0.029449462890625, 0.07745361328125, 0.125457763671875, 0.1734619140625, 0.221466064453125, 0.26947021484375, 0.317474365234375, 0.365478515625, 0.413482666015625, 0.46148681640625, 0.509490966796875, 0.5574951171875, 0.605499267578125, 0.65350341796875, 0.701507568359375, 0.74951171875, 0.797515869140625, 0.84552001953125, 0.893524169921875, 0.9415283203125, 0.989532470703125, 1.03753662109375, 1.085540771484375, 1.133544921875, 1.181549072265625, 1.22955322265625, 1.277557373046875, 1.3255615234375, 1.373565673828125, 1.42156982421875, 1.469573974609375, 1.517578125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 16.0, 15.0, 25.0, 24.0, 51.0, 72.0, 133.0, 220.0, 385.0, 574.0, 749.0, 638.0, 405.0, 257.0, 169.0, 105.0, 60.0, 42.0, 25.0, 23.0, 13.0, 8.0, 8.0, 2.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.464599609375, -0.4489860534667969, -0.43337249755859375, -0.4177589416503906, -0.4021453857421875, -0.3865318298339844, -0.37091827392578125, -0.3553047180175781, -0.339691162109375, -0.3240776062011719, -0.30846405029296875, -0.2928504943847656, -0.2772369384765625, -0.2616233825683594, -0.24600982666015625, -0.23039627075195312, -0.21478271484375, -0.19916915893554688, -0.18355560302734375, -0.16794204711914062, -0.1523284912109375, -0.13671493530273438, -0.12110137939453125, -0.10548782348632812, -0.089874267578125, -0.07426071166992188, -0.05864715576171875, -0.043033599853515625, -0.0274200439453125, -0.011806488037109375, 0.00380706787109375, 0.019420623779296875, 0.0350341796875, 0.050647735595703125, 0.06626129150390625, 0.08187484741210938, 0.0974884033203125, 0.11310195922851562, 0.12871551513671875, 0.14432907104492188, 0.159942626953125, 0.17555618286132812, 0.19116973876953125, 0.20678329467773438, 0.2223968505859375, 0.23801040649414062, 0.25362396240234375, 0.2692375183105469, 0.28485107421875, 0.3004646301269531, 0.31607818603515625, 0.3316917419433594, 0.3473052978515625, 0.3629188537597656, 0.37853240966796875, 0.3941459655761719, 0.409759521484375, 0.4253730773925781, 0.44098663330078125, 0.4566001892089844, 0.4722137451171875, 0.4878273010253906, 0.5034408569335938, 0.5190544128417969, 0.53466796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 11.0, 9.0, 12.0, 16.0, 34.0, 37.0, 44.0, 57.0, 82.0, 95.0, 123.0, 103.0, 107.0, 67.0, 61.0, 31.0, 27.0, 22.0, 16.0, 9.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9541956186294556, -1.8948231935501099, -1.8354507684707642, -1.7760783433914185, -1.7167059183120728, -1.657333493232727, -1.597961187362671, -1.5385887622833252, -1.4792163372039795, -1.4198439121246338, -1.360471487045288, -1.3010990619659424, -1.2417266368865967, -1.182354211807251, -1.1229817867279053, -1.0636093616485596, -1.0042369365692139, -0.9448645114898682, -0.8854920864105225, -0.8261196613311768, -0.766747236251831, -0.7073748111724854, -0.6480024456977844, -0.5886300206184387, -0.529257595539093, -0.4698851704597473, -0.4105127453804016, -0.3511403501033783, -0.2917679250240326, -0.2323954999446869, -0.17302310466766357, -0.11365067958831787, -0.05427825450897217, 0.005094163119792938, 0.06446658074855804, 0.12383899092674255, 0.18321141600608826, 0.24258384108543396, 0.3019562363624573, 0.361328661441803, 0.4207010865211487, 0.4800735116004944, 0.5394459366798401, 0.598818302154541, 0.6581907272338867, 0.7175631523132324, 0.7769355773925781, 0.8363080024719238, 0.8956804275512695, 0.9550528526306152, 1.014425277709961, 1.0737977027893066, 1.1331701278686523, 1.192542552947998, 1.2519149780273438, 1.3112874031066895, 1.3706598281860352, 1.4300322532653809, 1.4894046783447266, 1.5487771034240723, 1.608149528503418, 1.6675219535827637, 1.7268943786621094, 1.786266803741455, 1.8456391096115112]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 5.0, 7.0, 7.0, 13.0, 20.0, 17.0, 18.0, 17.0, 30.0, 31.0, 29.0, 28.0, 42.0, 51.0, 57.0, 49.0, 59.0, 71.0, 52.0, 57.0, 46.0, 39.0, 31.0, 41.0, 29.0, 28.0, 21.0, 14.0, 18.0, 18.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1175644397735596, -1.0779024362564087, -1.0382405519485474, -0.9985785484313965, -0.9589165449142456, -0.9192546010017395, -0.8795926570892334, -0.8399306535720825, -0.8002687096595764, -0.7606067657470703, -0.7209447622299194, -0.6812828183174133, -0.6416208744049072, -0.6019588708877563, -0.5622969269752502, -0.5226349830627441, -0.48297297954559326, -0.44331100583076477, -0.4036490321159363, -0.3639870882034302, -0.3243251144886017, -0.2846631407737732, -0.2450011819601059, -0.2053392231464386, -0.1656772494316101, -0.12601527571678162, -0.08635331690311432, -0.046691350638866425, -0.00702938437461853, 0.03263258934020996, 0.07229454815387726, 0.11195650696754456, 0.1516183614730835, 0.191280335187912, 0.23094229400157928, 0.2706042528152466, 0.3102662265300751, 0.34992820024490356, 0.38959014415740967, 0.42925211787223816, 0.46891409158706665, 0.5085760354995728, 0.5482380390167236, 0.5878999829292297, 0.6275619268417358, 0.6672239303588867, 0.7068858742713928, 0.7465478181838989, 0.7862098217010498, 0.8258717656135559, 0.8655337691307068, 0.9051957130432129, 0.9448577165603638, 0.9845196604728699, 1.024181604385376, 1.0638436079025269, 1.1035056114196777, 1.1431676149368286, 1.18282949924469, 1.2224915027618408, 1.2621535062789917, 1.3018155097961426, 1.341477394104004, 1.3811393976211548, 1.4208012819290161]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 5.0, 7.0, 3.0, 9.0, 7.0, 15.0, 18.0, 15.0, 16.0, 29.0, 25.0, 43.0, 51.0, 77.0, 122.0, 361.0, 894.0, 2629.0, 9265.0, 45213.0, 329901.0, 550525.0, 87733.0, 15344.0, 3846.0, 1378.0, 446.0, 196.0, 99.0, 62.0, 57.0, 28.0, 25.0, 20.0, 18.0, 13.0, 9.0, 8.0, 7.0, 12.0, 8.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.316650390625, -0.3068084716796875, -0.296966552734375, -0.2871246337890625, -0.27728271484375, -0.2674407958984375, -0.257598876953125, -0.2477569580078125, -0.2379150390625, -0.2280731201171875, -0.218231201171875, -0.2083892822265625, -0.19854736328125, -0.1887054443359375, -0.178863525390625, -0.1690216064453125, -0.1591796875, -0.1493377685546875, -0.139495849609375, -0.1296539306640625, -0.11981201171875, -0.1099700927734375, -0.100128173828125, -0.0902862548828125, -0.0804443359375, -0.0706024169921875, -0.060760498046875, -0.0509185791015625, -0.04107666015625, -0.0312347412109375, -0.021392822265625, -0.0115509033203125, -0.001708984375, 0.0081329345703125, 0.017974853515625, 0.0278167724609375, 0.03765869140625, 0.0475006103515625, 0.057342529296875, 0.0671844482421875, 0.0770263671875, 0.0868682861328125, 0.096710205078125, 0.1065521240234375, 0.11639404296875, 0.1262359619140625, 0.136077880859375, 0.1459197998046875, 0.15576171875, 0.1656036376953125, 0.175445556640625, 0.1852874755859375, 0.19512939453125, 0.2049713134765625, 0.214813232421875, 0.2246551513671875, 0.2344970703125, 0.2443389892578125, 0.254180908203125, 0.2640228271484375, 0.27386474609375, 0.2837066650390625, 0.293548583984375, 0.3033905029296875, 0.313232421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 5.0, 21.0, 30.0, 49.0, 58.0, 97.0, 126.0, 160.0, 156.0, 103.0, 63.0, 52.0, 35.0, 17.0, 7.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.154296875, -3.08795166015625, -3.0216064453125, -2.95526123046875, -2.888916015625, -2.82257080078125, -2.7562255859375, -2.68988037109375, -2.62353515625, -2.55718994140625, -2.4908447265625, -2.42449951171875, -2.358154296875, -2.29180908203125, -2.2254638671875, -2.15911865234375, -2.0927734375, -2.02642822265625, -1.9600830078125, -1.89373779296875, -1.827392578125, -1.76104736328125, -1.6947021484375, -1.62835693359375, -1.56201171875, -1.49566650390625, -1.4293212890625, -1.36297607421875, -1.296630859375, -1.23028564453125, -1.1639404296875, -1.09759521484375, -1.03125, -0.96490478515625, -0.8985595703125, -0.83221435546875, -0.765869140625, -0.69952392578125, -0.6331787109375, -0.56683349609375, -0.50048828125, -0.43414306640625, -0.3677978515625, -0.30145263671875, -0.235107421875, -0.16876220703125, -0.1024169921875, -0.03607177734375, 0.0302734375, 0.09661865234375, 0.1629638671875, 0.22930908203125, 0.295654296875, 0.36199951171875, 0.4283447265625, 0.49468994140625, 0.56103515625, 0.62738037109375, 0.6937255859375, 0.76007080078125, 0.826416015625, 0.89276123046875, 0.9591064453125, 1.02545166015625, 1.091796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 13.0, 16.0, 20.0, 29.0, 29.0, 66.0, 91.0, 130.0, 231.0, 316.0, 566.0, 964.0, 1922.0, 3874.0, 9119.0, 24534.0, 72144.0, 231511.0, 419048.0, 188609.0, 59000.0, 20840.0, 8259.0, 3403.0, 1667.0, 862.0, 459.0, 263.0, 197.0, 94.0, 79.0, 51.0, 40.0, 24.0, 21.0, 15.0, 16.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1949462890625, -0.1895923614501953, -0.18423843383789062, -0.17888450622558594, -0.17353057861328125, -0.16817665100097656, -0.16282272338867188, -0.1574687957763672, -0.1521148681640625, -0.1467609405517578, -0.14140701293945312, -0.13605308532714844, -0.13069915771484375, -0.12534523010253906, -0.11999130249023438, -0.11463737487792969, -0.109283447265625, -0.10392951965332031, -0.09857559204101562, -0.09322166442871094, -0.08786773681640625, -0.08251380920410156, -0.07715988159179688, -0.07180595397949219, -0.0664520263671875, -0.06109809875488281, -0.055744171142578125, -0.05039024353027344, -0.04503631591796875, -0.03968238830566406, -0.034328460693359375, -0.028974533081054688, -0.02362060546875, -0.018266677856445312, -0.012912750244140625, -0.0075588226318359375, -0.00220489501953125, 0.0031490325927734375, 0.008502960205078125, 0.013856887817382812, 0.0192108154296875, 0.024564743041992188, 0.029918670654296875, 0.03527259826660156, 0.04062652587890625, 0.04598045349121094, 0.051334381103515625, 0.05668830871582031, 0.062042236328125, 0.06739616394042969, 0.07275009155273438, 0.07810401916503906, 0.08345794677734375, 0.08881187438964844, 0.09416580200195312, 0.09951972961425781, 0.1048736572265625, 0.11022758483886719, 0.11558151245117188, 0.12093544006347656, 0.12628936767578125, 0.13164329528808594, 0.13699722290039062, 0.1423511505126953, 0.147705078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 5.0, 8.0, 8.0, 22.0, 22.0, 14.0, 15.0, 24.0, 31.0, 37.0, 34.0, 49.0, 51.0, 55.0, 51.0, 45.0, 44.0, 62.0, 50.0, 49.0, 34.0, 37.0, 37.0, 33.0, 25.0, 24.0, 28.0, 19.0, 19.0, 7.0, 16.0, 11.0, 6.0, 8.0, 1.0, 4.0, 5.0, 4.0], "bins": [-2.1484375, -2.0975341796875, -2.046630859375, -1.9957275390625, -1.94482421875, -1.8939208984375, -1.843017578125, -1.7921142578125, -1.7412109375, -1.6903076171875, -1.639404296875, -1.5885009765625, -1.53759765625, -1.4866943359375, -1.435791015625, -1.3848876953125, -1.333984375, -1.2830810546875, -1.232177734375, -1.1812744140625, -1.13037109375, -1.0794677734375, -1.028564453125, -0.9776611328125, -0.9267578125, -0.8758544921875, -0.824951171875, -0.7740478515625, -0.72314453125, -0.6722412109375, -0.621337890625, -0.5704345703125, -0.51953125, -0.4686279296875, -0.417724609375, -0.3668212890625, -0.31591796875, -0.2650146484375, -0.214111328125, -0.1632080078125, -0.1123046875, -0.0614013671875, -0.010498046875, 0.0404052734375, 0.09130859375, 0.1422119140625, 0.193115234375, 0.2440185546875, 0.294921875, 0.3458251953125, 0.396728515625, 0.4476318359375, 0.49853515625, 0.5494384765625, 0.600341796875, 0.6512451171875, 0.7021484375, 0.7530517578125, 0.803955078125, 0.8548583984375, 0.90576171875, 0.9566650390625, 1.007568359375, 1.0584716796875, 1.109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 14.0, 10.0, 15.0, 19.0, 36.0, 50.0, 84.0, 139.0, 227.0, 448.0, 1068.0, 2792.0, 10085.0, 53132.0, 440815.0, 466199.0, 57611.0, 10579.0, 2975.0, 1091.0, 500.0, 255.0, 135.0, 89.0, 60.0, 33.0, 28.0, 16.0, 17.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09307861328125, -0.09025955200195312, -0.08744049072265625, -0.08462142944335938, -0.0818023681640625, -0.07898330688476562, -0.07616424560546875, -0.07334518432617188, -0.070526123046875, -0.06770706176757812, -0.06488800048828125, -0.062068939208984375, -0.0592498779296875, -0.056430816650390625, -0.05361175537109375, -0.050792694091796875, -0.0479736328125, -0.045154571533203125, -0.04233551025390625, -0.039516448974609375, -0.0366973876953125, -0.033878326416015625, -0.03105926513671875, -0.028240203857421875, -0.025421142578125, -0.022602081298828125, -0.01978302001953125, -0.016963958740234375, -0.0141448974609375, -0.011325836181640625, -0.00850677490234375, -0.005687713623046875, -0.00286865234375, -4.9591064453125e-05, 0.00276947021484375, 0.005588531494140625, 0.0084075927734375, 0.011226654052734375, 0.01404571533203125, 0.016864776611328125, 0.019683837890625, 0.022502899169921875, 0.02532196044921875, 0.028141021728515625, 0.0309600830078125, 0.033779144287109375, 0.03659820556640625, 0.039417266845703125, 0.042236328125, 0.045055389404296875, 0.04787445068359375, 0.050693511962890625, 0.0535125732421875, 0.056331634521484375, 0.05915069580078125, 0.061969757080078125, 0.064788818359375, 0.06760787963867188, 0.07042694091796875, 0.07324600219726562, 0.0760650634765625, 0.07888412475585938, 0.08170318603515625, 0.08452224731445312, 0.08734130859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 8.0, 11.0, 8.0, 22.0, 28.0, 32.0, 46.0, 63.0, 78.0, 94.0, 110.0, 110.0, 96.0, 75.0, 54.0, 58.0, 23.0, 24.0, 15.0, 13.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.820657730102539e-05, -3.700517117977142e-05, -3.5803765058517456e-05, -3.460235893726349e-05, -3.340095281600952e-05, -3.2199546694755554e-05, -3.099814057350159e-05, -2.979673445224762e-05, -2.8595328330993652e-05, -2.7393922209739685e-05, -2.6192516088485718e-05, -2.499110996723175e-05, -2.3789703845977783e-05, -2.2588297724723816e-05, -2.138689160346985e-05, -2.018548548221588e-05, -1.8984079360961914e-05, -1.7782673239707947e-05, -1.658126711845398e-05, -1.5379860997200012e-05, -1.4178454875946045e-05, -1.2977048754692078e-05, -1.177564263343811e-05, -1.0574236512184143e-05, -9.372830390930176e-06, -8.171424269676208e-06, -6.970018148422241e-06, -5.768612027168274e-06, -4.567205905914307e-06, -3.3657997846603394e-06, -2.164393663406372e-06, -9.629875421524048e-07, 2.384185791015625e-07, 1.4398247003555298e-06, 2.641230821609497e-06, 3.842636942863464e-06, 5.044043064117432e-06, 6.245449185371399e-06, 7.446855306625366e-06, 8.648261427879333e-06, 9.8496675491333e-06, 1.1051073670387268e-05, 1.2252479791641235e-05, 1.3453885912895203e-05, 1.465529203414917e-05, 1.5856698155403137e-05, 1.7058104276657104e-05, 1.8259510397911072e-05, 1.946091651916504e-05, 2.0662322640419006e-05, 2.1863728761672974e-05, 2.306513488292694e-05, 2.4266541004180908e-05, 2.5467947125434875e-05, 2.6669353246688843e-05, 2.787075936794281e-05, 2.9072165489196777e-05, 3.0273571610450745e-05, 3.147497773170471e-05, 3.267638385295868e-05, 3.3877789974212646e-05, 3.5079196095466614e-05, 3.628060221672058e-05, 3.748200833797455e-05, 3.8683414459228516e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 13.0, 20.0, 30.0, 31.0, 73.0, 96.0, 169.0, 303.0, 565.0, 1111.0, 2258.0, 5093.0, 13241.0, 37969.0, 117304.0, 308031.0, 343093.0, 144606.0, 46842.0, 16039.0, 6301.0, 2623.0, 1236.0, 659.0, 327.0, 192.0, 119.0, 73.0, 48.0, 27.0, 17.0, 9.0, 9.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0579833984375, -0.056461334228515625, -0.05493927001953125, -0.053417205810546875, -0.0518951416015625, -0.050373077392578125, -0.04885101318359375, -0.047328948974609375, -0.045806884765625, -0.044284820556640625, -0.04276275634765625, -0.041240692138671875, -0.0397186279296875, -0.038196563720703125, -0.03667449951171875, -0.035152435302734375, -0.03363037109375, -0.032108306884765625, -0.03058624267578125, -0.029064178466796875, -0.0275421142578125, -0.026020050048828125, -0.02449798583984375, -0.022975921630859375, -0.021453857421875, -0.019931793212890625, -0.01840972900390625, -0.016887664794921875, -0.0153656005859375, -0.013843536376953125, -0.01232147216796875, -0.010799407958984375, -0.00927734375, -0.007755279541015625, -0.00623321533203125, -0.004711151123046875, -0.0031890869140625, -0.001667022705078125, -0.00014495849609375, 0.001377105712890625, 0.002899169921875, 0.004421234130859375, 0.00594329833984375, 0.007465362548828125, 0.0089874267578125, 0.010509490966796875, 0.01203155517578125, 0.013553619384765625, 0.01507568359375, 0.016597747802734375, 0.01811981201171875, 0.019641876220703125, 0.0211639404296875, 0.022686004638671875, 0.02420806884765625, 0.025730133056640625, 0.027252197265625, 0.028774261474609375, 0.03029632568359375, 0.031818389892578125, 0.0333404541015625, 0.034862518310546875, 0.03638458251953125, 0.037906646728515625, 0.0394287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 0.0, 3.0, 6.0, 4.0, 9.0, 13.0, 12.0, 12.0, 21.0, 16.0, 25.0, 29.0, 33.0, 49.0, 49.0, 37.0, 53.0, 49.0, 64.0, 58.0, 63.0, 71.0, 56.0, 49.0, 46.0, 35.0, 26.0, 22.0, 20.0, 17.0, 10.0, 8.0, 11.0, 4.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010772705078125, -0.010311126708984375, -0.00984954833984375, -0.009387969970703125, -0.0089263916015625, -0.008464813232421875, -0.00800323486328125, -0.007541656494140625, -0.007080078125, -0.006618499755859375, -0.00615692138671875, -0.005695343017578125, -0.0052337646484375, -0.004772186279296875, -0.00431060791015625, -0.003849029541015625, -0.003387451171875, -0.002925872802734375, -0.00246429443359375, -0.002002716064453125, -0.0015411376953125, -0.001079559326171875, -0.00061798095703125, -0.000156402587890625, 0.00030517578125, 0.000766754150390625, 0.00122833251953125, 0.001689910888671875, 0.0021514892578125, 0.002613067626953125, 0.00307464599609375, 0.003536224365234375, 0.003997802734375, 0.004459381103515625, 0.00492095947265625, 0.005382537841796875, 0.0058441162109375, 0.006305694580078125, 0.00676727294921875, 0.007228851318359375, 0.0076904296875, 0.008152008056640625, 0.00861358642578125, 0.009075164794921875, 0.0095367431640625, 0.009998321533203125, 0.01045989990234375, 0.010921478271484375, 0.011383056640625, 0.011844635009765625, 0.01230621337890625, 0.012767791748046875, 0.0132293701171875, 0.013690948486328125, 0.01415252685546875, 0.014614105224609375, 0.01507568359375, 0.015537261962890625, 0.01599884033203125, 0.016460418701171875, 0.0169219970703125, 0.017383575439453125, 0.01784515380859375, 0.018306732177734375, 0.018768310546875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 15.0, 29.0, 68.0, 175.0, 291.0, 248.0, 102.0, 45.0, 16.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.492897868156433, -1.3916181325912476, -1.2903382778167725, -1.189058542251587, -1.0877788066864014, -0.9864989519119263, -0.8852192163467407, -0.7839394211769104, -0.6826596260070801, -0.5813798308372498, -0.4801000654697418, -0.3788203001022339, -0.27754050493240356, -0.17626070976257324, -0.0749809741973877, 0.026298820972442627, 0.12757861614227295, 0.22885839641094208, 0.3301381766796112, 0.43141794204711914, 0.5326977372169495, 0.6339775323867798, 0.7352572679519653, 0.8365370631217957, 0.937816858291626, 1.0390965938568115, 1.1403764486312866, 1.2416561841964722, 1.3429360389709473, 1.4442157745361328, 1.5454955101013184, 1.646775245666504, 1.7480549812316895, 1.849334716796875, 1.95061457157135, 2.051894187927246, 2.1531741619110107, 2.2544538974761963, 2.355733633041382, 2.4570133686065674, 2.558293342590332, 2.6595730781555176, 2.760852813720703, 2.8621325492858887, 2.9634125232696533, 3.064692258834839, 3.1659719944000244, 3.26725172996521, 3.3685314655303955, 3.469811201095581, 3.5710909366607666, 3.6723709106445312, 3.773650646209717, 3.8749303817749023, 3.976210117340088, 4.077489852905273, 4.178769588470459, 4.2800493240356445, 4.38132905960083, 4.482608795166016, 4.583888530731201, 4.685168266296387, 4.7864484786987305, 4.887728214263916, 4.989007949829102]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 18.0, 21.0, 18.0, 23.0, 34.0, 36.0, 40.0, 44.0, 68.0, 67.0, 59.0, 81.0, 74.0, 70.0, 51.0, 40.0, 47.0, 44.0, 30.0, 21.0, 17.0, 21.0, 10.0, 8.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8784547448158264, -0.8474689722061157, -0.816483199596405, -0.7854974269866943, -0.7545115947723389, -0.7235258221626282, -0.6925400495529175, -0.6615542769432068, -0.6305685043334961, -0.5995827317237854, -0.5685969591140747, -0.5376111268997192, -0.5066253542900085, -0.47563958168029785, -0.44465380907058716, -0.41366803646087646, -0.382682204246521, -0.3516964316368103, -0.3207106292247772, -0.28972485661506653, -0.25873905420303345, -0.22775328159332275, -0.19676750898361206, -0.16578172147274017, -0.1347959339618683, -0.1038101464509964, -0.07282436639070511, -0.04183858633041382, -0.010852798819541931, 0.020132988691329956, 0.05111876130104065, 0.08210454881191254, 0.11309027671813965, 0.14407606422901154, 0.17506185173988342, 0.20604762434959412, 0.237033411860466, 0.2680191993713379, 0.2990049719810486, 0.3299907445907593, 0.36097654700279236, 0.39196231961250305, 0.42294812202453613, 0.4539338946342468, 0.4849196672439575, 0.515905499458313, 0.5468912124633789, 0.5778770446777344, 0.6088628172874451, 0.6398485898971558, 0.6708343625068665, 0.7018201351165771, 0.7328059673309326, 0.7637917399406433, 0.794777512550354, 0.8257632851600647, 0.8567490577697754, 0.8877348303794861, 0.9187206029891968, 0.9497064352035522, 0.9806922078132629, 1.0116779804229736, 1.042663812637329, 1.073649525642395, 1.1046353578567505]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 16.0, 10.0, 14.0, 30.0, 52.0, 104.0, 190.0, 402.0, 838.0, 1937.0, 4847.0, 14138.0, 52634.0, 325768.0, 529410.0, 86259.0, 20532.0, 6720.0, 2511.0, 1110.0, 490.0, 230.0, 122.0, 74.0, 24.0, 18.0, 15.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78515625, -0.7582244873046875, -0.731292724609375, -0.7043609619140625, -0.67742919921875, -0.6504974365234375, -0.623565673828125, -0.5966339111328125, -0.5697021484375, -0.5427703857421875, -0.515838623046875, -0.4889068603515625, -0.46197509765625, -0.4350433349609375, -0.408111572265625, -0.3811798095703125, -0.354248046875, -0.3273162841796875, -0.300384521484375, -0.2734527587890625, -0.24652099609375, -0.2195892333984375, -0.192657470703125, -0.1657257080078125, -0.1387939453125, -0.1118621826171875, -0.084930419921875, -0.0579986572265625, -0.03106689453125, -0.0041351318359375, 0.022796630859375, 0.0497283935546875, 0.07666015625, 0.1035919189453125, 0.130523681640625, 0.1574554443359375, 0.18438720703125, 0.2113189697265625, 0.238250732421875, 0.2651824951171875, 0.2921142578125, 0.3190460205078125, 0.345977783203125, 0.3729095458984375, 0.39984130859375, 0.4267730712890625, 0.453704833984375, 0.4806365966796875, 0.507568359375, 0.5345001220703125, 0.561431884765625, 0.5883636474609375, 0.61529541015625, 0.6422271728515625, 0.669158935546875, 0.6960906982421875, 0.7230224609375, 0.7499542236328125, 0.776885986328125, 0.8038177490234375, 0.83074951171875, 0.8576812744140625, 0.884613037109375, 0.9115447998046875, 0.9384765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 14.0, 13.0, 13.0, 12.0, 22.0, 32.0, 45.0, 34.0, 55.0, 63.0, 59.0, 68.0, 70.0, 71.0, 73.0, 51.0, 45.0, 45.0, 44.0, 31.0, 29.0, 25.0, 14.0, 15.0, 12.0, 4.0, 5.0, 9.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6064453125, -1.5441436767578125, -1.481842041015625, -1.4195404052734375, -1.35723876953125, -1.2949371337890625, -1.232635498046875, -1.1703338623046875, -1.1080322265625, -1.0457305908203125, -0.983428955078125, -0.9211273193359375, -0.85882568359375, -0.7965240478515625, -0.734222412109375, -0.6719207763671875, -0.609619140625, -0.5473175048828125, -0.485015869140625, -0.4227142333984375, -0.36041259765625, -0.2981109619140625, -0.235809326171875, -0.1735076904296875, -0.1112060546875, -0.0489044189453125, 0.013397216796875, 0.0756988525390625, 0.13800048828125, 0.2003021240234375, 0.262603759765625, 0.3249053955078125, 0.38720703125, 0.4495086669921875, 0.511810302734375, 0.5741119384765625, 0.63641357421875, 0.6987152099609375, 0.761016845703125, 0.8233184814453125, 0.8856201171875, 0.9479217529296875, 1.010223388671875, 1.0725250244140625, 1.13482666015625, 1.1971282958984375, 1.259429931640625, 1.3217315673828125, 1.384033203125, 1.4463348388671875, 1.508636474609375, 1.5709381103515625, 1.63323974609375, 1.6955413818359375, 1.757843017578125, 1.8201446533203125, 1.8824462890625, 1.9447479248046875, 2.007049560546875, 2.0693511962890625, 2.13165283203125, 2.1939544677734375, 2.256256103515625, 2.3185577392578125, 2.380859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 14.0, 8.0, 11.0, 18.0, 22.0, 29.0, 39.0, 52.0, 88.0, 121.0, 198.0, 356.0, 691.0, 2478.0, 16628.0, 277751.0, 705665.0, 37647.0, 4553.0, 1028.0, 411.0, 225.0, 127.0, 109.0, 56.0, 55.0, 39.0, 34.0, 22.0, 14.0, 13.0, 11.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.05078125, -1.0106353759765625, -0.970489501953125, -0.9303436279296875, -0.89019775390625, -0.8500518798828125, -0.809906005859375, -0.7697601318359375, -0.7296142578125, -0.6894683837890625, -0.649322509765625, -0.6091766357421875, -0.56903076171875, -0.5288848876953125, -0.488739013671875, -0.4485931396484375, -0.408447265625, -0.3683013916015625, -0.328155517578125, -0.2880096435546875, -0.24786376953125, -0.2077178955078125, -0.167572021484375, -0.1274261474609375, -0.0872802734375, -0.0471343994140625, -0.006988525390625, 0.0331573486328125, 0.07330322265625, 0.1134490966796875, 0.153594970703125, 0.1937408447265625, 0.23388671875, 0.2740325927734375, 0.314178466796875, 0.3543243408203125, 0.39447021484375, 0.4346160888671875, 0.474761962890625, 0.5149078369140625, 0.5550537109375, 0.5951995849609375, 0.635345458984375, 0.6754913330078125, 0.71563720703125, 0.7557830810546875, 0.795928955078125, 0.8360748291015625, 0.876220703125, 0.9163665771484375, 0.956512451171875, 0.9966583251953125, 1.03680419921875, 1.0769500732421875, 1.117095947265625, 1.1572418212890625, 1.1973876953125, 1.2375335693359375, 1.277679443359375, 1.3178253173828125, 1.35797119140625, 1.3981170654296875, 1.438262939453125, 1.4784088134765625, 1.5185546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 3.0, 7.0, 12.0, 20.0, 13.0, 20.0, 23.0, 14.0, 22.0, 21.0, 32.0, 25.0, 28.0, 28.0, 36.0, 33.0, 34.0, 42.0, 28.0, 41.0, 40.0, 30.0, 39.0, 40.0, 32.0, 28.0, 34.0, 34.0, 36.0, 24.0, 11.0, 19.0, 16.0, 18.0, 7.0, 14.0, 14.0, 11.0, 8.0, 6.0, 6.0, 2.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.4521484375, -1.409637451171875, -1.36712646484375, -1.324615478515625, -1.2821044921875, -1.239593505859375, -1.19708251953125, -1.154571533203125, -1.112060546875, -1.069549560546875, -1.02703857421875, -0.984527587890625, -0.9420166015625, -0.899505615234375, -0.85699462890625, -0.814483642578125, -0.77197265625, -0.729461669921875, -0.68695068359375, -0.644439697265625, -0.6019287109375, -0.559417724609375, -0.51690673828125, -0.474395751953125, -0.431884765625, -0.389373779296875, -0.34686279296875, -0.304351806640625, -0.2618408203125, -0.219329833984375, -0.17681884765625, -0.134307861328125, -0.091796875, -0.049285888671875, -0.00677490234375, 0.035736083984375, 0.0782470703125, 0.120758056640625, 0.16326904296875, 0.205780029296875, 0.248291015625, 0.290802001953125, 0.33331298828125, 0.375823974609375, 0.4183349609375, 0.460845947265625, 0.50335693359375, 0.545867919921875, 0.58837890625, 0.630889892578125, 0.67340087890625, 0.715911865234375, 0.7584228515625, 0.800933837890625, 0.84344482421875, 0.885955810546875, 0.928466796875, 0.970977783203125, 1.01348876953125, 1.055999755859375, 1.0985107421875, 1.141021728515625, 1.18353271484375, 1.226043701171875, 1.2685546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 10.0, 13.0, 22.0, 23.0, 55.0, 145.0, 302.0, 1173.0, 7888.0, 560374.0, 469558.0, 7273.0, 1109.0, 334.0, 129.0, 64.0, 36.0, 15.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -1.00384521484375, -0.9774169921875, -0.95098876953125, -0.924560546875, -0.89813232421875, -0.8717041015625, -0.84527587890625, -0.81884765625, -0.79241943359375, -0.7659912109375, -0.73956298828125, -0.713134765625, -0.68670654296875, -0.6602783203125, -0.63385009765625, -0.607421875, -0.58099365234375, -0.5545654296875, -0.52813720703125, -0.501708984375, -0.47528076171875, -0.4488525390625, -0.42242431640625, -0.39599609375, -0.36956787109375, -0.3431396484375, -0.31671142578125, -0.290283203125, -0.26385498046875, -0.2374267578125, -0.21099853515625, -0.1845703125, -0.15814208984375, -0.1317138671875, -0.10528564453125, -0.078857421875, -0.05242919921875, -0.0260009765625, 0.00042724609375, 0.02685546875, 0.05328369140625, 0.0797119140625, 0.10614013671875, 0.132568359375, 0.15899658203125, 0.1854248046875, 0.21185302734375, 0.23828125, 0.26470947265625, 0.2911376953125, 0.31756591796875, 0.343994140625, 0.37042236328125, 0.3968505859375, 0.42327880859375, 0.44970703125, 0.47613525390625, 0.5025634765625, 0.52899169921875, 0.555419921875, 0.58184814453125, 0.6082763671875, 0.63470458984375, 0.6611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 24.0, 44.0, 91.0, 194.0, 263.0, 172.0, 101.0, 48.0, 20.0, 16.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00016307830810546875, -0.00015956629067659378, -0.0001560542732477188, -0.00015254225581884384, -0.00014903023838996887, -0.0001455182209610939, -0.00014200620353221893, -0.00013849418610334396, -0.000134982168674469, -0.00013147015124559402, -0.00012795813381671906, -0.00012444611638784409, -0.00012093409895896912, -0.00011742208153009415, -0.00011391006410121918, -0.00011039804667234421, -0.00010688602924346924, -0.00010337401181459427, -9.98619943857193e-05, -9.634997695684433e-05, -9.283795952796936e-05, -8.932594209909439e-05, -8.581392467021942e-05, -8.230190724134445e-05, -7.878988981246948e-05, -7.527787238359451e-05, -7.176585495471954e-05, -6.825383752584457e-05, -6.47418200969696e-05, -6.122980266809464e-05, -5.7717785239219666e-05, -5.4205767810344696e-05, -5.0693750381469727e-05, -4.718173295259476e-05, -4.366971552371979e-05, -4.015769809484482e-05, -3.664568066596985e-05, -3.313366323709488e-05, -2.962164580821991e-05, -2.610962837934494e-05, -2.259761095046997e-05, -1.9085593521595e-05, -1.5573576092720032e-05, -1.2061558663845062e-05, -8.549541234970093e-06, -5.037523806095123e-06, -1.5255063772201538e-06, 1.9865110516548157e-06, 5.498528480529785e-06, 9.010545909404755e-06, 1.2522563338279724e-05, 1.6034580767154694e-05, 1.9546598196029663e-05, 2.3058615624904633e-05, 2.6570633053779602e-05, 3.008265048265457e-05, 3.359466791152954e-05, 3.710668534040451e-05, 4.061870276927948e-05, 4.413072019815445e-05, 4.764273762702942e-05, 5.115475505590439e-05, 5.466677248477936e-05, 5.817878991365433e-05, 6.16908073425293e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 9.0, 17.0, 23.0, 42.0, 85.0, 198.0, 419.0, 1092.0, 3044.0, 15968.0, 550345.0, 458188.0, 14372.0, 2953.0, 1026.0, 400.0, 164.0, 78.0, 44.0, 24.0, 15.0, 15.0, 6.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5843276977539062, -0.5641632080078125, -0.5439987182617188, -0.523834228515625, -0.5036697387695312, -0.4835052490234375, -0.46334075927734375, -0.44317626953125, -0.42301177978515625, -0.4028472900390625, -0.38268280029296875, -0.362518310546875, -0.34235382080078125, -0.3221893310546875, -0.30202484130859375, -0.2818603515625, -0.26169586181640625, -0.2415313720703125, -0.22136688232421875, -0.201202392578125, -0.18103790283203125, -0.1608734130859375, -0.14070892333984375, -0.12054443359375, -0.10037994384765625, -0.0802154541015625, -0.06005096435546875, -0.039886474609375, -0.01972198486328125, 0.0004425048828125, 0.02060699462890625, 0.040771484375, 0.06093597412109375, 0.0811004638671875, 0.10126495361328125, 0.121429443359375, 0.14159393310546875, 0.1617584228515625, 0.18192291259765625, 0.20208740234375, 0.22225189208984375, 0.2424163818359375, 0.26258087158203125, 0.282745361328125, 0.30290985107421875, 0.3230743408203125, 0.34323883056640625, 0.3634033203125, 0.38356781005859375, 0.4037322998046875, 0.42389678955078125, 0.444061279296875, 0.46422576904296875, 0.4843902587890625, 0.5045547485351562, 0.52471923828125, 0.5448837280273438, 0.5650482177734375, 0.5852127075195312, 0.605377197265625, 0.6255416870117188, 0.6457061767578125, 0.6658706665039062, 0.68603515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 5.0, 15.0, 29.0, 28.0, 67.0, 104.0, 153.0, 176.0, 148.0, 90.0, 57.0, 48.0, 29.0, 13.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.216552734375, -0.2100696563720703, -0.20358657836914062, -0.19710350036621094, -0.19062042236328125, -0.18413734436035156, -0.17765426635742188, -0.1711711883544922, -0.1646881103515625, -0.1582050323486328, -0.15172195434570312, -0.14523887634277344, -0.13875579833984375, -0.13227272033691406, -0.12578964233398438, -0.11930656433105469, -0.112823486328125, -0.10634040832519531, -0.09985733032226562, -0.09337425231933594, -0.08689117431640625, -0.08040809631347656, -0.07392501831054688, -0.06744194030761719, -0.0609588623046875, -0.05447578430175781, -0.047992706298828125, -0.04150962829589844, -0.03502655029296875, -0.028543472290039062, -0.022060394287109375, -0.015577316284179688, -0.00909423828125, -0.0026111602783203125, 0.003871917724609375, 0.010354995727539062, 0.01683807373046875, 0.023321151733398438, 0.029804229736328125, 0.03628730773925781, 0.0427703857421875, 0.04925346374511719, 0.055736541748046875, 0.06221961975097656, 0.06870269775390625, 0.07518577575683594, 0.08166885375976562, 0.08815193176269531, 0.094635009765625, 0.10111808776855469, 0.10760116577148438, 0.11408424377441406, 0.12056732177734375, 0.12705039978027344, 0.13353347778320312, 0.1400165557861328, 0.1464996337890625, 0.1529827117919922, 0.15946578979492188, 0.16594886779785156, 0.17243194580078125, 0.17891502380371094, 0.18539810180664062, 0.1918811798095703, 0.1983642578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 13.0, 35.0, 90.0, 233.0, 311.0, 195.0, 79.0, 22.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.189291000366211, -10.975666999816895, -10.762042999267578, -10.548418998718262, -10.334795951843262, -10.121171951293945, -9.907547950744629, -9.693923950195312, -9.480299949645996, -9.26667594909668, -9.053051948547363, -8.839427947998047, -8.625804901123047, -8.41218090057373, -8.198556900024414, -7.984932899475098, -7.771308898925781, -7.557684898376465, -7.344061374664307, -7.13043737411499, -6.916813373565674, -6.703189849853516, -6.489565849304199, -6.275941848754883, -6.062318325042725, -5.848694324493408, -5.63507080078125, -5.421446800231934, -5.207822799682617, -4.994198799133301, -4.780575275421143, -4.566951274871826, -4.35332727432251, -4.139703273773193, -3.926079511642456, -3.7124557495117188, -3.4988317489624023, -3.285207986831665, -3.0715842247009277, -2.8579602241516113, -2.644336223602295, -2.4307124614715576, -2.217088460922241, -2.003464698791504, -1.7898406982421875, -1.5762169361114502, -1.3625930547714233, -1.1489691734313965, -0.9353454113006592, -0.7217215299606323, -0.5080976486206055, -0.2944738268852234, -0.08084994554519653, 0.13277387619018555, 0.3463977575302124, 0.5600216388702393, 0.7736455202102661, 0.987269401550293, 1.2008932828903198, 1.4145171642303467, 1.628140926361084, 1.8417648077011108, 2.0553886890411377, 2.269012451171875, 2.4826364517211914]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 6.0, 6.0, 10.0, 9.0, 16.0, 9.0, 18.0, 13.0, 22.0, 25.0, 25.0, 28.0, 27.0, 51.0, 43.0, 50.0, 49.0, 35.0, 43.0, 41.0, 46.0, 36.0, 34.0, 43.0, 36.0, 33.0, 33.0, 31.0, 22.0, 18.0, 19.0, 17.0, 21.0, 13.0, 12.0, 9.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.9308040142059326, -2.8450233936309814, -2.7592430114746094, -2.673462390899658, -2.587681770324707, -2.501901149749756, -2.4161205291748047, -2.3303401470184326, -2.2445595264434814, -2.1587789058685303, -2.072998523712158, -1.987217903137207, -1.9014372825622559, -1.8156566619873047, -1.729876160621643, -1.6440956592559814, -1.5583150386810303, -1.472534418106079, -1.3867539167404175, -1.3009734153747559, -1.2151927947998047, -1.1294121742248535, -1.043631672859192, -0.9578511118888855, -0.8720705509185791, -0.7862899899482727, -0.7005094289779663, -0.6147288680076599, -0.5289483070373535, -0.4431677460670471, -0.3573871850967407, -0.2716066241264343, -0.18582582473754883, -0.10004526376724243, -0.014264702796936035, 0.07151585817337036, 0.15729641914367676, 0.24307698011398315, 0.32885754108428955, 0.41463810205459595, 0.5004186630249023, 0.5861992239952087, 0.6719797849655151, 0.7577603459358215, 0.8435409069061279, 0.9293214678764343, 1.0151020288467407, 1.1008825302124023, 1.1866631507873535, 1.2724437713623047, 1.3582242727279663, 1.444004774093628, 1.529785394668579, 1.6155660152435303, 1.701346516609192, 1.7871270179748535, 1.8729076385498047, 1.9586882591247559, 2.044468879699707, 2.130249261856079, 2.2160298824310303, 2.3018105030059814, 2.3875908851623535, 2.4733715057373047, 2.559152126312256]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 12.0, 15.0, 10.0, 26.0, 48.0, 43.0, 74.0, 116.0, 186.0, 307.0, 621.0, 1415.0, 4961.0, 40397.0, 1737134.0, 2350566.0, 50571.0, 4923.0, 1343.0, 562.0, 296.0, 211.0, 96.0, 96.0, 53.0, 39.0, 42.0, 19.0, 16.0, 15.0, 12.0, 8.0, 5.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.65234375, -2.564056396484375, -2.47576904296875, -2.387481689453125, -2.2991943359375, -2.210906982421875, -2.12261962890625, -2.034332275390625, -1.946044921875, -1.857757568359375, -1.76947021484375, -1.681182861328125, -1.5928955078125, -1.504608154296875, -1.41632080078125, -1.328033447265625, -1.23974609375, -1.151458740234375, -1.06317138671875, -0.974884033203125, -0.8865966796875, -0.798309326171875, -0.71002197265625, -0.621734619140625, -0.533447265625, -0.445159912109375, -0.35687255859375, -0.268585205078125, -0.1802978515625, -0.092010498046875, -0.00372314453125, 0.084564208984375, 0.1728515625, 0.261138916015625, 0.34942626953125, 0.437713623046875, 0.5260009765625, 0.614288330078125, 0.70257568359375, 0.790863037109375, 0.879150390625, 0.967437744140625, 1.05572509765625, 1.144012451171875, 1.2322998046875, 1.320587158203125, 1.40887451171875, 1.497161865234375, 1.58544921875, 1.673736572265625, 1.76202392578125, 1.850311279296875, 1.9385986328125, 2.026885986328125, 2.11517333984375, 2.203460693359375, 2.291748046875, 2.380035400390625, 2.46832275390625, 2.556610107421875, 2.6448974609375, 2.733184814453125, 2.82147216796875, 2.909759521484375, 2.998046875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 7.0, 8.0, 10.0, 16.0, 14.0, 15.0, 31.0, 36.0, 36.0, 49.0, 55.0, 55.0, 78.0, 74.0, 65.0, 66.0, 49.0, 52.0, 59.0, 52.0, 34.0, 23.0, 30.0, 19.0, 11.0, 13.0, 9.0, 1.0, 4.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.065704345703125, -1.02789306640625, -0.990081787109375, -0.9522705078125, -0.914459228515625, -0.87664794921875, -0.838836669921875, -0.801025390625, -0.763214111328125, -0.72540283203125, -0.687591552734375, -0.6497802734375, -0.611968994140625, -0.57415771484375, -0.536346435546875, -0.49853515625, -0.460723876953125, -0.42291259765625, -0.385101318359375, -0.3472900390625, -0.309478759765625, -0.27166748046875, -0.233856201171875, -0.196044921875, -0.158233642578125, -0.12042236328125, -0.082611083984375, -0.0447998046875, -0.006988525390625, 0.03082275390625, 0.068634033203125, 0.1064453125, 0.144256591796875, 0.18206787109375, 0.219879150390625, 0.2576904296875, 0.295501708984375, 0.33331298828125, 0.371124267578125, 0.408935546875, 0.446746826171875, 0.48455810546875, 0.522369384765625, 0.5601806640625, 0.597991943359375, 0.63580322265625, 0.673614501953125, 0.71142578125, 0.749237060546875, 0.78704833984375, 0.824859619140625, 0.8626708984375, 0.900482177734375, 0.93829345703125, 0.976104736328125, 1.013916015625, 1.051727294921875, 1.08953857421875, 1.127349853515625, 1.1651611328125, 1.202972412109375, 1.24078369140625, 1.278594970703125, 1.31640625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 16.0, 21.0, 31.0, 42.0, 82.0, 124.0, 187.0, 294.0, 651.0, 1146.0, 2372.0, 6067.0, 20888.0, 141848.0, 3112060.0, 835255.0, 53922.0, 11684.0, 3831.0, 1677.0, 838.0, 473.0, 279.0, 166.0, 88.0, 74.0, 35.0, 33.0, 11.0, 22.0, 10.0, 13.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.822265625, -1.7740325927734375, -1.725799560546875, -1.6775665283203125, -1.62933349609375, -1.5811004638671875, -1.532867431640625, -1.4846343994140625, -1.4364013671875, -1.3881683349609375, -1.339935302734375, -1.2917022705078125, -1.24346923828125, -1.1952362060546875, -1.147003173828125, -1.0987701416015625, -1.050537109375, -1.0023040771484375, -0.954071044921875, -0.9058380126953125, -0.85760498046875, -0.8093719482421875, -0.761138916015625, -0.7129058837890625, -0.6646728515625, -0.6164398193359375, -0.568206787109375, -0.5199737548828125, -0.47174072265625, -0.4235076904296875, -0.375274658203125, -0.3270416259765625, -0.27880859375, -0.2305755615234375, -0.182342529296875, -0.1341094970703125, -0.08587646484375, -0.0376434326171875, 0.010589599609375, 0.0588226318359375, 0.1070556640625, 0.1552886962890625, 0.203521728515625, 0.2517547607421875, 0.29998779296875, 0.3482208251953125, 0.396453857421875, 0.4446868896484375, 0.492919921875, 0.5411529541015625, 0.589385986328125, 0.6376190185546875, 0.68585205078125, 0.7340850830078125, 0.782318115234375, 0.8305511474609375, 0.8787841796875, 0.9270172119140625, 0.975250244140625, 1.0234832763671875, 1.07171630859375, 1.1199493408203125, 1.168182373046875, 1.2164154052734375, 1.2646484375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 13.0, 25.0, 24.0, 27.0, 54.0, 75.0, 138.0, 281.0, 512.0, 734.0, 832.0, 546.0, 318.0, 182.0, 106.0, 57.0, 44.0, 29.0, 15.0, 12.0, 11.0, 1.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5625, -0.5459938049316406, -0.5294876098632812, -0.5129814147949219, -0.4964752197265625, -0.4799690246582031, -0.46346282958984375, -0.4469566345214844, -0.430450439453125, -0.4139442443847656, -0.39743804931640625, -0.3809318542480469, -0.3644256591796875, -0.3479194641113281, -0.33141326904296875, -0.3149070739746094, -0.29840087890625, -0.2818946838378906, -0.26538848876953125, -0.24888229370117188, -0.2323760986328125, -0.21586990356445312, -0.19936370849609375, -0.18285751342773438, -0.166351318359375, -0.14984512329101562, -0.13333892822265625, -0.11683273315429688, -0.1003265380859375, -0.08382034301757812, -0.06731414794921875, -0.050807952880859375, -0.0343017578125, -0.017795562744140625, -0.00128936767578125, 0.015216827392578125, 0.0317230224609375, 0.048229217529296875, 0.06473541259765625, 0.08124160766601562, 0.097747802734375, 0.11425399780273438, 0.13076019287109375, 0.14726638793945312, 0.1637725830078125, 0.18027877807617188, 0.19678497314453125, 0.21329116821289062, 0.22979736328125, 0.24630355834960938, 0.26280975341796875, 0.2793159484863281, 0.2958221435546875, 0.3123283386230469, 0.32883453369140625, 0.3453407287597656, 0.361846923828125, 0.3783531188964844, 0.39485931396484375, 0.4113655090332031, 0.4278717041015625, 0.4443778991699219, 0.46088409423828125, 0.4773902893066406, 0.493896484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 8.0, 18.0, 24.0, 38.0, 51.0, 94.0, 127.0, 170.0, 159.0, 112.0, 82.0, 42.0, 36.0, 17.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7463443279266357, -3.6642932891845703, -3.582242250442505, -3.5001912117004395, -3.418140172958374, -3.3360891342163086, -3.254038095474243, -3.1719870567321777, -3.089935779571533, -3.0078847408294678, -2.9258337020874023, -2.843782663345337, -2.7617316246032715, -2.679680585861206, -2.5976295471191406, -2.515578269958496, -2.4335274696350098, -2.3514764308929443, -2.269425392150879, -2.1873743534088135, -2.105323314666748, -2.0232722759246826, -1.9412211179733276, -1.8591700792312622, -1.7771190404891968, -1.6950680017471313, -1.613016963005066, -1.5309659242630005, -1.4489147663116455, -1.36686372756958, -1.2848126888275146, -1.2027616500854492, -1.1207103729248047, -1.0386593341827393, -0.9566082954406738, -0.8745571970939636, -0.7925061583518982, -0.7104551196098328, -0.6284040212631226, -0.5463529825210571, -0.4643019437789917, -0.38225090503692627, -0.30019983649253845, -0.21814878284931183, -0.1360977292060852, -0.054046690464019775, 0.028004378080368042, 0.11005544662475586, 0.1921064853668213, 0.2741575241088867, 0.35620859265327454, 0.43825966119766235, 0.5203106999397278, 0.6023617386817932, 0.6844128370285034, 0.7664638757705688, 0.8485149145126343, 0.9305659532546997, 1.0126169919967651, 1.0946680307388306, 1.1767191886901855, 1.258770227432251, 1.3408212661743164, 1.4228723049163818, 1.5049233436584473]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 6.0, 14.0, 16.0, 19.0, 19.0, 21.0, 27.0, 41.0, 33.0, 52.0, 51.0, 60.0, 49.0, 53.0, 55.0, 57.0, 48.0, 58.0, 39.0, 31.0, 52.0, 28.0, 31.0, 22.0, 21.0, 19.0, 13.0, 16.0, 9.0, 3.0, 3.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2287441492080688, -1.19148588180542, -1.154227614402771, -1.1169694662094116, -1.0797111988067627, -1.0424529314041138, -1.0051946640014648, -0.9679363965988159, -0.9306781888008118, -0.8934199213981628, -0.8561617136001587, -0.8189034461975098, -0.7816451787948608, -0.7443869709968567, -0.7071287035942078, -0.6698704957962036, -0.6326122283935547, -0.5953539609909058, -0.5580957531929016, -0.5208374857902527, -0.48357924818992615, -0.4463210105895996, -0.4090627431869507, -0.37180450558662415, -0.3345462679862976, -0.29728803038597107, -0.26002979278564453, -0.2227715253829956, -0.18551328778266907, -0.14825505018234253, -0.1109967976808548, -0.07373854517936707, -0.03648042678833008, 0.0007778182625770569, 0.03803606331348419, 0.07529430836439133, 0.11255255341529846, 0.149810791015625, 0.18706904351711273, 0.22432729601860046, 0.261585533618927, 0.29884377121925354, 0.3361020088195801, 0.373360276222229, 0.41061851382255554, 0.4478767514228821, 0.485135018825531, 0.5223932266235352, 0.5596514940261841, 0.596909761428833, 0.6341679692268372, 0.6714262366294861, 0.7086844444274902, 0.7459427118301392, 0.7832009792327881, 0.820459246635437, 0.8577174544334412, 0.8949757218360901, 0.9322339296340942, 0.9694921970367432, 1.006750464439392, 1.044008731842041, 1.0812668800354004, 1.1185251474380493, 1.1557834148406982]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 5.0, 13.0, 12.0, 18.0, 21.0, 39.0, 44.0, 100.0, 169.0, 252.0, 477.0, 981.0, 1930.0, 4701.0, 12043.0, 38586.0, 145271.0, 443814.0, 290810.0, 74327.0, 21300.0, 7596.0, 3017.0, 1361.0, 703.0, 364.0, 182.0, 142.0, 72.0, 52.0, 29.0, 27.0, 28.0, 14.0, 12.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1920166015625, -0.1855640411376953, -0.17911148071289062, -0.17265892028808594, -0.16620635986328125, -0.15975379943847656, -0.15330123901367188, -0.1468486785888672, -0.1403961181640625, -0.1339435577392578, -0.12749099731445312, -0.12103843688964844, -0.11458587646484375, -0.10813331604003906, -0.10168075561523438, -0.09522819519042969, -0.088775634765625, -0.08232307434082031, -0.07587051391601562, -0.06941795349121094, -0.06296539306640625, -0.05651283264160156, -0.050060272216796875, -0.04360771179199219, -0.0371551513671875, -0.030702590942382812, -0.024250030517578125, -0.017797470092773438, -0.01134490966796875, -0.0048923492431640625, 0.001560211181640625, 0.008012771606445312, 0.01446533203125, 0.020917892456054688, 0.027370452880859375, 0.03382301330566406, 0.04027557373046875, 0.04672813415527344, 0.053180694580078125, 0.05963325500488281, 0.0660858154296875, 0.07253837585449219, 0.07899093627929688, 0.08544349670410156, 0.09189605712890625, 0.09834861755371094, 0.10480117797851562, 0.11125373840332031, 0.117706298828125, 0.12415885925292969, 0.13061141967773438, 0.13706398010253906, 0.14351654052734375, 0.14996910095214844, 0.15642166137695312, 0.1628742218017578, 0.1693267822265625, 0.1757793426513672, 0.18223190307617188, 0.18868446350097656, 0.19513702392578125, 0.20158958435058594, 0.20804214477539062, 0.2144947052001953, 0.220947265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 11.0, 7.0, 5.0, 11.0, 20.0, 23.0, 29.0, 30.0, 34.0, 45.0, 63.0, 52.0, 66.0, 46.0, 52.0, 72.0, 55.0, 47.0, 52.0, 50.0, 29.0, 38.0, 29.0, 28.0, 23.0, 11.0, 15.0, 10.0, 10.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9228515625, -0.8954696655273438, -0.8680877685546875, -0.8407058715820312, -0.813323974609375, -0.7859420776367188, -0.7585601806640625, -0.7311782836914062, -0.70379638671875, -0.6764144897460938, -0.6490325927734375, -0.6216506958007812, -0.594268798828125, -0.5668869018554688, -0.5395050048828125, -0.5121231079101562, -0.4847412109375, -0.45735931396484375, -0.4299774169921875, -0.40259552001953125, -0.375213623046875, -0.34783172607421875, -0.3204498291015625, -0.29306793212890625, -0.26568603515625, -0.23830413818359375, -0.2109222412109375, -0.18354034423828125, -0.156158447265625, -0.12877655029296875, -0.1013946533203125, -0.07401275634765625, -0.046630859375, -0.01924896240234375, 0.0081329345703125, 0.03551483154296875, 0.062896728515625, 0.09027862548828125, 0.1176605224609375, 0.14504241943359375, 0.17242431640625, 0.19980621337890625, 0.2271881103515625, 0.25457000732421875, 0.281951904296875, 0.30933380126953125, 0.3367156982421875, 0.36409759521484375, 0.3914794921875, 0.41886138916015625, 0.4462432861328125, 0.47362518310546875, 0.501007080078125, 0.5283889770507812, 0.5557708740234375, 0.5831527709960938, 0.61053466796875, 0.6379165649414062, 0.6652984619140625, 0.6926803588867188, 0.720062255859375, 0.7474441528320312, 0.7748260498046875, 0.8022079467773438, 0.82958984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 7.0, 10.0, 13.0, 19.0, 39.0, 54.0, 59.0, 97.0, 138.0, 208.0, 292.0, 472.0, 733.0, 1328.0, 2226.0, 4038.0, 7904.0, 16683.0, 35268.0, 79018.0, 175199.0, 290214.0, 229538.0, 110500.0, 49142.0, 22346.0, 10696.0, 5401.0, 2785.0, 1546.0, 950.0, 525.0, 337.0, 234.0, 158.0, 109.0, 82.0, 47.0, 28.0, 31.0, 24.0, 8.0, 7.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.12103271484375, -0.11744022369384766, -0.11384773254394531, -0.11025524139404297, -0.10666275024414062, -0.10307025909423828, -0.09947776794433594, -0.0958852767944336, -0.09229278564453125, -0.0887002944946289, -0.08510780334472656, -0.08151531219482422, -0.07792282104492188, -0.07433032989501953, -0.07073783874511719, -0.06714534759521484, -0.0635528564453125, -0.059960365295410156, -0.05636787414550781, -0.05277538299560547, -0.049182891845703125, -0.04559040069580078, -0.04199790954589844, -0.038405418395996094, -0.03481292724609375, -0.031220436096191406, -0.027627944946289062, -0.02403545379638672, -0.020442962646484375, -0.01685047149658203, -0.013257980346679688, -0.009665489196777344, -0.006072998046875, -0.0024805068969726562, 0.0011119842529296875, 0.004704475402832031, 0.008296966552734375, 0.011889457702636719, 0.015481948852539062, 0.019074440002441406, 0.02266693115234375, 0.026259422302246094, 0.029851913452148438, 0.03344440460205078, 0.037036895751953125, 0.04062938690185547, 0.04422187805175781, 0.047814369201660156, 0.0514068603515625, 0.054999351501464844, 0.05859184265136719, 0.06218433380126953, 0.06577682495117188, 0.06936931610107422, 0.07296180725097656, 0.0765542984008789, 0.08014678955078125, 0.0837392807006836, 0.08733177185058594, 0.09092426300048828, 0.09451675415039062, 0.09810924530029297, 0.10170173645019531, 0.10529422760009766, 0.10888671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 10.0, 10.0, 13.0, 18.0, 20.0, 12.0, 27.0, 21.0, 25.0, 30.0, 44.0, 31.0, 32.0, 53.0, 43.0, 38.0, 46.0, 42.0, 52.0, 39.0, 53.0, 41.0, 36.0, 45.0, 32.0, 31.0, 21.0, 22.0, 20.0, 12.0, 11.0, 16.0, 6.0, 5.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.376251220703125, -1.33355712890625, -1.290863037109375, -1.2481689453125, -1.205474853515625, -1.16278076171875, -1.120086669921875, -1.077392578125, -1.034698486328125, -0.99200439453125, -0.949310302734375, -0.9066162109375, -0.863922119140625, -0.82122802734375, -0.778533935546875, -0.73583984375, -0.693145751953125, -0.65045166015625, -0.607757568359375, -0.5650634765625, -0.522369384765625, -0.47967529296875, -0.436981201171875, -0.394287109375, -0.351593017578125, -0.30889892578125, -0.266204833984375, -0.2235107421875, -0.180816650390625, -0.13812255859375, -0.095428466796875, -0.052734375, -0.010040283203125, 0.03265380859375, 0.075347900390625, 0.1180419921875, 0.160736083984375, 0.20343017578125, 0.246124267578125, 0.288818359375, 0.331512451171875, 0.37420654296875, 0.416900634765625, 0.4595947265625, 0.502288818359375, 0.54498291015625, 0.587677001953125, 0.63037109375, 0.673065185546875, 0.71575927734375, 0.758453369140625, 0.8011474609375, 0.843841552734375, 0.88653564453125, 0.929229736328125, 0.971923828125, 1.014617919921875, 1.05731201171875, 1.100006103515625, 1.1427001953125, 1.185394287109375, 1.22808837890625, 1.270782470703125, 1.3134765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 10.0, 16.0, 11.0, 19.0, 28.0, 42.0, 68.0, 96.0, 177.0, 313.0, 518.0, 987.0, 2099.0, 4519.0, 12020.0, 40884.0, 172163.0, 454875.0, 265997.0, 64574.0, 17430.0, 6113.0, 2560.0, 1339.0, 684.0, 384.0, 239.0, 144.0, 72.0, 49.0, 43.0, 27.0, 17.0, 13.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055206298828125, -0.05340576171875, -0.051605224609375, -0.0498046875, -0.048004150390625, -0.04620361328125, -0.044403076171875, -0.0426025390625, -0.040802001953125, -0.03900146484375, -0.037200927734375, -0.035400390625, -0.033599853515625, -0.03179931640625, -0.029998779296875, -0.0281982421875, -0.026397705078125, -0.02459716796875, -0.022796630859375, -0.02099609375, -0.019195556640625, -0.01739501953125, -0.015594482421875, -0.0137939453125, -0.011993408203125, -0.01019287109375, -0.008392333984375, -0.006591796875, -0.004791259765625, -0.00299072265625, -0.001190185546875, 0.0006103515625, 0.002410888671875, 0.00421142578125, 0.006011962890625, 0.0078125, 0.009613037109375, 0.01141357421875, 0.013214111328125, 0.0150146484375, 0.016815185546875, 0.01861572265625, 0.020416259765625, 0.022216796875, 0.024017333984375, 0.02581787109375, 0.027618408203125, 0.0294189453125, 0.031219482421875, 0.03302001953125, 0.034820556640625, 0.03662109375, 0.038421630859375, 0.04022216796875, 0.042022705078125, 0.0438232421875, 0.045623779296875, 0.04742431640625, 0.049224853515625, 0.051025390625, 0.052825927734375, 0.05462646484375, 0.056427001953125, 0.0582275390625, 0.060028076171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 13.0, 11.0, 9.0, 18.0, 18.0, 18.0, 20.0, 42.0, 53.0, 61.0, 63.0, 90.0, 86.0, 104.0, 69.0, 82.0, 59.0, 31.0, 36.0, 38.0, 21.0, 10.0, 8.0, 10.0, 9.0, 4.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.325939178466797e-05, -3.231316804885864e-05, -3.1366944313049316e-05, -3.042072057723999e-05, -2.9474496841430664e-05, -2.8528273105621338e-05, -2.7582049369812012e-05, -2.6635825634002686e-05, -2.568960189819336e-05, -2.4743378162384033e-05, -2.3797154426574707e-05, -2.285093069076538e-05, -2.1904706954956055e-05, -2.095848321914673e-05, -2.0012259483337402e-05, -1.9066035747528076e-05, -1.811981201171875e-05, -1.7173588275909424e-05, -1.6227364540100098e-05, -1.528114080429077e-05, -1.4334917068481445e-05, -1.3388693332672119e-05, -1.2442469596862793e-05, -1.1496245861053467e-05, -1.055002212524414e-05, -9.603798389434814e-06, -8.657574653625488e-06, -7.711350917816162e-06, -6.765127182006836e-06, -5.81890344619751e-06, -4.872679710388184e-06, -3.926455974578857e-06, -2.9802322387695312e-06, -2.034008502960205e-06, -1.087784767150879e-06, -1.4156103134155273e-07, 8.046627044677734e-07, 1.7508864402770996e-06, 2.6971101760864258e-06, 3.643333911895752e-06, 4.589557647705078e-06, 5.535781383514404e-06, 6.4820051193237305e-06, 7.428228855133057e-06, 8.374452590942383e-06, 9.320676326751709e-06, 1.0266900062561035e-05, 1.1213123798370361e-05, 1.2159347534179688e-05, 1.3105571269989014e-05, 1.405179500579834e-05, 1.4998018741607666e-05, 1.5944242477416992e-05, 1.689046621322632e-05, 1.7836689949035645e-05, 1.878291368484497e-05, 1.9729137420654297e-05, 2.0675361156463623e-05, 2.162158489227295e-05, 2.2567808628082275e-05, 2.35140323638916e-05, 2.4460256099700928e-05, 2.5406479835510254e-05, 2.635270357131958e-05, 2.7298927307128906e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 7.0, 12.0, 12.0, 12.0, 32.0, 26.0, 39.0, 56.0, 107.0, 104.0, 189.0, 275.0, 395.0, 683.0, 1061.0, 1919.0, 3654.0, 7326.0, 15207.0, 35352.0, 87712.0, 202933.0, 304879.0, 216979.0, 96221.0, 39227.0, 17001.0, 7746.0, 3983.0, 2139.0, 1184.0, 757.0, 437.0, 296.0, 169.0, 127.0, 70.0, 53.0, 54.0, 30.0, 23.0, 22.0, 14.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.041290283203125, -0.04009532928466797, -0.03890037536621094, -0.037705421447753906, -0.036510467529296875, -0.035315513610839844, -0.03412055969238281, -0.03292560577392578, -0.03173065185546875, -0.03053569793701172, -0.029340744018554688, -0.028145790100097656, -0.026950836181640625, -0.025755882263183594, -0.024560928344726562, -0.02336597442626953, -0.0221710205078125, -0.02097606658935547, -0.019781112670898438, -0.018586158752441406, -0.017391204833984375, -0.016196250915527344, -0.015001296997070312, -0.013806343078613281, -0.01261138916015625, -0.011416435241699219, -0.010221481323242188, -0.009026527404785156, -0.007831573486328125, -0.006636619567871094, -0.0054416656494140625, -0.004246711730957031, -0.0030517578125, -0.0018568038940429688, -0.0006618499755859375, 0.0005331039428710938, 0.001728057861328125, 0.0029230117797851562, 0.0041179656982421875, 0.005312919616699219, 0.00650787353515625, 0.007702827453613281, 0.008897781372070312, 0.010092735290527344, 0.011287689208984375, 0.012482643127441406, 0.013677597045898438, 0.014872550964355469, 0.0160675048828125, 0.01726245880126953, 0.018457412719726562, 0.019652366638183594, 0.020847320556640625, 0.022042274475097656, 0.023237228393554688, 0.02443218231201172, 0.02562713623046875, 0.02682209014892578, 0.028017044067382812, 0.029211997985839844, 0.030406951904296875, 0.031601905822753906, 0.03279685974121094, 0.03399181365966797, 0.035186767578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 4.0, 6.0, 7.0, 13.0, 18.0, 16.0, 13.0, 23.0, 34.0, 30.0, 33.0, 45.0, 24.0, 47.0, 45.0, 53.0, 46.0, 51.0, 52.0, 39.0, 42.0, 42.0, 36.0, 34.0, 33.0, 31.0, 16.0, 25.0, 26.0, 17.0, 14.0, 14.0, 11.0, 8.0, 8.0, 4.0, 3.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0105438232421875, -0.01016700267791748, -0.009790182113647461, -0.009413361549377441, -0.009036540985107422, -0.008659720420837402, -0.008282899856567383, -0.007906079292297363, -0.007529258728027344, -0.007152438163757324, -0.006775617599487305, -0.006398797035217285, -0.006021976470947266, -0.005645155906677246, -0.0052683353424072266, -0.004891514778137207, -0.0045146942138671875, -0.004137873649597168, -0.0037610530853271484, -0.003384232521057129, -0.0030074119567871094, -0.00263059139251709, -0.0022537708282470703, -0.0018769502639770508, -0.0015001296997070312, -0.0011233091354370117, -0.0007464885711669922, -0.00036966800689697266, 7.152557373046875e-06, 0.0003839731216430664, 0.0007607936859130859, 0.0011376142501831055, 0.001514434814453125, 0.0018912553787231445, 0.002268075942993164, 0.0026448965072631836, 0.003021717071533203, 0.0033985376358032227, 0.003775358200073242, 0.004152178764343262, 0.004528999328613281, 0.004905819892883301, 0.00528264045715332, 0.00565946102142334, 0.006036281585693359, 0.006413102149963379, 0.0067899227142333984, 0.007166743278503418, 0.0075435638427734375, 0.007920384407043457, 0.008297204971313477, 0.008674025535583496, 0.009050846099853516, 0.009427666664123535, 0.009804487228393555, 0.010181307792663574, 0.010558128356933594, 0.010934948921203613, 0.011311769485473633, 0.011688590049743652, 0.012065410614013672, 0.012442231178283691, 0.012819051742553711, 0.01319587230682373, 0.01357269287109375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 7.0, 13.0, 28.0, 60.0, 102.0, 217.0, 252.0, 172.0, 82.0, 35.0, 22.0, 4.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0], "bins": [-4.247142791748047, -4.165737152099609, -4.084331512451172, -4.002925872802734, -3.9215199947357178, -3.8401143550872803, -3.7587084770202637, -3.677302837371826, -3.5958971977233887, -3.514491558074951, -3.4330856800079346, -3.351680040359497, -3.2702744007110596, -3.188868761062622, -3.1074628829956055, -3.026057243347168, -2.9446516036987305, -2.863245964050293, -2.7818400859832764, -2.700434446334839, -2.6190288066864014, -2.537623167037964, -2.4562172889709473, -2.3748116493225098, -2.293405771255493, -2.2120001316070557, -2.130594253540039, -2.0491886138916016, -1.967782974243164, -1.886377215385437, -1.80497145652771, -1.7235658168792725, -1.642160177230835, -1.560754418373108, -1.4793487787246704, -1.3979430198669434, -1.3165373802185059, -1.2351316213607788, -1.1537258625030518, -1.0723202228546143, -0.9909145832061768, -0.9095088839530945, -0.8281031847000122, -0.7466974258422852, -0.6652917861938477, -0.5838860273361206, -0.5024803280830383, -0.42107462882995605, -0.3396689295768738, -0.2582632303237915, -0.17685751616954803, -0.09545180201530457, -0.01404610276222229, 0.06735959649085999, 0.14876532554626465, 0.23017102479934692, 0.3115767240524292, 0.3929824233055115, 0.47438812255859375, 0.5557938814163208, 0.6371995210647583, 0.7186052799224854, 0.8000109791755676, 0.8814166784286499, 0.9628223776817322]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 9.0, 9.0, 18.0, 8.0, 19.0, 24.0, 36.0, 30.0, 45.0, 60.0, 69.0, 69.0, 65.0, 67.0, 57.0, 71.0, 55.0, 49.0, 45.0, 47.0, 36.0, 22.0, 27.0, 10.0, 20.0, 11.0, 0.0, 5.0, 4.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8462040424346924, -0.8155025839805603, -0.7848011255264282, -0.7540996670722961, -0.7233982086181641, -0.692696750164032, -0.6619952917098999, -0.631293773651123, -0.6005923748016357, -0.5698909163475037, -0.5391894578933716, -0.5084879994392395, -0.4777865409851074, -0.44708508253097534, -0.4163835942745209, -0.3856821358203888, -0.3549806475639343, -0.32427918910980225, -0.29357773065567017, -0.2628762722015381, -0.2321747988462448, -0.20147334039211273, -0.17077186703681946, -0.14007040858268738, -0.1093689501285553, -0.07866749167442322, -0.04796602576971054, -0.017264559864997864, 0.013436898589134216, 0.044138357043266296, 0.07483983039855957, 0.10554128885269165, 0.13624274730682373, 0.1669442057609558, 0.1976456642150879, 0.22834713757038116, 0.25904858112335205, 0.28975003957748413, 0.3204515278339386, 0.3511529862880707, 0.38185444474220276, 0.41255590319633484, 0.4432573616504669, 0.4739588499069214, 0.5046603083610535, 0.5353617668151855, 0.5660632252693176, 0.5967646837234497, 0.6274661421775818, 0.6581676006317139, 0.688869059085846, 0.719570517539978, 0.7502719759941101, 0.7809734344482422, 0.811674952507019, 0.8423763513565063, 0.8730778694152832, 0.9037793278694153, 0.9344807863235474, 0.9651822447776794, 0.9958837032318115, 1.0265852212905884, 1.0572866201400757, 1.0879881381988525, 1.1186895370483398]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 7.0, 10.0, 9.0, 7.0, 11.0, 18.0, 17.0, 28.0, 52.0, 89.0, 124.0, 178.0, 325.0, 514.0, 986.0, 1715.0, 3399.0, 7416.0, 18290.0, 52164.0, 208577.0, 539677.0, 147089.0, 40119.0, 14711.0, 6265.0, 3098.0, 1585.0, 840.0, 479.0, 269.0, 140.0, 114.0, 65.0, 54.0, 41.0, 25.0, 15.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.541473388671875, -0.52239990234375, -0.503326416015625, -0.4842529296875, -0.465179443359375, -0.44610595703125, -0.427032470703125, -0.407958984375, -0.388885498046875, -0.36981201171875, -0.350738525390625, -0.3316650390625, -0.312591552734375, -0.29351806640625, -0.274444580078125, -0.25537109375, -0.236297607421875, -0.21722412109375, -0.198150634765625, -0.1790771484375, -0.160003662109375, -0.14093017578125, -0.121856689453125, -0.102783203125, -0.083709716796875, -0.06463623046875, -0.045562744140625, -0.0264892578125, -0.007415771484375, 0.01165771484375, 0.030731201171875, 0.0498046875, 0.068878173828125, 0.08795166015625, 0.107025146484375, 0.1260986328125, 0.145172119140625, 0.16424560546875, 0.183319091796875, 0.202392578125, 0.221466064453125, 0.24053955078125, 0.259613037109375, 0.2786865234375, 0.297760009765625, 0.31683349609375, 0.335906982421875, 0.35498046875, 0.374053955078125, 0.39312744140625, 0.412200927734375, 0.4312744140625, 0.450347900390625, 0.46942138671875, 0.488494873046875, 0.507568359375, 0.526641845703125, 0.54571533203125, 0.564788818359375, 0.5838623046875, 0.602935791015625, 0.62200927734375, 0.641082763671875, 0.66015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 3.0, 5.0, 12.0, 5.0, 7.0, 7.0, 10.0, 11.0, 11.0, 27.0, 23.0, 22.0, 24.0, 50.0, 48.0, 55.0, 54.0, 47.0, 55.0, 54.0, 52.0, 39.0, 42.0, 45.0, 51.0, 36.0, 36.0, 24.0, 28.0, 20.0, 22.0, 11.0, 11.0, 9.0, 13.0, 5.0, 6.0, 5.0, 7.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.553924560546875, -1.50628662109375, -1.458648681640625, -1.4110107421875, -1.363372802734375, -1.31573486328125, -1.268096923828125, -1.220458984375, -1.172821044921875, -1.12518310546875, -1.077545166015625, -1.0299072265625, -0.982269287109375, -0.93463134765625, -0.886993408203125, -0.83935546875, -0.791717529296875, -0.74407958984375, -0.696441650390625, -0.6488037109375, -0.601165771484375, -0.55352783203125, -0.505889892578125, -0.458251953125, -0.410614013671875, -0.36297607421875, -0.315338134765625, -0.2677001953125, -0.220062255859375, -0.17242431640625, -0.124786376953125, -0.0771484375, -0.029510498046875, 0.01812744140625, 0.065765380859375, 0.1134033203125, 0.161041259765625, 0.20867919921875, 0.256317138671875, 0.303955078125, 0.351593017578125, 0.39923095703125, 0.446868896484375, 0.4945068359375, 0.542144775390625, 0.58978271484375, 0.637420654296875, 0.68505859375, 0.732696533203125, 0.78033447265625, 0.827972412109375, 0.8756103515625, 0.923248291015625, 0.97088623046875, 1.018524169921875, 1.066162109375, 1.113800048828125, 1.16143798828125, 1.209075927734375, 1.2567138671875, 1.304351806640625, 1.35198974609375, 1.399627685546875, 1.447265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 10.0, 14.0, 14.0, 24.0, 47.0, 55.0, 60.0, 96.0, 141.0, 253.0, 547.0, 1570.0, 7441.0, 75756.0, 871618.0, 80045.0, 7805.0, 1654.0, 605.0, 272.0, 145.0, 94.0, 78.0, 54.0, 36.0, 25.0, 15.0, 13.0, 16.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.366180419921875, -1.32415771484375, -1.282135009765625, -1.2401123046875, -1.198089599609375, -1.15606689453125, -1.114044189453125, -1.072021484375, -1.029998779296875, -0.98797607421875, -0.945953369140625, -0.9039306640625, -0.861907958984375, -0.81988525390625, -0.777862548828125, -0.73583984375, -0.693817138671875, -0.65179443359375, -0.609771728515625, -0.5677490234375, -0.525726318359375, -0.48370361328125, -0.441680908203125, -0.399658203125, -0.357635498046875, -0.31561279296875, -0.273590087890625, -0.2315673828125, -0.189544677734375, -0.14752197265625, -0.105499267578125, -0.0634765625, -0.021453857421875, 0.02056884765625, 0.062591552734375, 0.1046142578125, 0.146636962890625, 0.18865966796875, 0.230682373046875, 0.272705078125, 0.314727783203125, 0.35675048828125, 0.398773193359375, 0.4407958984375, 0.482818603515625, 0.52484130859375, 0.566864013671875, 0.60888671875, 0.650909423828125, 0.69293212890625, 0.734954833984375, 0.7769775390625, 0.819000244140625, 0.86102294921875, 0.903045654296875, 0.945068359375, 0.987091064453125, 1.02911376953125, 1.071136474609375, 1.1131591796875, 1.155181884765625, 1.19720458984375, 1.239227294921875, 1.28125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 7.0, 8.0, 6.0, 5.0, 10.0, 16.0, 18.0, 15.0, 16.0, 23.0, 26.0, 29.0, 32.0, 31.0, 30.0, 23.0, 38.0, 37.0, 36.0, 37.0, 46.0, 28.0, 39.0, 40.0, 32.0, 33.0, 34.0, 39.0, 36.0, 25.0, 22.0, 31.0, 22.0, 19.0, 10.0, 16.0, 11.0, 13.0, 10.0, 4.0, 10.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0], "bins": [-1.5126953125, -1.4703216552734375, -1.427947998046875, -1.3855743408203125, -1.34320068359375, -1.3008270263671875, -1.258453369140625, -1.2160797119140625, -1.1737060546875, -1.1313323974609375, -1.088958740234375, -1.0465850830078125, -1.00421142578125, -0.9618377685546875, -0.919464111328125, -0.8770904541015625, -0.834716796875, -0.7923431396484375, -0.749969482421875, -0.7075958251953125, -0.66522216796875, -0.6228485107421875, -0.580474853515625, -0.5381011962890625, -0.4957275390625, -0.4533538818359375, -0.410980224609375, -0.3686065673828125, -0.32623291015625, -0.2838592529296875, -0.241485595703125, -0.1991119384765625, -0.15673828125, -0.1143646240234375, -0.071990966796875, -0.0296173095703125, 0.01275634765625, 0.0551300048828125, 0.097503662109375, 0.1398773193359375, 0.1822509765625, 0.2246246337890625, 0.266998291015625, 0.3093719482421875, 0.35174560546875, 0.3941192626953125, 0.436492919921875, 0.4788665771484375, 0.521240234375, 0.5636138916015625, 0.605987548828125, 0.6483612060546875, 0.69073486328125, 0.7331085205078125, 0.775482177734375, 0.8178558349609375, 0.8602294921875, 0.9026031494140625, 0.944976806640625, 0.9873504638671875, 1.02972412109375, 1.0720977783203125, 1.114471435546875, 1.1568450927734375, 1.19921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 8.0, 17.0, 34.0, 58.0, 90.0, 203.0, 384.0, 1199.0, 7082.0, 292719.0, 733124.0, 11155.0, 1563.0, 460.0, 204.0, 96.0, 54.0, 34.0, 20.0, 18.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.96142578125, -0.9374465942382812, -0.9134674072265625, -0.8894882202148438, -0.865509033203125, -0.8415298461914062, -0.8175506591796875, -0.7935714721679688, -0.76959228515625, -0.7456130981445312, -0.7216339111328125, -0.6976547241210938, -0.673675537109375, -0.6496963500976562, -0.6257171630859375, -0.6017379760742188, -0.5777587890625, -0.5537796020507812, -0.5298004150390625, -0.5058212280273438, -0.481842041015625, -0.45786285400390625, -0.4338836669921875, -0.40990447998046875, -0.38592529296875, -0.36194610595703125, -0.3379669189453125, -0.31398773193359375, -0.290008544921875, -0.26602935791015625, -0.2420501708984375, -0.21807098388671875, -0.194091796875, -0.17011260986328125, -0.1461334228515625, -0.12215423583984375, -0.098175048828125, -0.07419586181640625, -0.0502166748046875, -0.02623748779296875, -0.00225830078125, 0.02172088623046875, 0.0457000732421875, 0.06967926025390625, 0.093658447265625, 0.11763763427734375, 0.1416168212890625, 0.16559600830078125, 0.1895751953125, 0.21355438232421875, 0.2375335693359375, 0.26151275634765625, 0.285491943359375, 0.30947113037109375, 0.3334503173828125, 0.35742950439453125, 0.38140869140625, 0.40538787841796875, 0.4293670654296875, 0.45334625244140625, 0.477325439453125, 0.5013046264648438, 0.5252838134765625, 0.5492630004882812, 0.5732421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 19.0, 32.0, 74.0, 118.0, 251.0, 246.0, 126.0, 60.0, 44.0, 18.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015044212341308594, -0.000146377831697464, -0.00014231353998184204, -0.0001382492482662201, -0.00013418495655059814, -0.0001301206648349762, -0.00012605637311935425, -0.0001219920814037323, -0.00011792778968811035, -0.0001138634979724884, -0.00010979920625686646, -0.00010573491454124451, -0.00010167062282562256, -9.760633111000061e-05, -9.354203939437866e-05, -8.947774767875671e-05, -8.541345596313477e-05, -8.134916424751282e-05, -7.728487253189087e-05, -7.322058081626892e-05, -6.915628910064697e-05, -6.509199738502502e-05, -6.1027705669403076e-05, -5.696341395378113e-05, -5.289912223815918e-05, -4.883483052253723e-05, -4.477053880691528e-05, -4.0706247091293335e-05, -3.664195537567139e-05, -3.257766366004944e-05, -2.851337194442749e-05, -2.4449080228805542e-05, -2.0384788513183594e-05, -1.6320496797561646e-05, -1.2256205081939697e-05, -8.191913366317749e-06, -4.127621650695801e-06, -6.332993507385254e-08, 4.000961780548096e-06, 8.065253496170044e-06, 1.2129545211791992e-05, 1.619383692741394e-05, 2.025812864303589e-05, 2.4322420358657837e-05, 2.8386712074279785e-05, 3.2451003789901733e-05, 3.651529550552368e-05, 4.057958722114563e-05, 4.464387893676758e-05, 4.8708170652389526e-05, 5.2772462368011475e-05, 5.683675408363342e-05, 6.090104579925537e-05, 6.496533751487732e-05, 6.902962923049927e-05, 7.309392094612122e-05, 7.715821266174316e-05, 8.122250437736511e-05, 8.528679609298706e-05, 8.935108780860901e-05, 9.341537952423096e-05, 9.74796712398529e-05, 0.00010154396295547485, 0.0001056082546710968, 0.00010967254638671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 5.0, 21.0, 21.0, 28.0, 51.0, 89.0, 182.0, 409.0, 977.0, 2815.0, 11908.0, 157594.0, 831414.0, 34433.0, 5610.0, 1690.0, 651.0, 310.0, 139.0, 82.0, 47.0, 28.0, 10.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443603515625, -0.4245338439941406, -0.40546417236328125, -0.3863945007324219, -0.3673248291015625, -0.3482551574707031, -0.32918548583984375, -0.3101158142089844, -0.291046142578125, -0.2719764709472656, -0.25290679931640625, -0.23383712768554688, -0.2147674560546875, -0.19569778442382812, -0.17662811279296875, -0.15755844116210938, -0.13848876953125, -0.11941909790039062, -0.10034942626953125, -0.08127975463867188, -0.0622100830078125, -0.043140411376953125, -0.02407073974609375, -0.005001068115234375, 0.014068603515625, 0.033138275146484375, 0.05220794677734375, 0.07127761840820312, 0.0903472900390625, 0.10941696166992188, 0.12848663330078125, 0.14755630493164062, 0.1666259765625, 0.18569564819335938, 0.20476531982421875, 0.22383499145507812, 0.2429046630859375, 0.2619743347167969, 0.28104400634765625, 0.3001136779785156, 0.319183349609375, 0.3382530212402344, 0.35732269287109375, 0.3763923645019531, 0.3954620361328125, 0.4145317077636719, 0.43360137939453125, 0.4526710510253906, 0.47174072265625, 0.4908103942871094, 0.5098800659179688, 0.5289497375488281, 0.5480194091796875, 0.5670890808105469, 0.5861587524414062, 0.6052284240722656, 0.624298095703125, 0.6433677673339844, 0.6624374389648438, 0.6815071105957031, 0.7005767822265625, 0.7196464538574219, 0.7387161254882812, 0.7577857971191406, 0.77685546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 10.0, 13.0, 7.0, 16.0, 22.0, 43.0, 76.0, 99.0, 183.0, 190.0, 121.0, 78.0, 46.0, 29.0, 17.0, 6.0, 10.0, 10.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.2724609375, -0.2660026550292969, -0.25954437255859375, -0.2530860900878906, -0.2466278076171875, -0.24016952514648438, -0.23371124267578125, -0.22725296020507812, -0.220794677734375, -0.21433639526367188, -0.20787811279296875, -0.20141983032226562, -0.1949615478515625, -0.18850326538085938, -0.18204498291015625, -0.17558670043945312, -0.16912841796875, -0.16267013549804688, -0.15621185302734375, -0.14975357055664062, -0.1432952880859375, -0.13683700561523438, -0.13037872314453125, -0.12392044067382812, -0.117462158203125, -0.11100387573242188, -0.10454559326171875, -0.09808731079101562, -0.0916290283203125, -0.08517074584960938, -0.07871246337890625, -0.07225418090820312, -0.0657958984375, -0.059337615966796875, -0.05287933349609375, -0.046421051025390625, -0.0399627685546875, -0.033504486083984375, -0.02704620361328125, -0.020587921142578125, -0.014129638671875, -0.007671356201171875, -0.00121307373046875, 0.005245208740234375, 0.0117034912109375, 0.018161773681640625, 0.02462005615234375, 0.031078338623046875, 0.03753662109375, 0.043994903564453125, 0.05045318603515625, 0.056911468505859375, 0.0633697509765625, 0.06982803344726562, 0.07628631591796875, 0.08274459838867188, 0.089202880859375, 0.09566116333007812, 0.10211944580078125, 0.10857772827148438, 0.1150360107421875, 0.12149429321289062, 0.12795257568359375, 0.13441085815429688, 0.140869140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 13.0, 34.0, 114.0, 282.0, 314.0, 161.0, 56.0, 12.0, 9.0, 4.0, 2.0, 2.0], "bins": [-13.127320289611816, -12.893108367919922, -12.658896446228027, -12.424684524536133, -12.190472602844238, -11.956260681152344, -11.722049713134766, -11.487837791442871, -11.253625869750977, -11.019413948059082, -10.785202026367188, -10.550990104675293, -10.316778182983398, -10.08256721496582, -9.84835433959961, -9.614143371582031, -9.37993049621582, -9.145718574523926, -8.911506652832031, -8.677294731140137, -8.443082809448242, -8.208871841430664, -7.974659442901611, -7.740447521209717, -7.5062360763549805, -7.272024154663086, -7.037812232971191, -6.803600311279297, -6.5693888664245605, -6.335176944732666, -6.1009650230407715, -5.866753101348877, -5.632541656494141, -5.398329734802246, -5.164117813110352, -4.929905891418457, -4.695694446563721, -4.461482524871826, -4.227270603179932, -3.993058681488037, -3.758847236633301, -3.5246353149414062, -3.290423631668091, -3.0562117099761963, -2.822000026702881, -2.5877881050109863, -2.353576183319092, -2.1193642616271973, -1.8851525783538818, -1.6509407758712769, -1.4167289733886719, -1.1825170516967773, -0.9483052492141724, -0.7140934467315674, -0.47988152503967285, -0.24566972255706787, -0.01145792007446289, 0.22275391221046448, 0.45696574449539185, 0.6911776065826416, 0.9253894090652466, 1.1596012115478516, 1.393813133239746, 1.628024935722351, 1.862236738204956]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 5.0, 16.0, 10.0, 14.0, 10.0, 12.0, 15.0, 11.0, 23.0, 23.0, 30.0, 23.0, 22.0, 29.0, 21.0, 34.0, 26.0, 34.0, 34.0, 31.0, 30.0, 27.0, 35.0, 33.0, 35.0, 32.0, 26.0, 28.0, 33.0, 28.0, 29.0, 33.0, 26.0, 26.0, 23.0, 14.0, 18.0, 17.0, 14.0, 5.0, 9.0, 6.0, 6.0, 5.0, 4.0, 7.0, 3.0, 3.0, 5.0, 5.0, 1.0, 3.0, 5.0], "bins": [-2.1108129024505615, -2.0463504791259766, -1.981887936592102, -1.917425513267517, -1.8529629707336426, -1.7885005474090576, -1.7240381240844727, -1.6595757007598877, -1.5951131582260132, -1.5306507349014282, -1.4661881923675537, -1.4017257690429688, -1.3372633457183838, -1.2728008031845093, -1.2083383798599243, -1.1438758373260498, -1.0794134140014648, -1.0149509906768799, -0.9504884481430054, -0.8860260248184204, -0.8215635418891907, -0.7571010589599609, -0.692638635635376, -0.6281761527061462, -0.5637136697769165, -0.49925118684768677, -0.4347887337207794, -0.37032628059387207, -0.30586379766464233, -0.2414013147354126, -0.17693886160850525, -0.1124764084815979, -0.048014163970947266, 0.016448304057121277, 0.08091077208518982, 0.14537324011325836, 0.2098357081413269, 0.27429819107055664, 0.338760644197464, 0.40322309732437134, 0.4676855802536011, 0.5321480631828308, 0.5966105461120605, 0.6610729694366455, 0.7255354523658752, 0.789997935295105, 0.8544603586196899, 0.9189228415489197, 0.9833853244781494, 1.0478477478027344, 1.1123102903366089, 1.1767727136611938, 1.2412352561950684, 1.3056976795196533, 1.3701601028442383, 1.4346225261688232, 1.4990850687026978, 1.5635474920272827, 1.6280100345611572, 1.6924724578857422, 1.7569348812103271, 1.8213974237442017, 1.8858598470687866, 1.9503223896026611, 2.014784812927246]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 4.0, 6.0, 9.0, 30.0, 27.0, 27.0, 57.0, 85.0, 112.0, 193.0, 306.0, 567.0, 1167.0, 2884.0, 9317.0, 80128.0, 2947349.0, 1107046.0, 35589.0, 5533.0, 1813.0, 834.0, 467.0, 255.0, 182.0, 98.0, 70.0, 34.0, 23.0, 21.0, 14.0, 4.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.220703125, -2.143707275390625, -2.06671142578125, -1.989715576171875, -1.9127197265625, -1.835723876953125, -1.75872802734375, -1.681732177734375, -1.604736328125, -1.527740478515625, -1.45074462890625, -1.373748779296875, -1.2967529296875, -1.219757080078125, -1.14276123046875, -1.065765380859375, -0.98876953125, -0.911773681640625, -0.83477783203125, -0.757781982421875, -0.6807861328125, -0.603790283203125, -0.52679443359375, -0.449798583984375, -0.372802734375, -0.295806884765625, -0.21881103515625, -0.141815185546875, -0.0648193359375, 0.012176513671875, 0.08917236328125, 0.166168212890625, 0.2431640625, 0.320159912109375, 0.39715576171875, 0.474151611328125, 0.5511474609375, 0.628143310546875, 0.70513916015625, 0.782135009765625, 0.859130859375, 0.936126708984375, 1.01312255859375, 1.090118408203125, 1.1671142578125, 1.244110107421875, 1.32110595703125, 1.398101806640625, 1.47509765625, 1.552093505859375, 1.62908935546875, 1.706085205078125, 1.7830810546875, 1.860076904296875, 1.93707275390625, 2.014068603515625, 2.091064453125, 2.168060302734375, 2.24505615234375, 2.322052001953125, 2.3990478515625, 2.476043701171875, 2.55303955078125, 2.630035400390625, 2.70703125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 10.0, 11.0, 11.0, 18.0, 27.0, 33.0, 42.0, 65.0, 70.0, 67.0, 78.0, 85.0, 75.0, 78.0, 72.0, 62.0, 53.0, 35.0, 31.0, 28.0, 8.0, 14.0, 14.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.06170654296875, -1.0169677734375, -0.97222900390625, -0.927490234375, -0.88275146484375, -0.8380126953125, -0.79327392578125, -0.74853515625, -0.70379638671875, -0.6590576171875, -0.61431884765625, -0.569580078125, -0.52484130859375, -0.4801025390625, -0.43536376953125, -0.390625, -0.34588623046875, -0.3011474609375, -0.25640869140625, -0.211669921875, -0.16693115234375, -0.1221923828125, -0.07745361328125, -0.03271484375, 0.01202392578125, 0.0567626953125, 0.10150146484375, 0.146240234375, 0.19097900390625, 0.2357177734375, 0.28045654296875, 0.3251953125, 0.36993408203125, 0.4146728515625, 0.45941162109375, 0.504150390625, 0.54888916015625, 0.5936279296875, 0.63836669921875, 0.68310546875, 0.72784423828125, 0.7725830078125, 0.81732177734375, 0.862060546875, 0.90679931640625, 0.9515380859375, 0.99627685546875, 1.041015625, 1.08575439453125, 1.1304931640625, 1.17523193359375, 1.219970703125, 1.26470947265625, 1.3094482421875, 1.35418701171875, 1.39892578125, 1.44366455078125, 1.4884033203125, 1.53314208984375, 1.577880859375, 1.62261962890625, 1.6673583984375, 1.71209716796875, 1.7568359375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 13.0, 17.0, 23.0, 37.0, 65.0, 103.0, 227.0, 526.0, 1438.0, 5082.0, 29958.0, 1881080.0, 2235320.0, 32447.0, 5285.0, 1569.0, 554.0, 253.0, 136.0, 53.0, 34.0, 20.0, 18.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.51226806640625, -1.4327392578125, -1.35321044921875, -1.273681640625, -1.19415283203125, -1.1146240234375, -1.03509521484375, -0.95556640625, -0.87603759765625, -0.7965087890625, -0.71697998046875, -0.637451171875, -0.55792236328125, -0.4783935546875, -0.39886474609375, -0.3193359375, -0.23980712890625, -0.1602783203125, -0.08074951171875, -0.001220703125, 0.07830810546875, 0.1578369140625, 0.23736572265625, 0.31689453125, 0.39642333984375, 0.4759521484375, 0.55548095703125, 0.635009765625, 0.71453857421875, 0.7940673828125, 0.87359619140625, 0.953125, 1.03265380859375, 1.1121826171875, 1.19171142578125, 1.271240234375, 1.35076904296875, 1.4302978515625, 1.50982666015625, 1.58935546875, 1.66888427734375, 1.7484130859375, 1.82794189453125, 1.907470703125, 1.98699951171875, 2.0665283203125, 2.14605712890625, 2.2255859375, 2.30511474609375, 2.3846435546875, 2.46417236328125, 2.543701171875, 2.62322998046875, 2.7027587890625, 2.78228759765625, 2.86181640625, 2.94134521484375, 3.0208740234375, 3.10040283203125, 3.179931640625, 3.25946044921875, 3.3389892578125, 3.41851806640625, 3.498046875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 10.0, 11.0, 12.0, 17.0, 30.0, 55.0, 91.0, 157.0, 384.0, 828.0, 1035.0, 726.0, 370.0, 136.0, 76.0, 51.0, 28.0, 21.0, 7.0, 10.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8466796875, -0.8261985778808594, -0.8057174682617188, -0.7852363586425781, -0.7647552490234375, -0.7442741394042969, -0.7237930297851562, -0.7033119201660156, -0.682830810546875, -0.6623497009277344, -0.6418685913085938, -0.6213874816894531, -0.6009063720703125, -0.5804252624511719, -0.5599441528320312, -0.5394630432128906, -0.51898193359375, -0.4985008239746094, -0.47801971435546875, -0.4575386047363281, -0.4370574951171875, -0.4165763854980469, -0.39609527587890625, -0.3756141662597656, -0.355133056640625, -0.3346519470214844, -0.31417083740234375, -0.2936897277832031, -0.2732086181640625, -0.2527275085449219, -0.23224639892578125, -0.21176528930664062, -0.1912841796875, -0.17080307006835938, -0.15032196044921875, -0.12984085083007812, -0.1093597412109375, -0.08887863159179688, -0.06839752197265625, -0.047916412353515625, -0.027435302734375, -0.006954193115234375, 0.01352691650390625, 0.034008026123046875, 0.0544891357421875, 0.07497024536132812, 0.09545135498046875, 0.11593246459960938, 0.13641357421875, 0.15689468383789062, 0.17737579345703125, 0.19785690307617188, 0.2183380126953125, 0.23881912231445312, 0.25930023193359375, 0.2797813415527344, 0.300262451171875, 0.3207435607910156, 0.34122467041015625, 0.3617057800292969, 0.3821868896484375, 0.4026679992675781, 0.42314910888671875, 0.4436302185058594, 0.464111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 9.0, 8.0, 13.0, 29.0, 51.0, 89.0, 100.0, 162.0, 168.0, 121.0, 120.0, 54.0, 24.0, 21.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3088536262512207, -3.229905366897583, -3.1509573459625244, -3.0720090866088867, -2.993060827255249, -2.9141125679016113, -2.8351645469665527, -2.756216287612915, -2.6772680282592773, -2.5983197689056396, -2.519371747970581, -2.4404234886169434, -2.3614752292633057, -2.282526969909668, -2.2035789489746094, -2.1246306896209717, -2.045682668685913, -1.966734528541565, -1.8877862691879272, -1.808838129043579, -1.7298898696899414, -1.6509417295455933, -1.5719935894012451, -1.4930453300476074, -1.4140971899032593, -1.3351490497589111, -1.2562007904052734, -1.1772526502609253, -1.0983045101165771, -1.0193562507629395, -0.9404081106185913, -0.8614599108695984, -0.7825114727020264, -0.7035632729530334, -0.6246150732040405, -0.5456669330596924, -0.46671873331069946, -0.38777053356170654, -0.308822363615036, -0.22987419366836548, -0.15092599391937256, -0.07197780907154083, 0.0069703757762908936, 0.08591856062412262, 0.16486674547195435, 0.24381494522094727, 0.3227631151676178, 0.40171128511428833, 0.48065948486328125, 0.5596076846122742, 0.6385558843612671, 0.7175040245056152, 0.7964522242546082, 0.8754004240036011, 0.9543485641479492, 1.033296823501587, 1.112244963645935, 1.1911931037902832, 1.270141363143921, 1.349089503288269, 1.4280376434326172, 1.5069859027862549, 1.585934042930603, 1.6648821830749512, 1.7438304424285889]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 3.0, 6.0, 10.0, 14.0, 14.0, 9.0, 15.0, 18.0, 23.0, 29.0, 24.0, 35.0, 36.0, 38.0, 52.0, 43.0, 52.0, 50.0, 50.0, 48.0, 51.0, 48.0, 42.0, 42.0, 41.0, 36.0, 32.0, 27.0, 20.0, 16.0, 10.0, 9.0, 8.0, 6.0, 9.0, 3.0, 4.0, 4.0, 5.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8334425687789917, -0.801851212978363, -0.7702597975730896, -0.7386684417724609, -0.7070770859718323, -0.6754857301712036, -0.6438943147659302, -0.6123029589653015, -0.5807116031646729, -0.5491202473640442, -0.5175288319587708, -0.4859374761581421, -0.4543461203575134, -0.4227547347545624, -0.39116334915161133, -0.35957199335098267, -0.32798057794570923, -0.2963891923427582, -0.2647978365421295, -0.23320645093917847, -0.2016150802373886, -0.17002370953559875, -0.1384323239326477, -0.10684095323085785, -0.075249582529068, -0.04365820810198784, -0.012066833674907684, 0.01952454447746277, 0.051115915179252625, 0.08270728588104248, 0.11429867148399353, 0.1458900421857834, 0.17748141288757324, 0.2090727835893631, 0.24066415429115295, 0.272255539894104, 0.30384689569473267, 0.3354382812976837, 0.36702966690063477, 0.3986210227012634, 0.4302124083042145, 0.4618037939071655, 0.4933951497077942, 0.5249865055084229, 0.5565779209136963, 0.588169276714325, 0.6197606325149536, 0.651352047920227, 0.6829434037208557, 0.7145347595214844, 0.7461261749267578, 0.7777175307273865, 0.8093088865280151, 0.8409003019332886, 0.8724916577339172, 0.9040830135345459, 0.9356744289398193, 0.967265784740448, 0.9988572001457214, 1.03044855594635, 1.0620399713516235, 1.0936312675476074, 1.1252226829528809, 1.1568140983581543, 1.1884053945541382]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 19.0, 29.0, 61.0, 95.0, 201.0, 450.0, 1144.0, 3398.0, 12396.0, 81496.0, 773289.0, 151702.0, 17176.0, 4550.0, 1506.0, 495.0, 248.0, 106.0, 64.0, 27.0, 18.0, 15.0, 7.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5054168701171875, -0.490814208984375, -0.4762115478515625, -0.46160888671875, -0.4470062255859375, -0.432403564453125, -0.4178009033203125, -0.4031982421875, -0.3885955810546875, -0.373992919921875, -0.3593902587890625, -0.34478759765625, -0.3301849365234375, -0.315582275390625, -0.3009796142578125, -0.286376953125, -0.2717742919921875, -0.257171630859375, -0.2425689697265625, -0.22796630859375, -0.2133636474609375, -0.198760986328125, -0.1841583251953125, -0.1695556640625, -0.1549530029296875, -0.140350341796875, -0.1257476806640625, -0.11114501953125, -0.0965423583984375, -0.081939697265625, -0.0673370361328125, -0.052734375, -0.0381317138671875, -0.023529052734375, -0.0089263916015625, 0.00567626953125, 0.0202789306640625, 0.034881591796875, 0.0494842529296875, 0.0640869140625, 0.0786895751953125, 0.093292236328125, 0.1078948974609375, 0.12249755859375, 0.1371002197265625, 0.151702880859375, 0.1663055419921875, 0.180908203125, 0.1955108642578125, 0.210113525390625, 0.2247161865234375, 0.23931884765625, 0.2539215087890625, 0.268524169921875, 0.2831268310546875, 0.2977294921875, 0.3123321533203125, 0.326934814453125, 0.3415374755859375, 0.35614013671875, 0.3707427978515625, 0.385345458984375, 0.3999481201171875, 0.41455078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 4.0, 11.0, 8.0, 17.0, 30.0, 34.0, 26.0, 45.0, 62.0, 60.0, 57.0, 79.0, 85.0, 74.0, 70.0, 65.0, 58.0, 47.0, 52.0, 32.0, 15.0, 19.0, 10.0, 9.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.6944198608398438, -0.6637420654296875, -0.6330642700195312, -0.602386474609375, -0.5717086791992188, -0.5410308837890625, -0.5103530883789062, -0.47967529296875, -0.44899749755859375, -0.4183197021484375, -0.38764190673828125, -0.356964111328125, -0.32628631591796875, -0.2956085205078125, -0.26493072509765625, -0.2342529296875, -0.20357513427734375, -0.1728973388671875, -0.14221954345703125, -0.111541748046875, -0.08086395263671875, -0.0501861572265625, -0.01950836181640625, 0.01116943359375, 0.04184722900390625, 0.0725250244140625, 0.10320281982421875, 0.133880615234375, 0.16455841064453125, 0.1952362060546875, 0.22591400146484375, 0.256591796875, 0.28726959228515625, 0.3179473876953125, 0.34862518310546875, 0.379302978515625, 0.40998077392578125, 0.4406585693359375, 0.47133636474609375, 0.50201416015625, 0.5326919555664062, 0.5633697509765625, 0.5940475463867188, 0.624725341796875, 0.6554031372070312, 0.6860809326171875, 0.7167587280273438, 0.7474365234375, 0.7781143188476562, 0.8087921142578125, 0.8394699096679688, 0.870147705078125, 0.9008255004882812, 0.9315032958984375, 0.9621810913085938, 0.99285888671875, 1.0235366821289062, 1.0542144775390625, 1.0848922729492188, 1.115570068359375, 1.1462478637695312, 1.1769256591796875, 1.2076034545898438, 1.23828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 12.0, 8.0, 17.0, 12.0, 27.0, 29.0, 44.0, 61.0, 72.0, 118.0, 175.0, 300.0, 490.0, 851.0, 1549.0, 2903.0, 5812.0, 12100.0, 33684.0, 127768.0, 444419.0, 303418.0, 73994.0, 21954.0, 9034.0, 4320.0, 2203.0, 1252.0, 718.0, 401.0, 245.0, 177.0, 115.0, 69.0, 54.0, 42.0, 28.0, 18.0, 19.0, 11.0, 7.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1951904296875, -0.1892414093017578, -0.18329238891601562, -0.17734336853027344, -0.17139434814453125, -0.16544532775878906, -0.15949630737304688, -0.1535472869873047, -0.1475982666015625, -0.1416492462158203, -0.13570022583007812, -0.12975120544433594, -0.12380218505859375, -0.11785316467285156, -0.11190414428710938, -0.10595512390136719, -0.100006103515625, -0.09405708312988281, -0.08810806274414062, -0.08215904235839844, -0.07621002197265625, -0.07026100158691406, -0.06431198120117188, -0.05836296081542969, -0.0524139404296875, -0.04646492004394531, -0.040515899658203125, -0.03456687927246094, -0.02861785888671875, -0.022668838500976562, -0.016719818115234375, -0.010770797729492188, -0.00482177734375, 0.0011272430419921875, 0.007076263427734375, 0.013025283813476562, 0.01897430419921875, 0.024923324584960938, 0.030872344970703125, 0.03682136535644531, 0.0427703857421875, 0.04871940612792969, 0.054668426513671875, 0.06061744689941406, 0.06656646728515625, 0.07251548767089844, 0.07846450805664062, 0.08441352844238281, 0.090362548828125, 0.09631156921386719, 0.10226058959960938, 0.10820960998535156, 0.11415863037109375, 0.12010765075683594, 0.12605667114257812, 0.1320056915283203, 0.1379547119140625, 0.1439037322998047, 0.14985275268554688, 0.15580177307128906, 0.16175079345703125, 0.16769981384277344, 0.17364883422851562, 0.1795978546142578, 0.185546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 4.0, 6.0, 15.0, 15.0, 22.0, 26.0, 40.0, 39.0, 36.0, 45.0, 36.0, 35.0, 52.0, 58.0, 60.0, 58.0, 68.0, 44.0, 62.0, 44.0, 41.0, 42.0, 24.0, 27.0, 23.0, 20.0, 14.0, 8.0, 5.0, 3.0, 7.0, 2.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.564453125, -1.5181884765625, -1.471923828125, -1.4256591796875, -1.37939453125, -1.3331298828125, -1.286865234375, -1.2406005859375, -1.1943359375, -1.1480712890625, -1.101806640625, -1.0555419921875, -1.00927734375, -0.9630126953125, -0.916748046875, -0.8704833984375, -0.82421875, -0.7779541015625, -0.731689453125, -0.6854248046875, -0.63916015625, -0.5928955078125, -0.546630859375, -0.5003662109375, -0.4541015625, -0.4078369140625, -0.361572265625, -0.3153076171875, -0.26904296875, -0.2227783203125, -0.176513671875, -0.1302490234375, -0.083984375, -0.0377197265625, 0.008544921875, 0.0548095703125, 0.10107421875, 0.1473388671875, 0.193603515625, 0.2398681640625, 0.2861328125, 0.3323974609375, 0.378662109375, 0.4249267578125, 0.47119140625, 0.5174560546875, 0.563720703125, 0.6099853515625, 0.65625, 0.7025146484375, 0.748779296875, 0.7950439453125, 0.84130859375, 0.8875732421875, 0.933837890625, 0.9801025390625, 1.0263671875, 1.0726318359375, 1.118896484375, 1.1651611328125, 1.21142578125, 1.2576904296875, 1.303955078125, 1.3502197265625, 1.396484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 9.0, 11.0, 26.0, 21.0, 33.0, 46.0, 61.0, 97.0, 163.0, 211.0, 300.0, 566.0, 900.0, 1583.0, 3310.0, 8402.0, 26753.0, 131765.0, 550185.0, 256901.0, 45408.0, 12214.0, 4520.0, 2075.0, 1132.0, 635.0, 408.0, 256.0, 169.0, 114.0, 73.0, 48.0, 33.0, 29.0, 19.0, 14.0, 12.0, 10.0, 9.0, 6.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0787353515625, -0.07632637023925781, -0.07391738891601562, -0.07150840759277344, -0.06909942626953125, -0.06669044494628906, -0.06428146362304688, -0.06187248229980469, -0.0594635009765625, -0.05705451965332031, -0.054645538330078125, -0.05223655700683594, -0.04982757568359375, -0.04741859436035156, -0.045009613037109375, -0.04260063171386719, -0.040191650390625, -0.03778266906738281, -0.035373687744140625, -0.03296470642089844, -0.03055572509765625, -0.028146743774414062, -0.025737762451171875, -0.023328781127929688, -0.0209197998046875, -0.018510818481445312, -0.016101837158203125, -0.013692855834960938, -0.01128387451171875, -0.008874893188476562, -0.006465911865234375, -0.0040569305419921875, -0.00164794921875, 0.0007610321044921875, 0.003170013427734375, 0.0055789947509765625, 0.00798797607421875, 0.010396957397460938, 0.012805938720703125, 0.015214920043945312, 0.0176239013671875, 0.020032882690429688, 0.022441864013671875, 0.024850845336914062, 0.02725982666015625, 0.029668807983398438, 0.032077789306640625, 0.03448677062988281, 0.036895751953125, 0.03930473327636719, 0.041713714599609375, 0.04412269592285156, 0.04653167724609375, 0.04894065856933594, 0.051349639892578125, 0.05375862121582031, 0.0561676025390625, 0.05857658386230469, 0.060985565185546875, 0.06339454650878906, 0.06580352783203125, 0.06821250915527344, 0.07062149047851562, 0.07303047180175781, 0.075439453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 12.0, 8.0, 36.0, 81.0, 232.0, 344.0, 185.0, 53.0, 19.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.00010955985635519028, -0.0001056920737028122, -0.00010182429105043411, -9.795650839805603e-05, -9.408872574567795e-05, -9.022094309329987e-05, -8.635316044092178e-05, -8.24853777885437e-05, -7.861759513616562e-05, -7.474981248378754e-05, -7.088202983140945e-05, -6.701424717903137e-05, -6.314646452665329e-05, -5.927868187427521e-05, -5.5410899221897125e-05, -5.154311656951904e-05, -4.767533391714096e-05, -4.380755126476288e-05, -3.9939768612384796e-05, -3.6071985960006714e-05, -3.220420330762863e-05, -2.833642065525055e-05, -2.4468638002872467e-05, -2.0600855350494385e-05, -1.6733072698116302e-05, -1.286529004573822e-05, -8.997507393360138e-06, -5.129724740982056e-06, -1.2619420886039734e-06, 2.605840563774109e-06, 6.473623216152191e-06, 1.0341405868530273e-05, 1.4209188520908356e-05, 1.8076971173286438e-05, 2.194475382566452e-05, 2.5812536478042603e-05, 2.9680319130420685e-05, 3.354810178279877e-05, 3.741588443517685e-05, 4.128366708755493e-05, 4.5151449739933014e-05, 4.9019232392311096e-05, 5.288701504468918e-05, 5.675479769706726e-05, 6.062258034944534e-05, 6.449036300182343e-05, 6.835814565420151e-05, 7.222592830657959e-05, 7.609371095895767e-05, 7.996149361133575e-05, 8.382927626371384e-05, 8.769705891609192e-05, 9.156484156847e-05, 9.543262422084808e-05, 9.930040687322617e-05, 0.00010316818952560425, 0.00010703597217798233, 0.00011090375483036041, 0.0001147715374827385, 0.00011863932013511658, 0.00012250710278749466, 0.00012637488543987274, 0.00013024266809225082, 0.0001341104507446289]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 5.0, 8.0, 14.0, 20.0, 20.0, 35.0, 39.0, 56.0, 99.0, 140.0, 239.0, 354.0, 609.0, 1105.0, 1972.0, 4210.0, 10882.0, 36743.0, 160811.0, 486709.0, 259887.0, 57461.0, 15729.0, 5710.0, 2420.0, 1331.0, 698.0, 427.0, 284.0, 170.0, 120.0, 74.0, 42.0, 38.0, 26.0, 23.0, 6.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.07017135620117188, -0.06795501708984375, -0.06573867797851562, -0.0635223388671875, -0.061305999755859375, -0.05908966064453125, -0.056873321533203125, -0.054656982421875, -0.052440643310546875, -0.05022430419921875, -0.048007965087890625, -0.0457916259765625, -0.043575286865234375, -0.04135894775390625, -0.039142608642578125, -0.03692626953125, -0.034709930419921875, -0.03249359130859375, -0.030277252197265625, -0.0280609130859375, -0.025844573974609375, -0.02362823486328125, -0.021411895751953125, -0.019195556640625, -0.016979217529296875, -0.01476287841796875, -0.012546539306640625, -0.0103302001953125, -0.008113861083984375, -0.00589752197265625, -0.003681182861328125, -0.00146484375, 0.000751495361328125, 0.00296783447265625, 0.005184173583984375, 0.0074005126953125, 0.009616851806640625, 0.01183319091796875, 0.014049530029296875, 0.016265869140625, 0.018482208251953125, 0.02069854736328125, 0.022914886474609375, 0.0251312255859375, 0.027347564697265625, 0.02956390380859375, 0.031780242919921875, 0.03399658203125, 0.036212921142578125, 0.03842926025390625, 0.040645599365234375, 0.0428619384765625, 0.045078277587890625, 0.04729461669921875, 0.049510955810546875, 0.051727294921875, 0.053943634033203125, 0.05615997314453125, 0.058376312255859375, 0.0605926513671875, 0.06280899047851562, 0.06502532958984375, 0.06724166870117188, 0.0694580078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 7.0, 4.0, 5.0, 9.0, 12.0, 12.0, 20.0, 29.0, 28.0, 36.0, 41.0, 63.0, 71.0, 75.0, 82.0, 77.0, 76.0, 67.0, 67.0, 46.0, 33.0, 27.0, 22.0, 14.0, 22.0, 13.0, 12.0, 9.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.01701831817626953, -0.016443252563476562, -0.015868186950683594, -0.015293121337890625, -0.014718055725097656, -0.014142990112304688, -0.013567924499511719, -0.01299285888671875, -0.012417793273925781, -0.011842727661132812, -0.011267662048339844, -0.010692596435546875, -0.010117530822753906, -0.009542465209960938, -0.008967399597167969, -0.008392333984375, -0.007817268371582031, -0.0072422027587890625, -0.006667137145996094, -0.006092071533203125, -0.005517005920410156, -0.0049419403076171875, -0.004366874694824219, -0.00379180908203125, -0.0032167434692382812, -0.0026416778564453125, -0.0020666122436523438, -0.001491546630859375, -0.0009164810180664062, -0.0003414154052734375, 0.00023365020751953125, 0.0008087158203125, 0.0013837814331054688, 0.0019588470458984375, 0.0025339126586914062, 0.003108978271484375, 0.0036840438842773438, 0.0042591094970703125, 0.004834175109863281, 0.00540924072265625, 0.005984306335449219, 0.0065593719482421875, 0.007134437561035156, 0.007709503173828125, 0.008284568786621094, 0.008859634399414062, 0.009434700012207031, 0.010009765625, 0.010584831237792969, 0.011159896850585938, 0.011734962463378906, 0.012310028076171875, 0.012885093688964844, 0.013460159301757812, 0.014035224914550781, 0.01461029052734375, 0.015185356140136719, 0.015760421752929688, 0.016335487365722656, 0.016910552978515625, 0.017485618591308594, 0.018060684204101562, 0.01863574981689453, 0.0192108154296875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 13.0, 11.0, 25.0, 77.0, 170.0, 293.0, 228.0, 113.0, 37.0, 16.0, 8.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.750623941421509, -3.6717898845672607, -3.5929555892944336, -3.5141215324401855, -3.4352874755859375, -3.3564534187316895, -3.2776191234588623, -3.1987850666046143, -3.119950771331787, -3.041116714477539, -2.962282419204712, -2.883448362350464, -2.804614305496216, -2.7257800102233887, -2.6469459533691406, -2.5681118965148926, -2.4892778396606445, -2.4104437828063965, -2.3316094875335693, -2.2527754306793213, -2.1739413738250732, -2.095107078552246, -2.016273021697998, -1.93743896484375, -1.8586047887802124, -1.7797706127166748, -1.7009365558624268, -1.6221023797988892, -1.5432682037353516, -1.4644341468811035, -1.385599970817566, -1.3067657947540283, -1.2279317378997803, -1.1490975618362427, -1.0702635049819946, -0.991429328918457, -0.9125952124595642, -0.8337610960006714, -0.7549269199371338, -0.676092803478241, -0.5972586870193481, -0.5184245705604553, -0.4395904242992401, -0.3607562780380249, -0.2819221615791321, -0.20308804512023926, -0.12425389885902405, -0.04541975259780884, 0.033414363861083984, 0.112248495221138, 0.19108262658119202, 0.2699167728424072, 0.34875088930130005, 0.42758500576019287, 0.5064191818237305, 0.5852532982826233, 0.6640874147415161, 0.7429215312004089, 0.8217556476593018, 0.9005898237228394, 0.9794239401817322, 1.058258056640625, 1.1370922327041626, 1.2159264087677002, 1.2947604656219482]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 6.0, 12.0, 14.0, 18.0, 18.0, 26.0, 35.0, 31.0, 44.0, 56.0, 67.0, 64.0, 73.0, 79.0, 71.0, 76.0, 58.0, 52.0, 42.0, 45.0, 25.0, 24.0, 11.0, 7.0, 14.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8210428357124329, -0.7928128838539124, -0.7645828723907471, -0.7363529205322266, -0.708122968673706, -0.6798929572105408, -0.6516630053520203, -0.623432993888855, -0.5952030420303345, -0.566973090171814, -0.5387430787086487, -0.5105131268501282, -0.4822831451892853, -0.4540531635284424, -0.4258232116699219, -0.397593230009079, -0.36936327815055847, -0.3411332964897156, -0.31290334463119507, -0.2846733629703522, -0.2564433813095093, -0.22821341454982758, -0.19998344779014587, -0.17175346612930298, -0.14352349936962128, -0.11529352515935898, -0.08706355094909668, -0.05883358418941498, -0.03060360997915268, -0.002373635768890381, 0.02585633099079132, 0.054086312651634216, 0.08231627941131592, 0.11054625362157822, 0.13877622783184052, 0.16700619459152222, 0.1952361762523651, 0.22346614301204681, 0.2516961097717285, 0.2799260914325714, 0.3081560730934143, 0.3363860547542572, 0.3646160066127777, 0.3928459882736206, 0.4210759699344635, 0.4493059515953064, 0.4775359034538269, 0.5057659149169922, 0.5339958667755127, 0.5622258186340332, 0.5904558300971985, 0.618685781955719, 0.6469157338142395, 0.6751457452774048, 0.7033756971359253, 0.7316056489944458, 0.7598356008529663, 0.7880655527114868, 0.8162955641746521, 0.8445255160331726, 0.8727554678916931, 0.9009854793548584, 0.9292154312133789, 0.9574453830718994, 0.9856753945350647]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 11.0, 17.0, 24.0, 25.0, 37.0, 45.0, 81.0, 144.0, 271.0, 446.0, 915.0, 2080.0, 5970.0, 23429.0, 157744.0, 742349.0, 91118.0, 15912.0, 4517.0, 1649.0, 764.0, 375.0, 218.0, 155.0, 65.0, 57.0, 44.0, 16.0, 14.0, 8.0, 13.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99658203125, -0.9667205810546875, -0.936859130859375, -0.9069976806640625, -0.87713623046875, -0.8472747802734375, -0.817413330078125, -0.7875518798828125, -0.7576904296875, -0.7278289794921875, -0.697967529296875, -0.6681060791015625, -0.63824462890625, -0.6083831787109375, -0.578521728515625, -0.5486602783203125, -0.518798828125, -0.4889373779296875, -0.459075927734375, -0.4292144775390625, -0.39935302734375, -0.3694915771484375, -0.339630126953125, -0.3097686767578125, -0.2799072265625, -0.2500457763671875, -0.220184326171875, -0.1903228759765625, -0.16046142578125, -0.1305999755859375, -0.100738525390625, -0.0708770751953125, -0.041015625, -0.0111541748046875, 0.018707275390625, 0.0485687255859375, 0.07843017578125, 0.1082916259765625, 0.138153076171875, 0.1680145263671875, 0.1978759765625, 0.2277374267578125, 0.257598876953125, 0.2874603271484375, 0.31732177734375, 0.3471832275390625, 0.377044677734375, 0.4069061279296875, 0.436767578125, 0.4666290283203125, 0.496490478515625, 0.5263519287109375, 0.55621337890625, 0.5860748291015625, 0.615936279296875, 0.6457977294921875, 0.6756591796875, 0.7055206298828125, 0.735382080078125, 0.7652435302734375, 0.79510498046875, 0.8249664306640625, 0.854827880859375, 0.8846893310546875, 0.91455078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 7.0, 8.0, 6.0, 11.0, 8.0, 12.0, 17.0, 11.0, 32.0, 31.0, 40.0, 40.0, 52.0, 53.0, 60.0, 66.0, 79.0, 66.0, 64.0, 60.0, 59.0, 48.0, 28.0, 29.0, 28.0, 18.0, 17.0, 11.0, 12.0, 9.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.736328125, -1.6845550537109375, -1.632781982421875, -1.5810089111328125, -1.52923583984375, -1.4774627685546875, -1.425689697265625, -1.3739166259765625, -1.3221435546875, -1.2703704833984375, -1.218597412109375, -1.1668243408203125, -1.11505126953125, -1.0632781982421875, -1.011505126953125, -0.9597320556640625, -0.907958984375, -0.8561859130859375, -0.804412841796875, -0.7526397705078125, -0.70086669921875, -0.6490936279296875, -0.597320556640625, -0.5455474853515625, -0.4937744140625, -0.4420013427734375, -0.390228271484375, -0.3384552001953125, -0.28668212890625, -0.2349090576171875, -0.183135986328125, -0.1313629150390625, -0.07958984375, -0.0278167724609375, 0.023956298828125, 0.0757293701171875, 0.12750244140625, 0.1792755126953125, 0.231048583984375, 0.2828216552734375, 0.3345947265625, 0.3863677978515625, 0.438140869140625, 0.4899139404296875, 0.54168701171875, 0.5934600830078125, 0.645233154296875, 0.6970062255859375, 0.748779296875, 0.8005523681640625, 0.852325439453125, 0.9040985107421875, 0.95587158203125, 1.0076446533203125, 1.059417724609375, 1.1111907958984375, 1.1629638671875, 1.2147369384765625, 1.266510009765625, 1.3182830810546875, 1.37005615234375, 1.4218292236328125, 1.473602294921875, 1.5253753662109375, 1.5771484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 10.0, 10.0, 7.0, 9.0, 11.0, 11.0, 19.0, 28.0, 31.0, 31.0, 28.0, 51.0, 73.0, 107.0, 174.0, 413.0, 1942.0, 19025.0, 942857.0, 78343.0, 4019.0, 685.0, 215.0, 136.0, 68.0, 54.0, 39.0, 26.0, 28.0, 19.0, 19.0, 13.0, 8.0, 8.0, 14.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.453125, -2.386260986328125, -2.31939697265625, -2.252532958984375, -2.1856689453125, -2.118804931640625, -2.05194091796875, -1.985076904296875, -1.918212890625, -1.851348876953125, -1.78448486328125, -1.717620849609375, -1.6507568359375, -1.583892822265625, -1.51702880859375, -1.450164794921875, -1.38330078125, -1.316436767578125, -1.24957275390625, -1.182708740234375, -1.1158447265625, -1.048980712890625, -0.98211669921875, -0.915252685546875, -0.848388671875, -0.781524658203125, -0.71466064453125, -0.647796630859375, -0.5809326171875, -0.514068603515625, -0.44720458984375, -0.380340576171875, -0.3134765625, -0.246612548828125, -0.17974853515625, -0.112884521484375, -0.0460205078125, 0.020843505859375, 0.08770751953125, 0.154571533203125, 0.221435546875, 0.288299560546875, 0.35516357421875, 0.422027587890625, 0.4888916015625, 0.555755615234375, 0.62261962890625, 0.689483642578125, 0.75634765625, 0.823211669921875, 0.89007568359375, 0.956939697265625, 1.0238037109375, 1.090667724609375, 1.15753173828125, 1.224395751953125, 1.291259765625, 1.358123779296875, 1.42498779296875, 1.491851806640625, 1.5587158203125, 1.625579833984375, 1.69244384765625, 1.759307861328125, 1.826171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 6.0, 9.0, 13.0, 15.0, 20.0, 24.0, 33.0, 21.0, 36.0, 33.0, 42.0, 44.0, 44.0, 51.0, 56.0, 60.0, 58.0, 54.0, 45.0, 51.0, 40.0, 38.0, 32.0, 29.0, 17.0, 20.0, 17.0, 17.0, 5.0, 11.0, 11.0, 5.0, 6.0, 10.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-1.9912109375, -1.938751220703125, -1.88629150390625, -1.833831787109375, -1.7813720703125, -1.728912353515625, -1.67645263671875, -1.623992919921875, -1.571533203125, -1.519073486328125, -1.46661376953125, -1.414154052734375, -1.3616943359375, -1.309234619140625, -1.25677490234375, -1.204315185546875, -1.15185546875, -1.099395751953125, -1.04693603515625, -0.994476318359375, -0.9420166015625, -0.889556884765625, -0.83709716796875, -0.784637451171875, -0.732177734375, -0.679718017578125, -0.62725830078125, -0.574798583984375, -0.5223388671875, -0.469879150390625, -0.41741943359375, -0.364959716796875, -0.3125, -0.260040283203125, -0.20758056640625, -0.155120849609375, -0.1026611328125, -0.050201416015625, 0.00225830078125, 0.054718017578125, 0.107177734375, 0.159637451171875, 0.21209716796875, 0.264556884765625, 0.3170166015625, 0.369476318359375, 0.42193603515625, 0.474395751953125, 0.52685546875, 0.579315185546875, 0.63177490234375, 0.684234619140625, 0.7366943359375, 0.789154052734375, 0.84161376953125, 0.894073486328125, 0.946533203125, 0.998992919921875, 1.05145263671875, 1.103912353515625, 1.1563720703125, 1.208831787109375, 1.26129150390625, 1.313751220703125, 1.3662109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 10.0, 10.0, 10.0, 23.0, 38.0, 80.0, 119.0, 254.0, 535.0, 1548.0, 7182.0, 175700.0, 842251.0, 16710.0, 2540.0, 812.0, 350.0, 145.0, 81.0, 50.0, 32.0, 16.0, 14.0, 6.0, 5.0, 9.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.845703125, -0.82232666015625, -0.7989501953125, -0.77557373046875, -0.752197265625, -0.72882080078125, -0.7054443359375, -0.68206787109375, -0.65869140625, -0.63531494140625, -0.6119384765625, -0.58856201171875, -0.565185546875, -0.54180908203125, -0.5184326171875, -0.49505615234375, -0.4716796875, -0.44830322265625, -0.4249267578125, -0.40155029296875, -0.378173828125, -0.35479736328125, -0.3314208984375, -0.30804443359375, -0.28466796875, -0.26129150390625, -0.2379150390625, -0.21453857421875, -0.191162109375, -0.16778564453125, -0.1444091796875, -0.12103271484375, -0.09765625, -0.07427978515625, -0.0509033203125, -0.02752685546875, -0.004150390625, 0.01922607421875, 0.0426025390625, 0.06597900390625, 0.08935546875, 0.11273193359375, 0.1361083984375, 0.15948486328125, 0.182861328125, 0.20623779296875, 0.2296142578125, 0.25299072265625, 0.2763671875, 0.29974365234375, 0.3231201171875, 0.34649658203125, 0.369873046875, 0.39324951171875, 0.4166259765625, 0.44000244140625, 0.46337890625, 0.48675537109375, 0.5101318359375, 0.53350830078125, 0.556884765625, 0.58026123046875, 0.6036376953125, 0.62701416015625, 0.650390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 8.0, 7.0, 13.0, 20.0, 28.0, 50.0, 77.0, 116.0, 302.0, 151.0, 83.0, 56.0, 25.0, 22.0, 12.0, 10.0, 2.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-05, -5.3301453590393066e-05, -5.0574541091918945e-05, -4.7847628593444824e-05, -4.51207160949707e-05, -4.239380359649658e-05, -3.966689109802246e-05, -3.693997859954834e-05, -3.421306610107422e-05, -3.14861536026001e-05, -2.8759241104125977e-05, -2.6032328605651855e-05, -2.3305416107177734e-05, -2.0578503608703613e-05, -1.7851591110229492e-05, -1.5124678611755371e-05, -1.239776611328125e-05, -9.670853614807129e-06, -6.943941116333008e-06, -4.217028617858887e-06, -1.4901161193847656e-06, 1.2367963790893555e-06, 3.9637088775634766e-06, 6.690621376037598e-06, 9.417533874511719e-06, 1.214444637298584e-05, 1.4871358871459961e-05, 1.7598271369934082e-05, 2.0325183868408203e-05, 2.3052096366882324e-05, 2.5779008865356445e-05, 2.8505921363830566e-05, 3.123283386230469e-05, 3.395974636077881e-05, 3.668665885925293e-05, 3.941357135772705e-05, 4.214048385620117e-05, 4.486739635467529e-05, 4.7594308853149414e-05, 5.0321221351623535e-05, 5.3048133850097656e-05, 5.577504634857178e-05, 5.85019588470459e-05, 6.122887134552002e-05, 6.395578384399414e-05, 6.668269634246826e-05, 6.940960884094238e-05, 7.21365213394165e-05, 7.486343383789062e-05, 7.759034633636475e-05, 8.031725883483887e-05, 8.304417133331299e-05, 8.577108383178711e-05, 8.849799633026123e-05, 9.122490882873535e-05, 9.395182132720947e-05, 9.66787338256836e-05, 9.940564632415771e-05, 0.00010213255882263184, 0.00010485947132110596, 0.00010758638381958008, 0.0001103132963180542, 0.00011304020881652832, 0.00011576712131500244, 0.00011849403381347656]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 4.0, 12.0, 5.0, 20.0, 19.0, 23.0, 25.0, 34.0, 47.0, 76.0, 100.0, 146.0, 186.0, 338.0, 694.0, 1539.0, 5548.0, 54366.0, 918792.0, 57556.0, 5675.0, 1526.0, 653.0, 389.0, 241.0, 150.0, 96.0, 64.0, 52.0, 34.0, 30.0, 14.0, 26.0, 20.0, 12.0, 14.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.74609375, -0.7208099365234375, -0.695526123046875, -0.6702423095703125, -0.64495849609375, -0.6196746826171875, -0.594390869140625, -0.5691070556640625, -0.5438232421875, -0.5185394287109375, -0.493255615234375, -0.4679718017578125, -0.44268798828125, -0.4174041748046875, -0.392120361328125, -0.3668365478515625, -0.341552734375, -0.3162689208984375, -0.290985107421875, -0.2657012939453125, -0.24041748046875, -0.2151336669921875, -0.189849853515625, -0.1645660400390625, -0.1392822265625, -0.1139984130859375, -0.088714599609375, -0.0634307861328125, -0.03814697265625, -0.0128631591796875, 0.012420654296875, 0.0377044677734375, 0.06298828125, 0.0882720947265625, 0.113555908203125, 0.1388397216796875, 0.16412353515625, 0.1894073486328125, 0.214691162109375, 0.2399749755859375, 0.2652587890625, 0.2905426025390625, 0.315826416015625, 0.3411102294921875, 0.36639404296875, 0.3916778564453125, 0.416961669921875, 0.4422454833984375, 0.467529296875, 0.4928131103515625, 0.518096923828125, 0.5433807373046875, 0.56866455078125, 0.5939483642578125, 0.619232177734375, 0.6445159912109375, 0.6697998046875, 0.6950836181640625, 0.720367431640625, 0.7456512451171875, 0.77093505859375, 0.7962188720703125, 0.821502685546875, 0.8467864990234375, 0.8720703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 7.0, 12.0, 16.0, 20.0, 27.0, 40.0, 78.0, 115.0, 243.0, 155.0, 80.0, 46.0, 38.0, 33.0, 16.0, 16.0, 16.0, 7.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.19429588317871094, -0.18705368041992188, -0.1798114776611328, -0.17256927490234375, -0.1653270721435547, -0.15808486938476562, -0.15084266662597656, -0.1436004638671875, -0.13635826110839844, -0.12911605834960938, -0.12187385559082031, -0.11463165283203125, -0.10738945007324219, -0.10014724731445312, -0.09290504455566406, -0.085662841796875, -0.07842063903808594, -0.07117843627929688, -0.06393623352050781, -0.05669403076171875, -0.04945182800292969, -0.042209625244140625, -0.03496742248535156, -0.0277252197265625, -0.020483016967773438, -0.013240814208984375, -0.0059986114501953125, 0.00124359130859375, 0.008485794067382812, 0.015727996826171875, 0.022970199584960938, 0.03021240234375, 0.03745460510253906, 0.044696807861328125, 0.05193901062011719, 0.05918121337890625, 0.06642341613769531, 0.07366561889648438, 0.08090782165527344, 0.0881500244140625, 0.09539222717285156, 0.10263442993164062, 0.10987663269042969, 0.11711883544921875, 0.12436103820800781, 0.13160324096679688, 0.13884544372558594, 0.146087646484375, 0.15332984924316406, 0.16057205200195312, 0.1678142547607422, 0.17505645751953125, 0.1822986602783203, 0.18954086303710938, 0.19678306579589844, 0.2040252685546875, 0.21126747131347656, 0.21850967407226562, 0.2257518768310547, 0.23299407958984375, 0.2402362823486328, 0.24747848510742188, 0.25472068786621094, 0.261962890625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 21.0, 54.0, 158.0, 361.0, 254.0, 94.0, 33.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.069937705993652, -3.862356424331665, -3.6547751426696777, -3.4471936225891113, -3.239612340927124, -3.0320310592651367, -2.8244495391845703, -2.616868257522583, -2.4092869758605957, -2.2017056941986084, -1.9941242933273315, -1.7865428924560547, -1.5789616107940674, -1.37138032913208, -1.1637989282608032, -0.9562175273895264, -0.7486362457275391, -0.541054904460907, -0.3334735631942749, -0.12589222192764282, 0.08168911933898926, 0.28927040100097656, 0.4968518018722534, 0.7044332027435303, 0.9120144844055176, 1.1195957660675049, 1.3271771669387817, 1.5347585678100586, 1.742339849472046, 1.9499211311340332, 2.1575026512145996, 2.365083932876587, 2.572665214538574, 2.7802464962005615, 2.987827777862549, 3.1954092979431152, 3.4029905796051025, 3.61057186126709, 3.8181533813476562, 4.025734901428223, 4.233315944671631, 4.440897464752197, 4.6484785079956055, 4.856060028076172, 5.063641548156738, 5.2712225914001465, 5.478804111480713, 5.686385154724121, 5.8939666748046875, 6.101548194885254, 6.309129238128662, 6.5167107582092285, 6.724291801452637, 6.931873321533203, 7.1394548416137695, 7.347036361694336, 7.554617404937744, 7.7621989250183105, 7.969779968261719, 8.177361488342285, 8.384943008422852, 8.592523574829102, 8.800105094909668, 9.007686614990234, 9.2152681350708]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 2.0, 10.0, 6.0, 7.0, 6.0, 14.0, 9.0, 21.0, 27.0, 29.0, 39.0, 24.0, 37.0, 30.0, 54.0, 43.0, 54.0, 49.0, 49.0, 34.0, 45.0, 51.0, 50.0, 49.0, 37.0, 33.0, 32.0, 27.0, 20.0, 22.0, 11.0, 18.0, 20.0, 9.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3316848278045654, -2.250019073486328, -2.16835355758667, -2.0866880416870117, -2.0050222873687744, -1.9233566522598267, -1.841691017150879, -1.7600253820419312, -1.6783597469329834, -1.5966941118240356, -1.515028476715088, -1.4333628416061401, -1.3516972064971924, -1.2700315713882446, -1.1883659362792969, -1.1067003011703491, -1.0250346660614014, -0.9433690309524536, -0.8617033958435059, -0.7800377607345581, -0.6983721256256104, -0.6167064905166626, -0.5350408554077148, -0.4533752202987671, -0.37170958518981934, -0.2900439500808716, -0.20837831497192383, -0.12671267986297607, -0.04504704475402832, 0.036618590354919434, 0.11828422546386719, 0.19994986057281494, 0.2816157341003418, 0.36328136920928955, 0.4449470043182373, 0.5266126394271851, 0.6082782745361328, 0.6899439096450806, 0.7716095447540283, 0.8532751798629761, 0.9349408149719238, 1.0166064500808716, 1.0982720851898193, 1.179937720298767, 1.2616033554077148, 1.3432689905166626, 1.4249346256256104, 1.506600260734558, 1.5882658958435059, 1.6699315309524536, 1.7515971660614014, 1.8332628011703491, 1.9149284362792969, 1.9965940713882446, 2.0782597064971924, 2.1599254608154297, 2.241590976715088, 2.323256492614746, 2.4049222469329834, 2.4865880012512207, 2.568253517150879, 2.649919033050537, 2.7315847873687744, 2.8132505416870117, 2.89491605758667]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 5.0, 11.0, 10.0, 17.0, 28.0, 34.0, 78.0, 111.0, 139.0, 250.0, 474.0, 891.0, 2099.0, 7984.0, 92449.0, 3778264.0, 295043.0, 11507.0, 2686.0, 1018.0, 491.0, 237.0, 154.0, 93.0, 57.0, 38.0, 38.0, 20.0, 16.0, 14.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.7528076171875, -2.665771484375, -2.5787353515625, -2.49169921875, -2.4046630859375, -2.317626953125, -2.2305908203125, -2.1435546875, -2.0565185546875, -1.969482421875, -1.8824462890625, -1.79541015625, -1.7083740234375, -1.621337890625, -1.5343017578125, -1.447265625, -1.3602294921875, -1.273193359375, -1.1861572265625, -1.09912109375, -1.0120849609375, -0.925048828125, -0.8380126953125, -0.7509765625, -0.6639404296875, -0.576904296875, -0.4898681640625, -0.40283203125, -0.3157958984375, -0.228759765625, -0.1417236328125, -0.0546875, 0.0323486328125, 0.119384765625, 0.2064208984375, 0.29345703125, 0.3804931640625, 0.467529296875, 0.5545654296875, 0.6416015625, 0.7286376953125, 0.815673828125, 0.9027099609375, 0.98974609375, 1.0767822265625, 1.163818359375, 1.2508544921875, 1.337890625, 1.4249267578125, 1.511962890625, 1.5989990234375, 1.68603515625, 1.7730712890625, 1.860107421875, 1.9471435546875, 2.0341796875, 2.1212158203125, 2.208251953125, 2.2952880859375, 2.38232421875, 2.4693603515625, 2.556396484375, 2.6434326171875, 2.73046875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 12.0, 12.0, 12.0, 19.0, 13.0, 31.0, 38.0, 32.0, 44.0, 59.0, 47.0, 59.0, 69.0, 66.0, 60.0, 61.0, 48.0, 56.0, 51.0, 38.0, 28.0, 36.0, 30.0, 16.0, 10.0, 10.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.83447265625, -0.8041000366210938, -0.7737274169921875, -0.7433547973632812, -0.712982177734375, -0.6826095581054688, -0.6522369384765625, -0.6218643188476562, -0.59149169921875, -0.5611190795898438, -0.5307464599609375, -0.5003738403320312, -0.470001220703125, -0.43962860107421875, -0.4092559814453125, -0.37888336181640625, -0.3485107421875, -0.31813812255859375, -0.2877655029296875, -0.25739288330078125, -0.227020263671875, -0.19664764404296875, -0.1662750244140625, -0.13590240478515625, -0.10552978515625, -0.07515716552734375, -0.0447845458984375, -0.01441192626953125, 0.015960693359375, 0.04633331298828125, 0.0767059326171875, 0.10707855224609375, 0.137451171875, 0.16782379150390625, 0.1981964111328125, 0.22856903076171875, 0.258941650390625, 0.28931427001953125, 0.3196868896484375, 0.35005950927734375, 0.38043212890625, 0.41080474853515625, 0.4411773681640625, 0.47154998779296875, 0.501922607421875, 0.5322952270507812, 0.5626678466796875, 0.5930404663085938, 0.6234130859375, 0.6537857055664062, 0.6841583251953125, 0.7145309448242188, 0.744903564453125, 0.7752761840820312, 0.8056488037109375, 0.8360214233398438, 0.86639404296875, 0.8967666625976562, 0.9271392822265625, 0.9575119018554688, 0.987884521484375, 1.0182571411132812, 1.0486297607421875, 1.0790023803710938, 1.109375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 12.0, 11.0, 24.0, 32.0, 75.0, 139.0, 316.0, 692.0, 1880.0, 6989.0, 45434.0, 3086619.0, 1016476.0, 27774.0, 5146.0, 1487.0, 586.0, 257.0, 138.0, 64.0, 48.0, 29.0, 13.0, 13.0, 7.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.835357666015625, -1.76446533203125, -1.693572998046875, -1.6226806640625, -1.551788330078125, -1.48089599609375, -1.410003662109375, -1.339111328125, -1.268218994140625, -1.19732666015625, -1.126434326171875, -1.0555419921875, -0.984649658203125, -0.91375732421875, -0.842864990234375, -0.77197265625, -0.701080322265625, -0.63018798828125, -0.559295654296875, -0.4884033203125, -0.417510986328125, -0.34661865234375, -0.275726318359375, -0.204833984375, -0.133941650390625, -0.06304931640625, 0.007843017578125, 0.0787353515625, 0.149627685546875, 0.22052001953125, 0.291412353515625, 0.3623046875, 0.433197021484375, 0.50408935546875, 0.574981689453125, 0.6458740234375, 0.716766357421875, 0.78765869140625, 0.858551025390625, 0.929443359375, 1.000335693359375, 1.07122802734375, 1.142120361328125, 1.2130126953125, 1.283905029296875, 1.35479736328125, 1.425689697265625, 1.49658203125, 1.567474365234375, 1.63836669921875, 1.709259033203125, 1.7801513671875, 1.851043701171875, 1.92193603515625, 1.992828369140625, 2.063720703125, 2.134613037109375, 2.20550537109375, 2.276397705078125, 2.3472900390625, 2.418182373046875, 2.48907470703125, 2.559967041015625, 2.630859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 4.0, 6.0, 4.0, 15.0, 19.0, 25.0, 29.0, 57.0, 82.0, 149.0, 296.0, 584.0, 875.0, 798.0, 501.0, 270.0, 137.0, 77.0, 51.0, 27.0, 21.0, 11.0, 11.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5662879943847656, -0.5500564575195312, -0.5338249206542969, -0.5175933837890625, -0.5013618469238281, -0.48513031005859375, -0.4688987731933594, -0.452667236328125, -0.4364356994628906, -0.42020416259765625, -0.4039726257324219, -0.3877410888671875, -0.3715095520019531, -0.35527801513671875, -0.3390464782714844, -0.32281494140625, -0.3065834045410156, -0.29035186767578125, -0.2741203308105469, -0.2578887939453125, -0.24165725708007812, -0.22542572021484375, -0.20919418334960938, -0.192962646484375, -0.17673110961914062, -0.16049957275390625, -0.14426803588867188, -0.1280364990234375, -0.11180496215820312, -0.09557342529296875, -0.07934188842773438, -0.0631103515625, -0.046878814697265625, -0.03064727783203125, -0.014415740966796875, 0.0018157958984375, 0.018047332763671875, 0.03427886962890625, 0.050510406494140625, 0.066741943359375, 0.08297348022460938, 0.09920501708984375, 0.11543655395507812, 0.1316680908203125, 0.14789962768554688, 0.16413116455078125, 0.18036270141601562, 0.19659423828125, 0.21282577514648438, 0.22905731201171875, 0.24528884887695312, 0.2615203857421875, 0.2777519226074219, 0.29398345947265625, 0.3102149963378906, 0.326446533203125, 0.3426780700683594, 0.35890960693359375, 0.3751411437988281, 0.3913726806640625, 0.4076042175292969, 0.42383575439453125, 0.4400672912597656, 0.456298828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 18.0, 25.0, 49.0, 52.0, 93.0, 137.0, 161.0, 161.0, 106.0, 67.0, 53.0, 30.0, 12.0, 9.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4348981380462646, -2.364973306655884, -2.295048475265503, -2.225123643875122, -2.155198812484741, -2.0852739810943604, -2.0153491497039795, -1.9454243183135986, -1.8754994869232178, -1.805574655532837, -1.735649824142456, -1.6657249927520752, -1.5958001613616943, -1.5258753299713135, -1.4559504985809326, -1.3860256671905518, -1.316100835800171, -1.24617600440979, -1.1762511730194092, -1.1063263416290283, -1.0364015102386475, -0.9664766788482666, -0.8965518474578857, -0.8266270160675049, -0.756702184677124, -0.6867773532867432, -0.6168525218963623, -0.5469276905059814, -0.4770028591156006, -0.4070780277252197, -0.33715319633483887, -0.267228364944458, -0.19730353355407715, -0.1273787021636963, -0.05745387077331543, 0.01247096061706543, 0.08239579200744629, 0.15232062339782715, 0.222245454788208, 0.29217028617858887, 0.3620951175689697, 0.4320199489593506, 0.5019447803497314, 0.5718696117401123, 0.6417944431304932, 0.711719274520874, 0.7816441059112549, 0.8515689373016357, 0.9214937686920166, 0.9914186000823975, 1.0613434314727783, 1.1312682628631592, 1.20119309425354, 1.271117925643921, 1.3410427570343018, 1.4109675884246826, 1.4808924198150635, 1.5508172512054443, 1.6207420825958252, 1.690666913986206, 1.760591745376587, 1.8305165767669678, 1.9004414081573486, 1.9703662395477295, 2.0402910709381104]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 5.0, 17.0, 13.0, 11.0, 14.0, 22.0, 25.0, 23.0, 27.0, 31.0, 33.0, 36.0, 47.0, 38.0, 44.0, 37.0, 37.0, 46.0, 35.0, 37.0, 46.0, 55.0, 44.0, 34.0, 32.0, 23.0, 27.0, 15.0, 20.0, 15.0, 18.0, 17.0, 12.0, 6.0, 8.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7492051124572754, -0.7236148715019226, -0.6980246901512146, -0.6724344491958618, -0.6468442678451538, -0.621254026889801, -0.5956637859344482, -0.5700736045837402, -0.5444833636283875, -0.5188931226730347, -0.49330294132232666, -0.4677127003669739, -0.4421224892139435, -0.4165322780609131, -0.3909420669078827, -0.3653518557548523, -0.3397616446018219, -0.3141714334487915, -0.2885812222957611, -0.2629910111427307, -0.23740077018737793, -0.21181055903434753, -0.18622034788131714, -0.16063012182712555, -0.13503991067409515, -0.10944969207048416, -0.08385947346687317, -0.05826926231384277, -0.03267904371023178, -0.007088825106620789, 0.018501386046409607, 0.044091612100601196, 0.06968182325363159, 0.09527204185724258, 0.12086226046085358, 0.14645247161388397, 0.17204269766807556, 0.19763290882110596, 0.22322311997413635, 0.24881334602832794, 0.27440357208251953, 0.2999937832355499, 0.3255839943885803, 0.3511742353439331, 0.3767644464969635, 0.4023546576499939, 0.4279448688030243, 0.4535350799560547, 0.4791252911090851, 0.5047155022621155, 0.5303057432174683, 0.5558959245681763, 0.581486165523529, 0.6070764064788818, 0.6326665878295898, 0.6582568287849426, 0.6838470101356506, 0.7094372510910034, 0.7350274324417114, 0.7606176733970642, 0.7862078547477722, 0.811798095703125, 0.837388277053833, 0.8629785180091858, 0.8885687589645386]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 5.0, 4.0, 5.0, 13.0, 17.0, 22.0, 32.0, 41.0, 57.0, 117.0, 205.0, 362.0, 656.0, 1235.0, 2368.0, 4953.0, 11935.0, 41902.0, 333614.0, 555331.0, 67395.0, 15782.0, 6339.0, 2890.0, 1457.0, 760.0, 410.0, 257.0, 132.0, 81.0, 59.0, 38.0, 25.0, 14.0, 10.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396484375, -0.38187408447265625, -0.3672637939453125, -0.35265350341796875, -0.338043212890625, -0.32343292236328125, -0.3088226318359375, -0.29421234130859375, -0.27960205078125, -0.26499176025390625, -0.2503814697265625, -0.23577117919921875, -0.221160888671875, -0.20655059814453125, -0.1919403076171875, -0.17733001708984375, -0.1627197265625, -0.14810943603515625, -0.1334991455078125, -0.11888885498046875, -0.104278564453125, -0.08966827392578125, -0.0750579833984375, -0.06044769287109375, -0.04583740234375, -0.03122711181640625, -0.0166168212890625, -0.00200653076171875, 0.012603759765625, 0.02721405029296875, 0.0418243408203125, 0.05643463134765625, 0.071044921875, 0.08565521240234375, 0.1002655029296875, 0.11487579345703125, 0.129486083984375, 0.14409637451171875, 0.1587066650390625, 0.17331695556640625, 0.18792724609375, 0.20253753662109375, 0.2171478271484375, 0.23175811767578125, 0.246368408203125, 0.26097869873046875, 0.2755889892578125, 0.29019927978515625, 0.3048095703125, 0.31941986083984375, 0.3340301513671875, 0.34864044189453125, 0.363250732421875, 0.37786102294921875, 0.3924713134765625, 0.40708160400390625, 0.42169189453125, 0.43630218505859375, 0.4509124755859375, 0.46552276611328125, 0.480133056640625, 0.49474334716796875, 0.5093536376953125, 0.5239639282226562, 0.53857421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 7.0, 5.0, 12.0, 10.0, 18.0, 14.0, 25.0, 20.0, 30.0, 28.0, 38.0, 28.0, 39.0, 53.0, 47.0, 43.0, 49.0, 50.0, 46.0, 48.0, 42.0, 40.0, 48.0, 45.0, 25.0, 26.0, 18.0, 21.0, 26.0, 12.0, 12.0, 10.0, 12.0, 8.0, 7.0, 11.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6533203125, -0.6338348388671875, -0.614349365234375, -0.5948638916015625, -0.57537841796875, -0.5558929443359375, -0.536407470703125, -0.5169219970703125, -0.4974365234375, -0.4779510498046875, -0.458465576171875, -0.4389801025390625, -0.41949462890625, -0.4000091552734375, -0.380523681640625, -0.3610382080078125, -0.341552734375, -0.3220672607421875, -0.302581787109375, -0.2830963134765625, -0.26361083984375, -0.2441253662109375, -0.224639892578125, -0.2051544189453125, -0.1856689453125, -0.1661834716796875, -0.146697998046875, -0.1272125244140625, -0.10772705078125, -0.0882415771484375, -0.068756103515625, -0.0492706298828125, -0.02978515625, -0.0102996826171875, 0.009185791015625, 0.0286712646484375, 0.04815673828125, 0.0676422119140625, 0.087127685546875, 0.1066131591796875, 0.1260986328125, 0.1455841064453125, 0.165069580078125, 0.1845550537109375, 0.20404052734375, 0.2235260009765625, 0.243011474609375, 0.2624969482421875, 0.281982421875, 0.3014678955078125, 0.320953369140625, 0.3404388427734375, 0.35992431640625, 0.3794097900390625, 0.398895263671875, 0.4183807373046875, 0.4378662109375, 0.4573516845703125, 0.476837158203125, 0.4963226318359375, 0.51580810546875, 0.5352935791015625, 0.554779052734375, 0.5742645263671875, 0.59375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 9.0, 9.0, 14.0, 25.0, 28.0, 50.0, 73.0, 120.0, 192.0, 307.0, 496.0, 879.0, 1683.0, 3036.0, 5958.0, 13138.0, 33540.0, 110524.0, 397603.0, 340832.0, 89634.0, 28005.0, 11055.0, 5245.0, 2723.0, 1444.0, 783.0, 430.0, 251.0, 168.0, 106.0, 59.0, 41.0, 28.0, 19.0, 16.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2489013671875, -0.2417736053466797, -0.23464584350585938, -0.22751808166503906, -0.22039031982421875, -0.21326255798339844, -0.20613479614257812, -0.1990070343017578, -0.1918792724609375, -0.1847515106201172, -0.17762374877929688, -0.17049598693847656, -0.16336822509765625, -0.15624046325683594, -0.14911270141601562, -0.1419849395751953, -0.134857177734375, -0.1277294158935547, -0.12060165405273438, -0.11347389221191406, -0.10634613037109375, -0.09921836853027344, -0.09209060668945312, -0.08496284484863281, -0.0778350830078125, -0.07070732116699219, -0.06357955932617188, -0.05645179748535156, -0.04932403564453125, -0.04219627380371094, -0.035068511962890625, -0.027940750122070312, -0.02081298828125, -0.013685226440429688, -0.006557464599609375, 0.0005702972412109375, 0.00769805908203125, 0.014825820922851562, 0.021953582763671875, 0.029081344604492188, 0.0362091064453125, 0.04333686828613281, 0.050464630126953125, 0.05759239196777344, 0.06472015380859375, 0.07184791564941406, 0.07897567749023438, 0.08610343933105469, 0.093231201171875, 0.10035896301269531, 0.10748672485351562, 0.11461448669433594, 0.12174224853515625, 0.12887001037597656, 0.13599777221679688, 0.1431255340576172, 0.1502532958984375, 0.1573810577392578, 0.16450881958007812, 0.17163658142089844, 0.17876434326171875, 0.18589210510253906, 0.19301986694335938, 0.2001476287841797, 0.207275390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 3.0, 6.0, 5.0, 11.0, 8.0, 13.0, 8.0, 20.0, 19.0, 25.0, 18.0, 26.0, 28.0, 26.0, 40.0, 38.0, 44.0, 38.0, 54.0, 38.0, 43.0, 44.0, 47.0, 57.0, 38.0, 40.0, 38.0, 33.0, 32.0, 26.0, 25.0, 18.0, 16.0, 11.0, 11.0, 11.0, 5.0, 10.0, 4.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.166015625, -1.1275482177734375, -1.089080810546875, -1.0506134033203125, -1.01214599609375, -0.9736785888671875, -0.935211181640625, -0.8967437744140625, -0.8582763671875, -0.8198089599609375, -0.781341552734375, -0.7428741455078125, -0.70440673828125, -0.6659393310546875, -0.627471923828125, -0.5890045166015625, -0.550537109375, -0.5120697021484375, -0.473602294921875, -0.4351348876953125, -0.39666748046875, -0.3582000732421875, -0.319732666015625, -0.2812652587890625, -0.2427978515625, -0.2043304443359375, -0.165863037109375, -0.1273956298828125, -0.08892822265625, -0.0504608154296875, -0.011993408203125, 0.0264739990234375, 0.06494140625, 0.1034088134765625, 0.141876220703125, 0.1803436279296875, 0.21881103515625, 0.2572784423828125, 0.295745849609375, 0.3342132568359375, 0.3726806640625, 0.4111480712890625, 0.449615478515625, 0.4880828857421875, 0.52655029296875, 0.5650177001953125, 0.603485107421875, 0.6419525146484375, 0.680419921875, 0.7188873291015625, 0.757354736328125, 0.7958221435546875, 0.83428955078125, 0.8727569580078125, 0.911224365234375, 0.9496917724609375, 0.9881591796875, 1.0266265869140625, 1.065093994140625, 1.1035614013671875, 1.14202880859375, 1.1804962158203125, 1.218963623046875, 1.2574310302734375, 1.2958984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 17.0, 11.0, 10.0, 27.0, 28.0, 34.0, 64.0, 117.0, 182.0, 326.0, 517.0, 1057.0, 2036.0, 4688.0, 12753.0, 49454.0, 254611.0, 520341.0, 154109.0, 31658.0, 9341.0, 3603.0, 1605.0, 813.0, 441.0, 263.0, 176.0, 91.0, 55.0, 32.0, 23.0, 21.0, 7.0, 11.0, 10.0, 2.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08233642578125, -0.07979106903076172, -0.07724571228027344, -0.07470035552978516, -0.07215499877929688, -0.0696096420288086, -0.06706428527832031, -0.06451892852783203, -0.06197357177734375, -0.05942821502685547, -0.05688285827636719, -0.054337501525878906, -0.051792144775390625, -0.049246788024902344, -0.04670143127441406, -0.04415607452392578, -0.0416107177734375, -0.03906536102294922, -0.03652000427246094, -0.033974647521972656, -0.031429290771484375, -0.028883934020996094, -0.026338577270507812, -0.02379322052001953, -0.02124786376953125, -0.01870250701904297, -0.016157150268554688, -0.013611793518066406, -0.011066436767578125, -0.008521080017089844, -0.0059757232666015625, -0.0034303665161132812, -0.000885009765625, 0.0016603469848632812, 0.0042057037353515625, 0.006751060485839844, 0.009296417236328125, 0.011841773986816406, 0.014387130737304688, 0.01693248748779297, 0.01947784423828125, 0.02202320098876953, 0.024568557739257812, 0.027113914489746094, 0.029659271240234375, 0.032204627990722656, 0.03474998474121094, 0.03729534149169922, 0.0398406982421875, 0.04238605499267578, 0.04493141174316406, 0.047476768493652344, 0.050022125244140625, 0.052567481994628906, 0.05511283874511719, 0.05765819549560547, 0.06020355224609375, 0.06274890899658203, 0.06529426574707031, 0.0678396224975586, 0.07038497924804688, 0.07293033599853516, 0.07547569274902344, 0.07802104949951172, 0.08056640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 8.0, 14.0, 24.0, 22.0, 32.0, 45.0, 62.0, 90.0, 72.0, 91.0, 92.0, 91.0, 87.0, 65.0, 43.0, 33.0, 32.0, 15.0, 16.0, 9.0, 5.0, 6.0, 6.0, 6.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.612041473388672e-05, -3.492925316095352e-05, -3.3738091588020325e-05, -3.254693001508713e-05, -3.135576844215393e-05, -3.0164606869220734e-05, -2.8973445296287537e-05, -2.778228372335434e-05, -2.6591122150421143e-05, -2.5399960577487946e-05, -2.420879900455475e-05, -2.301763743162155e-05, -2.1826475858688354e-05, -2.0635314285755157e-05, -1.944415271282196e-05, -1.8252991139888763e-05, -1.7061829566955566e-05, -1.587066799402237e-05, -1.4679506421089172e-05, -1.3488344848155975e-05, -1.2297183275222778e-05, -1.1106021702289581e-05, -9.914860129356384e-06, -8.723698556423187e-06, -7.53253698348999e-06, -6.341375410556793e-06, -5.150213837623596e-06, -3.959052264690399e-06, -2.767890691757202e-06, -1.5767291188240051e-06, -3.855675458908081e-07, 8.055940270423889e-07, 1.996755599975586e-06, 3.187917172908783e-06, 4.37907874584198e-06, 5.570240318775177e-06, 6.761401891708374e-06, 7.952563464641571e-06, 9.143725037574768e-06, 1.0334886610507965e-05, 1.1526048183441162e-05, 1.2717209756374359e-05, 1.3908371329307556e-05, 1.5099532902240753e-05, 1.629069447517395e-05, 1.7481856048107147e-05, 1.8673017621040344e-05, 1.986417919397354e-05, 2.1055340766906738e-05, 2.2246502339839935e-05, 2.3437663912773132e-05, 2.462882548570633e-05, 2.5819987058639526e-05, 2.7011148631572723e-05, 2.820231020450592e-05, 2.9393471777439117e-05, 3.0584633350372314e-05, 3.177579492330551e-05, 3.296695649623871e-05, 3.4158118069171906e-05, 3.53492796421051e-05, 3.65404412150383e-05, 3.7731602787971497e-05, 3.8922764360904694e-05, 4.011392593383789e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 6.0, 11.0, 23.0, 31.0, 74.0, 117.0, 198.0, 375.0, 856.0, 2116.0, 6204.0, 24994.0, 143571.0, 565553.0, 249919.0, 40340.0, 9103.0, 2829.0, 1129.0, 501.0, 237.0, 139.0, 85.0, 34.0, 27.0, 13.0, 16.0, 5.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.104736328125, -0.10142707824707031, -0.09811782836914062, -0.09480857849121094, -0.09149932861328125, -0.08819007873535156, -0.08488082885742188, -0.08157157897949219, -0.0782623291015625, -0.07495307922363281, -0.07164382934570312, -0.06833457946777344, -0.06502532958984375, -0.06171607971191406, -0.058406829833984375, -0.05509757995605469, -0.051788330078125, -0.04847908020019531, -0.045169830322265625, -0.04186058044433594, -0.03855133056640625, -0.03524208068847656, -0.031932830810546875, -0.028623580932617188, -0.0253143310546875, -0.022005081176757812, -0.018695831298828125, -0.015386581420898438, -0.01207733154296875, -0.008768081665039062, -0.005458831787109375, -0.0021495819091796875, 0.00115966796875, 0.0044689178466796875, 0.007778167724609375, 0.011087417602539062, 0.01439666748046875, 0.017705917358398438, 0.021015167236328125, 0.024324417114257812, 0.0276336669921875, 0.030942916870117188, 0.034252166748046875, 0.03756141662597656, 0.04087066650390625, 0.04417991638183594, 0.047489166259765625, 0.05079841613769531, 0.054107666015625, 0.05741691589355469, 0.060726165771484375, 0.06403541564941406, 0.06734466552734375, 0.07065391540527344, 0.07396316528320312, 0.07727241516113281, 0.0805816650390625, 0.08389091491699219, 0.08720016479492188, 0.09050941467285156, 0.09381866455078125, 0.09712791442871094, 0.10043716430664062, 0.10374641418457031, 0.1070556640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 0.0, 10.0, 14.0, 15.0, 27.0, 38.0, 48.0, 83.0, 79.0, 108.0, 100.0, 115.0, 96.0, 70.0, 61.0, 42.0, 29.0, 24.0, 10.0, 8.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03045654296875, -0.02939748764038086, -0.02833843231201172, -0.027279376983642578, -0.026220321655273438, -0.025161266326904297, -0.024102210998535156, -0.023043155670166016, -0.021984100341796875, -0.020925045013427734, -0.019865989685058594, -0.018806934356689453, -0.017747879028320312, -0.016688823699951172, -0.01562976837158203, -0.01457071304321289, -0.01351165771484375, -0.01245260238647461, -0.011393547058105469, -0.010334491729736328, -0.009275436401367188, -0.008216381072998047, -0.007157325744628906, -0.006098270416259766, -0.005039215087890625, -0.003980159759521484, -0.0029211044311523438, -0.0018620491027832031, -0.0008029937744140625, 0.0002560615539550781, 0.0013151168823242188, 0.0023741722106933594, 0.0034332275390625, 0.004492282867431641, 0.005551338195800781, 0.006610393524169922, 0.0076694488525390625, 0.008728504180908203, 0.009787559509277344, 0.010846614837646484, 0.011905670166015625, 0.012964725494384766, 0.014023780822753906, 0.015082836151123047, 0.016141891479492188, 0.017200946807861328, 0.01826000213623047, 0.01931905746459961, 0.02037811279296875, 0.02143716812133789, 0.02249622344970703, 0.023555278778076172, 0.024614334106445312, 0.025673389434814453, 0.026732444763183594, 0.027791500091552734, 0.028850555419921875, 0.029909610748291016, 0.030968666076660156, 0.0320277214050293, 0.03308677673339844, 0.03414583206176758, 0.03520488739013672, 0.03626394271850586, 0.037322998046875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 6.0, 10.0, 24.0, 22.0, 43.0, 65.0, 77.0, 132.0, 154.0, 138.0, 124.0, 79.0, 54.0, 21.0, 22.0, 12.0, 5.0, 1.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.242753028869629, -1.199507474899292, -1.1562620401382446, -1.1130164861679077, -1.0697710514068604, -1.0265254974365234, -0.9832800030708313, -0.9400345087051392, -0.896789014339447, -0.8535435199737549, -0.8102980256080627, -0.7670525312423706, -0.7238069772720337, -0.6805615425109863, -0.6373159885406494, -0.5940704941749573, -0.5508249998092651, -0.507579505443573, -0.46433401107788086, -0.42108848690986633, -0.3778429925441742, -0.33459749817848206, -0.29135197401046753, -0.2481064796447754, -0.20486098527908325, -0.1616154909133911, -0.11836998164653778, -0.07512447237968445, -0.03187897801399231, 0.011366516351699829, 0.054612040519714355, 0.0978575348854065, 0.14110314846038818, 0.18434864282608032, 0.22759415209293365, 0.270839661359787, 0.3140851557254791, 0.35733065009117126, 0.4005761742591858, 0.44382166862487793, 0.48706716299057007, 0.5303126573562622, 0.5735581517219543, 0.6168036460876465, 0.6600492000579834, 0.7032946348190308, 0.7465401887893677, 0.7897856831550598, 0.833031177520752, 0.8762766718864441, 0.9195221662521362, 0.9627677202224731, 1.0060131549835205, 1.0492587089538574, 1.0925042629241943, 1.1357496976852417, 1.178995132446289, 1.222240686416626, 1.2654861211776733, 1.3087316751480103, 1.3519771099090576, 1.3952226638793945, 1.4384682178497314, 1.4817136526107788, 1.5249592065811157]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 8.0, 13.0, 18.0, 12.0, 26.0, 26.0, 24.0, 35.0, 32.0, 46.0, 42.0, 47.0, 43.0, 42.0, 42.0, 53.0, 57.0, 47.0, 48.0, 54.0, 34.0, 48.0, 18.0, 22.0, 21.0, 19.0, 18.0, 19.0, 17.0, 11.0, 6.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6448963284492493, -0.6255130767822266, -0.6061298251152039, -0.5867465734481812, -0.5673632621765137, -0.547980010509491, -0.5285967588424683, -0.5092135071754456, -0.48983025550842285, -0.47044700384140015, -0.45106372237205505, -0.43168047070503235, -0.41229721903800964, -0.39291393756866455, -0.37353068590164185, -0.35414743423461914, -0.33476415276527405, -0.31538090109825134, -0.29599761962890625, -0.27661436796188354, -0.25723111629486084, -0.23784784972667694, -0.21846458315849304, -0.19908133149147034, -0.17969806492328644, -0.16031479835510254, -0.14093154668807983, -0.12154828011989594, -0.10216502100229263, -0.08278176188468933, -0.06339849531650543, -0.04401524364948273, -0.024631977081298828, -0.005248716101050377, 0.014134544879198074, 0.033517807722091675, 0.05290106683969498, 0.07228432595729828, 0.09166759252548218, 0.11105084419250488, 0.13043411076068878, 0.14981737732887268, 0.16920062899589539, 0.18858389556407928, 0.20796716213226318, 0.2273504137992859, 0.2467336803674698, 0.2661169171333313, 0.2855001986026764, 0.3048834502696991, 0.3242667317390442, 0.3436499834060669, 0.3630332350730896, 0.3824164867401123, 0.4017997682094574, 0.4211830198764801, 0.4405663013458252, 0.4599495530128479, 0.479332834482193, 0.4987160861492157, 0.5180993676185608, 0.5374826192855835, 0.5568658709526062, 0.5762491226196289, 0.5956323742866516]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 10.0, 14.0, 12.0, 29.0, 49.0, 53.0, 91.0, 165.0, 221.0, 403.0, 692.0, 1370.0, 2892.0, 6818.0, 19327.0, 65930.0, 279510.0, 507130.0, 114531.0, 31236.0, 10269.0, 3830.0, 1738.0, 881.0, 501.0, 293.0, 192.0, 104.0, 68.0, 66.0, 29.0, 23.0, 29.0, 11.0, 12.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.86181640625, -0.8392562866210938, -0.8166961669921875, -0.7941360473632812, -0.771575927734375, -0.7490158081054688, -0.7264556884765625, -0.7038955688476562, -0.68133544921875, -0.6587753295898438, -0.6362152099609375, -0.6136550903320312, -0.591094970703125, -0.5685348510742188, -0.5459747314453125, -0.5234146118164062, -0.5008544921875, -0.47829437255859375, -0.4557342529296875, -0.43317413330078125, -0.410614013671875, -0.38805389404296875, -0.3654937744140625, -0.34293365478515625, -0.32037353515625, -0.29781341552734375, -0.2752532958984375, -0.25269317626953125, -0.230133056640625, -0.20757293701171875, -0.1850128173828125, -0.16245269775390625, -0.139892578125, -0.11733245849609375, -0.0947723388671875, -0.07221221923828125, -0.049652099609375, -0.02709197998046875, -0.0045318603515625, 0.01802825927734375, 0.04058837890625, 0.06314849853515625, 0.0857086181640625, 0.10826873779296875, 0.130828857421875, 0.15338897705078125, 0.1759490966796875, 0.19850921630859375, 0.2210693359375, 0.24362945556640625, 0.2661895751953125, 0.28874969482421875, 0.311309814453125, 0.33386993408203125, 0.3564300537109375, 0.37899017333984375, 0.40155029296875, 0.42411041259765625, 0.4466705322265625, 0.46923065185546875, 0.491790771484375, 0.5143508911132812, 0.5369110107421875, 0.5594711303710938, 0.58203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 10.0, 14.0, 22.0, 16.0, 21.0, 21.0, 41.0, 35.0, 37.0, 51.0, 51.0, 58.0, 59.0, 65.0, 50.0, 45.0, 62.0, 46.0, 62.0, 42.0, 28.0, 27.0, 25.0, 29.0, 17.0, 10.0, 11.0, 16.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.428741455078125, -1.38677978515625, -1.344818115234375, -1.3028564453125, -1.260894775390625, -1.21893310546875, -1.176971435546875, -1.135009765625, -1.093048095703125, -1.05108642578125, -1.009124755859375, -0.9671630859375, -0.925201416015625, -0.88323974609375, -0.841278076171875, -0.79931640625, -0.757354736328125, -0.71539306640625, -0.673431396484375, -0.6314697265625, -0.589508056640625, -0.54754638671875, -0.505584716796875, -0.463623046875, -0.421661376953125, -0.37969970703125, -0.337738037109375, -0.2957763671875, -0.253814697265625, -0.21185302734375, -0.169891357421875, -0.1279296875, -0.085968017578125, -0.04400634765625, -0.002044677734375, 0.0399169921875, 0.081878662109375, 0.12384033203125, 0.165802001953125, 0.207763671875, 0.249725341796875, 0.29168701171875, 0.333648681640625, 0.3756103515625, 0.417572021484375, 0.45953369140625, 0.501495361328125, 0.54345703125, 0.585418701171875, 0.62738037109375, 0.669342041015625, 0.7113037109375, 0.753265380859375, 0.79522705078125, 0.837188720703125, 0.879150390625, 0.921112060546875, 0.96307373046875, 1.005035400390625, 1.0469970703125, 1.088958740234375, 1.13092041015625, 1.172882080078125, 1.21484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 7.0, 8.0, 12.0, 21.0, 23.0, 22.0, 38.0, 52.0, 75.0, 132.0, 230.0, 622.0, 3085.0, 127030.0, 900817.0, 14366.0, 1115.0, 374.0, 184.0, 104.0, 62.0, 44.0, 34.0, 22.0, 24.0, 17.0, 10.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.873046875, -2.793792724609375, -2.71453857421875, -2.635284423828125, -2.5560302734375, -2.476776123046875, -2.39752197265625, -2.318267822265625, -2.239013671875, -2.159759521484375, -2.08050537109375, -2.001251220703125, -1.9219970703125, -1.842742919921875, -1.76348876953125, -1.684234619140625, -1.60498046875, -1.525726318359375, -1.44647216796875, -1.367218017578125, -1.2879638671875, -1.208709716796875, -1.12945556640625, -1.050201416015625, -0.970947265625, -0.891693115234375, -0.81243896484375, -0.733184814453125, -0.6539306640625, -0.574676513671875, -0.49542236328125, -0.416168212890625, -0.3369140625, -0.257659912109375, -0.17840576171875, -0.099151611328125, -0.0198974609375, 0.059356689453125, 0.13861083984375, 0.217864990234375, 0.297119140625, 0.376373291015625, 0.45562744140625, 0.534881591796875, 0.6141357421875, 0.693389892578125, 0.77264404296875, 0.851898193359375, 0.93115234375, 1.010406494140625, 1.08966064453125, 1.168914794921875, 1.2481689453125, 1.327423095703125, 1.40667724609375, 1.485931396484375, 1.565185546875, 1.644439697265625, 1.72369384765625, 1.802947998046875, 1.8822021484375, 1.961456298828125, 2.04071044921875, 2.119964599609375, 2.19921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 14.0, 17.0, 14.0, 11.0, 33.0, 17.0, 21.0, 30.0, 34.0, 51.0, 39.0, 59.0, 42.0, 75.0, 44.0, 60.0, 57.0, 49.0, 46.0, 43.0, 32.0, 48.0, 29.0, 14.0, 23.0, 20.0, 11.0, 11.0, 11.0, 4.0, 9.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.63671875, -1.5918731689453125, -1.547027587890625, -1.5021820068359375, -1.45733642578125, -1.4124908447265625, -1.367645263671875, -1.3227996826171875, -1.2779541015625, -1.2331085205078125, -1.188262939453125, -1.1434173583984375, -1.09857177734375, -1.0537261962890625, -1.008880615234375, -0.9640350341796875, -0.919189453125, -0.8743438720703125, -0.829498291015625, -0.7846527099609375, -0.73980712890625, -0.6949615478515625, -0.650115966796875, -0.6052703857421875, -0.5604248046875, -0.5155792236328125, -0.470733642578125, -0.4258880615234375, -0.38104248046875, -0.3361968994140625, -0.291351318359375, -0.2465057373046875, -0.20166015625, -0.1568145751953125, -0.111968994140625, -0.0671234130859375, -0.02227783203125, 0.0225677490234375, 0.067413330078125, 0.1122589111328125, 0.1571044921875, 0.2019500732421875, 0.246795654296875, 0.2916412353515625, 0.33648681640625, 0.3813323974609375, 0.426177978515625, 0.4710235595703125, 0.515869140625, 0.5607147216796875, 0.605560302734375, 0.6504058837890625, 0.69525146484375, 0.7400970458984375, 0.784942626953125, 0.8297882080078125, 0.8746337890625, 0.9194793701171875, 0.964324951171875, 1.0091705322265625, 1.05401611328125, 1.0988616943359375, 1.143707275390625, 1.1885528564453125, 1.2333984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 11.0, 9.0, 21.0, 30.0, 43.0, 64.0, 123.0, 196.0, 338.0, 713.0, 1777.0, 6353.0, 34418.0, 372180.0, 572345.0, 48242.0, 7848.0, 2080.0, 772.0, 392.0, 195.0, 119.0, 77.0, 56.0, 30.0, 26.0, 15.0, 10.0, 16.0, 3.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3439521789550781, -0.33170318603515625, -0.3194541931152344, -0.3072052001953125, -0.2949562072753906, -0.28270721435546875, -0.2704582214355469, -0.258209228515625, -0.24596023559570312, -0.23371124267578125, -0.22146224975585938, -0.2092132568359375, -0.19696426391601562, -0.18471527099609375, -0.17246627807617188, -0.16021728515625, -0.14796829223632812, -0.13571929931640625, -0.12347030639648438, -0.1112213134765625, -0.09897232055664062, -0.08672332763671875, -0.07447433471679688, -0.062225341796875, -0.049976348876953125, -0.03772735595703125, -0.025478363037109375, -0.0132293701171875, -0.000980377197265625, 0.01126861572265625, 0.023517608642578125, 0.0357666015625, 0.048015594482421875, 0.06026458740234375, 0.07251358032226562, 0.0847625732421875, 0.09701156616210938, 0.10926055908203125, 0.12150955200195312, 0.133758544921875, 0.14600753784179688, 0.15825653076171875, 0.17050552368164062, 0.1827545166015625, 0.19500350952148438, 0.20725250244140625, 0.21950149536132812, 0.23175048828125, 0.24399948120117188, 0.25624847412109375, 0.2684974670410156, 0.2807464599609375, 0.2929954528808594, 0.30524444580078125, 0.3174934387207031, 0.329742431640625, 0.3419914245605469, 0.35424041748046875, 0.3664894104003906, 0.3787384033203125, 0.3909873962402344, 0.40323638916015625, 0.4154853820800781, 0.427734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 5.0, 6.0, 22.0, 20.0, 38.0, 42.0, 77.0, 109.0, 185.0, 135.0, 101.0, 68.0, 55.0, 28.0, 32.0, 20.0, 10.0, 7.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56382942199707e-05, -7.358472794294357e-05, -7.153116166591644e-05, -6.947759538888931e-05, -6.742402911186218e-05, -6.537046283483505e-05, -6.331689655780792e-05, -6.126333028078079e-05, -5.920976400375366e-05, -5.715619772672653e-05, -5.51026314496994e-05, -5.304906517267227e-05, -5.099549889564514e-05, -4.894193261861801e-05, -4.688836634159088e-05, -4.483480006456375e-05, -4.278123378753662e-05, -4.072766751050949e-05, -3.867410123348236e-05, -3.662053495645523e-05, -3.45669686794281e-05, -3.251340240240097e-05, -3.045983612537384e-05, -2.840626984834671e-05, -2.635270357131958e-05, -2.429913729429245e-05, -2.224557101726532e-05, -2.019200474023819e-05, -1.813843846321106e-05, -1.608487218618393e-05, -1.40313059091568e-05, -1.197773963212967e-05, -9.924173355102539e-06, -7.870607078075409e-06, -5.817040801048279e-06, -3.7634745240211487e-06, -1.7099082469940186e-06, 3.4365803003311157e-07, 2.3972243070602417e-06, 4.450790584087372e-06, 6.504356861114502e-06, 8.557923138141632e-06, 1.0611489415168762e-05, 1.2665055692195892e-05, 1.4718621969223022e-05, 1.6772188246250153e-05, 1.8825754523277283e-05, 2.0879320800304413e-05, 2.2932887077331543e-05, 2.4986453354358673e-05, 2.7040019631385803e-05, 2.9093585908412933e-05, 3.1147152185440063e-05, 3.3200718462467194e-05, 3.5254284739494324e-05, 3.7307851016521454e-05, 3.9361417293548584e-05, 4.1414983570575714e-05, 4.3468549847602844e-05, 4.5522116124629974e-05, 4.7575682401657104e-05, 4.9629248678684235e-05, 5.1682814955711365e-05, 5.3736381232738495e-05, 5.5789947509765625e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 10.0, 7.0, 12.0, 26.0, 35.0, 30.0, 77.0, 139.0, 267.0, 644.0, 1659.0, 4498.0, 21034.0, 235908.0, 714210.0, 56873.0, 8600.0, 2676.0, 967.0, 423.0, 217.0, 97.0, 64.0, 26.0, 16.0, 8.0, 12.0, 9.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.6796875, -0.6635932922363281, -0.6474990844726562, -0.6314048767089844, -0.6153106689453125, -0.5992164611816406, -0.5831222534179688, -0.5670280456542969, -0.550933837890625, -0.5348396301269531, -0.5187454223632812, -0.5026512145996094, -0.4865570068359375, -0.4704627990722656, -0.45436859130859375, -0.4382743835449219, -0.42218017578125, -0.4060859680175781, -0.38999176025390625, -0.3738975524902344, -0.3578033447265625, -0.3417091369628906, -0.32561492919921875, -0.3095207214355469, -0.293426513671875, -0.2773323059082031, -0.26123809814453125, -0.24514389038085938, -0.2290496826171875, -0.21295547485351562, -0.19686126708984375, -0.18076705932617188, -0.1646728515625, -0.14857864379882812, -0.13248443603515625, -0.11639022827148438, -0.1002960205078125, -0.08420181274414062, -0.06810760498046875, -0.052013397216796875, -0.035919189453125, -0.019824981689453125, -0.00373077392578125, 0.012363433837890625, 0.0284576416015625, 0.044551849365234375, 0.06064605712890625, 0.07674026489257812, 0.09283447265625, 0.10892868041992188, 0.12502288818359375, 0.14111709594726562, 0.1572113037109375, 0.17330551147460938, 0.18939971923828125, 0.20549392700195312, 0.221588134765625, 0.23768234252929688, 0.25377655029296875, 0.2698707580566406, 0.2859649658203125, 0.3020591735839844, 0.31815338134765625, 0.3342475891113281, 0.350341796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 24.0, 21.0, 21.0, 45.0, 64.0, 77.0, 98.0, 191.0, 117.0, 91.0, 72.0, 58.0, 23.0, 26.0, 12.0, 12.0, 3.0, 6.0, 4.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12446022033691406, -0.11842727661132812, -0.11239433288574219, -0.10636138916015625, -0.10032844543457031, -0.09429550170898438, -0.08826255798339844, -0.0822296142578125, -0.07619667053222656, -0.07016372680664062, -0.06413078308105469, -0.05809783935546875, -0.05206489562988281, -0.046031951904296875, -0.03999900817871094, -0.033966064453125, -0.027933120727539062, -0.021900177001953125, -0.015867233276367188, -0.00983428955078125, -0.0038013458251953125, 0.002231597900390625, 0.008264541625976562, 0.0142974853515625, 0.020330429077148438, 0.026363372802734375, 0.03239631652832031, 0.03842926025390625, 0.04446220397949219, 0.050495147705078125, 0.05652809143066406, 0.06256103515625, 0.06859397888183594, 0.07462692260742188, 0.08065986633300781, 0.08669281005859375, 0.09272575378417969, 0.09875869750976562, 0.10479164123535156, 0.1108245849609375, 0.11685752868652344, 0.12289047241210938, 0.1289234161376953, 0.13495635986328125, 0.1409893035888672, 0.14702224731445312, 0.15305519104003906, 0.159088134765625, 0.16512107849121094, 0.17115402221679688, 0.1771869659423828, 0.18321990966796875, 0.1892528533935547, 0.19528579711914062, 0.20131874084472656, 0.2073516845703125, 0.21338462829589844, 0.21941757202148438, 0.2254505157470703, 0.23148345947265625, 0.2375164031982422, 0.24354934692382812, 0.24958229064941406, 0.255615234375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 18.0, 45.0, 61.0, 143.0, 177.0, 196.0, 155.0, 102.0, 44.0, 29.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.593125581741333, -2.4704627990722656, -2.3478000164031982, -2.225137233734131, -2.1024744510650635, -1.979811668395996, -1.8571490049362183, -1.7344862222671509, -1.6118234395980835, -1.4891606569290161, -1.3664978742599487, -1.243835210800171, -1.1211724281311035, -0.9985095858573914, -0.8758468627929688, -0.7531840801239014, -0.630521297454834, -0.5078585147857666, -0.3851957619190216, -0.2625330090522766, -0.13987022638320923, -0.017207443714141846, 0.10545527935028076, 0.22811806201934814, 0.3507808446884155, 0.4734436273574829, 0.5961064100265503, 0.7187691330909729, 0.8414319157600403, 0.9640946984291077, 1.0867574214935303, 1.2094202041625977, 1.332082748413086, 1.4547455310821533, 1.5774083137512207, 1.700071096420288, 1.8227338790893555, 1.9453966617584229, 2.0680594444274902, 2.1907219886779785, 2.313385009765625, 2.4360477924346924, 2.5587105751037598, 2.681373357772827, 2.8040361404418945, 2.926698923110962, 3.0493617057800293, 3.1720242500305176, 3.294687032699585, 3.4173498153686523, 3.5400125980377197, 3.662675380706787, 3.7853381633758545, 3.908000946044922, 4.03066349029541, 4.153326511383057, 4.275989055633545, 4.398651599884033, 4.52131462097168, 4.643977165222168, 4.7666401863098145, 4.889302730560303, 5.011965751647949, 5.1346282958984375, 5.257291316986084]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 5.0, 15.0, 14.0, 20.0, 19.0, 26.0, 23.0, 23.0, 28.0, 30.0, 33.0, 41.0, 38.0, 50.0, 47.0, 38.0, 37.0, 48.0, 45.0, 35.0, 30.0, 33.0, 38.0, 34.0, 29.0, 34.0, 24.0, 26.0, 18.0, 23.0, 18.0, 15.0, 10.0, 12.0, 8.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0123181343078613, -1.9492347240447998, -1.8861511945724487, -1.8230676651000977, -1.7599842548370361, -1.6969008445739746, -1.6338173151016235, -1.5707337856292725, -1.507650375366211, -1.4445669651031494, -1.3814834356307983, -1.3183999061584473, -1.2553164958953857, -1.1922330856323242, -1.1291495561599731, -1.066066026687622, -1.0029826164245605, -0.9398991465568542, -0.876815676689148, -0.8137322068214417, -0.7506487369537354, -0.687565267086029, -0.6244817972183228, -0.5613983273506165, -0.49831485748291016, -0.43523138761520386, -0.37214791774749756, -0.30906444787979126, -0.24598097801208496, -0.18289750814437866, -0.11981403827667236, -0.056730568408966064, 0.006352901458740234, 0.06943637132644653, 0.13251984119415283, 0.19560331106185913, 0.25868678092956543, 0.32177025079727173, 0.384853720664978, 0.4479371905326843, 0.5110206604003906, 0.5741041302680969, 0.6371876001358032, 0.7002710700035095, 0.7633545398712158, 0.8264380097389221, 0.8895214796066284, 0.9526049494743347, 1.015688419342041, 1.0787718296051025, 1.1418553590774536, 1.2049388885498047, 1.2680222988128662, 1.3311057090759277, 1.3941892385482788, 1.4572727680206299, 1.5203561782836914, 1.583439588546753, 1.646523118019104, 1.709606647491455, 1.7726900577545166, 1.8357734680175781, 1.8988569974899292, 1.9619405269622803, 2.025023937225342]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 4.0, 10.0, 10.0, 21.0, 24.0, 46.0, 52.0, 71.0, 123.0, 175.0, 241.0, 384.0, 654.0, 1002.0, 1757.0, 3533.0, 8381.0, 29531.0, 210290.0, 2300380.0, 1490467.0, 114513.0, 19160.0, 6414.0, 2911.0, 1518.0, 907.0, 557.0, 368.0, 211.0, 147.0, 129.0, 81.0, 64.0, 31.0, 26.0, 19.0, 14.0, 16.0, 4.0, 10.0, 6.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.048828125, -1.0112152099609375, -0.973602294921875, -0.9359893798828125, -0.89837646484375, -0.8607635498046875, -0.823150634765625, -0.7855377197265625, -0.7479248046875, -0.7103118896484375, -0.672698974609375, -0.6350860595703125, -0.59747314453125, -0.5598602294921875, -0.522247314453125, -0.4846343994140625, -0.447021484375, -0.4094085693359375, -0.371795654296875, -0.3341827392578125, -0.29656982421875, -0.2589569091796875, -0.221343994140625, -0.1837310791015625, -0.1461181640625, -0.1085052490234375, -0.070892333984375, -0.0332794189453125, 0.00433349609375, 0.0419464111328125, 0.079559326171875, 0.1171722412109375, 0.15478515625, 0.1923980712890625, 0.230010986328125, 0.2676239013671875, 0.30523681640625, 0.3428497314453125, 0.380462646484375, 0.4180755615234375, 0.4556884765625, 0.4933013916015625, 0.530914306640625, 0.5685272216796875, 0.60614013671875, 0.6437530517578125, 0.681365966796875, 0.7189788818359375, 0.756591796875, 0.7942047119140625, 0.831817626953125, 0.8694305419921875, 0.90704345703125, 0.9446563720703125, 0.982269287109375, 1.0198822021484375, 1.0574951171875, 1.0951080322265625, 1.132720947265625, 1.1703338623046875, 1.20794677734375, 1.2455596923828125, 1.283172607421875, 1.3207855224609375, 1.3583984375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 13.0, 17.0, 13.0, 18.0, 20.0, 32.0, 37.0, 33.0, 38.0, 28.0, 50.0, 53.0, 58.0, 52.0, 48.0, 37.0, 57.0, 60.0, 37.0, 42.0, 31.0, 30.0, 20.0, 22.0, 25.0, 16.0, 16.0, 12.0, 11.0, 9.0, 7.0, 8.0, 7.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59814453125, -0.5762481689453125, -0.554351806640625, -0.5324554443359375, -0.51055908203125, -0.4886627197265625, -0.466766357421875, -0.4448699951171875, -0.4229736328125, -0.4010772705078125, -0.379180908203125, -0.3572845458984375, -0.33538818359375, -0.3134918212890625, -0.291595458984375, -0.2696990966796875, -0.247802734375, -0.2259063720703125, -0.204010009765625, -0.1821136474609375, -0.16021728515625, -0.1383209228515625, -0.116424560546875, -0.0945281982421875, -0.0726318359375, -0.0507354736328125, -0.028839111328125, -0.0069427490234375, 0.01495361328125, 0.0368499755859375, 0.058746337890625, 0.0806427001953125, 0.1025390625, 0.1244354248046875, 0.146331787109375, 0.1682281494140625, 0.19012451171875, 0.2120208740234375, 0.233917236328125, 0.2558135986328125, 0.2777099609375, 0.2996063232421875, 0.321502685546875, 0.3433990478515625, 0.36529541015625, 0.3871917724609375, 0.409088134765625, 0.4309844970703125, 0.452880859375, 0.4747772216796875, 0.496673583984375, 0.5185699462890625, 0.54046630859375, 0.5623626708984375, 0.584259033203125, 0.6061553955078125, 0.6280517578125, 0.6499481201171875, 0.671844482421875, 0.6937408447265625, 0.71563720703125, 0.7375335693359375, 0.759429931640625, 0.7813262939453125, 0.80322265625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 9.0, 13.0, 19.0, 23.0, 33.0, 50.0, 75.0, 128.0, 209.0, 348.0, 745.0, 1801.0, 5216.0, 22520.0, 324694.0, 3718928.0, 99772.0, 13202.0, 3651.0, 1314.0, 648.0, 318.0, 182.0, 114.0, 74.0, 49.0, 40.0, 26.0, 18.0, 13.0, 11.0, 8.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.455078125, -2.3910369873046875, -2.326995849609375, -2.2629547119140625, -2.19891357421875, -2.1348724365234375, -2.070831298828125, -2.0067901611328125, -1.9427490234375, -1.8787078857421875, -1.814666748046875, -1.7506256103515625, -1.68658447265625, -1.6225433349609375, -1.558502197265625, -1.4944610595703125, -1.430419921875, -1.3663787841796875, -1.302337646484375, -1.2382965087890625, -1.17425537109375, -1.1102142333984375, -1.046173095703125, -0.9821319580078125, -0.9180908203125, -0.8540496826171875, -0.790008544921875, -0.7259674072265625, -0.66192626953125, -0.5978851318359375, -0.533843994140625, -0.4698028564453125, -0.40576171875, -0.3417205810546875, -0.277679443359375, -0.2136383056640625, -0.14959716796875, -0.0855560302734375, -0.021514892578125, 0.0425262451171875, 0.1065673828125, 0.1706085205078125, 0.234649658203125, 0.2986907958984375, 0.36273193359375, 0.4267730712890625, 0.490814208984375, 0.5548553466796875, 0.618896484375, 0.6829376220703125, 0.746978759765625, 0.8110198974609375, 0.87506103515625, 0.9391021728515625, 1.003143310546875, 1.0671844482421875, 1.1312255859375, 1.1952667236328125, 1.259307861328125, 1.3233489990234375, 1.38739013671875, 1.4514312744140625, 1.515472412109375, 1.5795135498046875, 1.6435546875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 4.0, 6.0, 15.0, 12.0, 28.0, 23.0, 57.0, 100.0, 228.0, 559.0, 1029.0, 1063.0, 529.0, 211.0, 83.0, 48.0, 21.0, 16.0, 9.0, 6.0, 8.0, 7.0, 3.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5243911743164062, -0.5033721923828125, -0.48235321044921875, -0.461334228515625, -0.44031524658203125, -0.4192962646484375, -0.39827728271484375, -0.37725830078125, -0.35623931884765625, -0.3352203369140625, -0.31420135498046875, -0.293182373046875, -0.27216339111328125, -0.2511444091796875, -0.23012542724609375, -0.2091064453125, -0.18808746337890625, -0.1670684814453125, -0.14604949951171875, -0.125030517578125, -0.10401153564453125, -0.0829925537109375, -0.06197357177734375, -0.04095458984375, -0.01993560791015625, 0.0010833740234375, 0.02210235595703125, 0.043121337890625, 0.06414031982421875, 0.0851593017578125, 0.10617828369140625, 0.127197265625, 0.14821624755859375, 0.1692352294921875, 0.19025421142578125, 0.211273193359375, 0.23229217529296875, 0.2533111572265625, 0.27433013916015625, 0.29534912109375, 0.31636810302734375, 0.3373870849609375, 0.35840606689453125, 0.379425048828125, 0.40044403076171875, 0.4214630126953125, 0.44248199462890625, 0.4635009765625, 0.48451995849609375, 0.5055389404296875, 0.5265579223632812, 0.547576904296875, 0.5685958862304688, 0.5896148681640625, 0.6106338500976562, 0.63165283203125, 0.6526718139648438, 0.6736907958984375, 0.6947097778320312, 0.715728759765625, 0.7367477416992188, 0.7577667236328125, 0.7787857055664062, 0.7998046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 10.0, 21.0, 30.0, 55.0, 113.0, 145.0, 172.0, 177.0, 111.0, 72.0, 45.0, 22.0, 11.0, 10.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.555267333984375, -3.479269504547119, -3.4032719135284424, -3.3272740840911865, -3.2512762546539307, -3.175278425216675, -3.099280834197998, -3.023283004760742, -2.9472851753234863, -2.8712873458862305, -2.7952897548675537, -2.719291925430298, -2.643294095993042, -2.567296266555786, -2.4912986755371094, -2.4153008460998535, -2.3393030166625977, -2.263305187225342, -2.187307596206665, -2.111309766769409, -2.0353119373321533, -1.959314227104187, -1.8833165168762207, -1.8073186874389648, -1.731321096420288, -1.6553233861923218, -1.579325556755066, -1.5033278465270996, -1.4273300170898438, -1.3513323068618774, -1.2753345966339111, -1.1993367671966553, -1.123339056968689, -1.0473413467407227, -0.9713435173034668, -0.8953458070755005, -0.8193479776382446, -0.7433502674102783, -0.6673524975776672, -0.5913547277450562, -0.5153569579124451, -0.439359188079834, -0.3633614182472229, -0.2873636782169342, -0.21136590838432312, -0.13536813855171204, -0.05937039852142334, 0.016627371311187744, 0.09262514114379883, 0.1686229109764099, 0.2446206659078598, 0.3206184208393097, 0.3966161906719208, 0.47261396050453186, 0.5486117005348206, 0.6246094703674316, 0.7006072402000427, 0.7766050100326538, 0.8526027798652649, 0.928600549697876, 1.0045982599258423, 1.0805960893630981, 1.1565937995910645, 1.2325916290283203, 1.3085893392562866]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 11.0, 10.0, 14.0, 20.0, 13.0, 13.0, 28.0, 20.0, 22.0, 38.0, 46.0, 45.0, 49.0, 52.0, 56.0, 51.0, 36.0, 41.0, 40.0, 44.0, 45.0, 44.0, 35.0, 40.0, 22.0, 27.0, 23.0, 14.0, 19.0, 18.0, 14.0, 10.0, 5.0, 4.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.9607695937156677, -0.9340108036994934, -0.9072520732879639, -0.8804932832717896, -0.8537344932556152, -0.8269757032394409, -0.8002169728279114, -0.7734581828117371, -0.7466993927955627, -0.7199406027793884, -0.6931818723678589, -0.6664230823516846, -0.6396642923355103, -0.6129055023193359, -0.5861467719078064, -0.5593879818916321, -0.5326292514801025, -0.5058704614639282, -0.4791117012500763, -0.45235294103622437, -0.42559415102005005, -0.3988353908061981, -0.3720766305923462, -0.3453178405761719, -0.31855905055999756, -0.29180029034614563, -0.2650415003299713, -0.23828274011611938, -0.21152395009994507, -0.18476518988609314, -0.15800641477108002, -0.1312476396560669, -0.10448884963989258, -0.07773007452487946, -0.05097130313515663, -0.024212531745433807, 0.002546243369579315, 0.02930501103401184, 0.05606378614902496, 0.08282256126403809, 0.10958133637905121, 0.13634011149406433, 0.16309888660907745, 0.18985766172409058, 0.2166164219379425, 0.24337519705295563, 0.27013397216796875, 0.29689276218414307, 0.323651522397995, 0.3504102826118469, 0.37716907262802124, 0.40392783284187317, 0.4306866228580475, 0.4574453830718994, 0.48420417308807373, 0.510962963104248, 0.5377216935157776, 0.5644804835319519, 0.5912392139434814, 0.6179980039596558, 0.6447567939758301, 0.6715155839920044, 0.6982743144035339, 0.7250331044197083, 0.7517918944358826]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 0.0, 3.0, 7.0, 6.0, 13.0, 13.0, 34.0, 35.0, 64.0, 108.0, 222.0, 436.0, 931.0, 1925.0, 4449.0, 11608.0, 50814.0, 578495.0, 350101.0, 33243.0, 9163.0, 3667.0, 1647.0, 734.0, 352.0, 202.0, 127.0, 53.0, 33.0, 22.0, 12.0, 17.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.389617919921875, -0.37396240234375, -0.358306884765625, -0.3426513671875, -0.326995849609375, -0.31134033203125, -0.295684814453125, -0.280029296875, -0.264373779296875, -0.24871826171875, -0.233062744140625, -0.2174072265625, -0.201751708984375, -0.18609619140625, -0.170440673828125, -0.15478515625, -0.139129638671875, -0.12347412109375, -0.107818603515625, -0.0921630859375, -0.076507568359375, -0.06085205078125, -0.045196533203125, -0.029541015625, -0.013885498046875, 0.00177001953125, 0.017425537109375, 0.0330810546875, 0.048736572265625, 0.06439208984375, 0.080047607421875, 0.095703125, 0.111358642578125, 0.12701416015625, 0.142669677734375, 0.1583251953125, 0.173980712890625, 0.18963623046875, 0.205291748046875, 0.220947265625, 0.236602783203125, 0.25225830078125, 0.267913818359375, 0.2835693359375, 0.299224853515625, 0.31488037109375, 0.330535888671875, 0.34619140625, 0.361846923828125, 0.37750244140625, 0.393157958984375, 0.4088134765625, 0.424468994140625, 0.44012451171875, 0.455780029296875, 0.471435546875, 0.487091064453125, 0.50274658203125, 0.518402099609375, 0.5340576171875, 0.549713134765625, 0.56536865234375, 0.581024169921875, 0.5966796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 0.0, 4.0, 3.0, 8.0, 4.0, 16.0, 14.0, 16.0, 22.0, 22.0, 28.0, 33.0, 40.0, 47.0, 55.0, 64.0, 44.0, 48.0, 53.0, 52.0, 62.0, 53.0, 57.0, 48.0, 36.0, 31.0, 23.0, 22.0, 21.0, 14.0, 18.0, 11.0, 5.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.68310546875, -0.6649665832519531, -0.6468276977539062, -0.6286888122558594, -0.6105499267578125, -0.5924110412597656, -0.5742721557617188, -0.5561332702636719, -0.537994384765625, -0.5198554992675781, -0.5017166137695312, -0.4835777282714844, -0.4654388427734375, -0.4472999572753906, -0.42916107177734375, -0.4110221862792969, -0.39288330078125, -0.3747444152832031, -0.35660552978515625, -0.3384666442871094, -0.3203277587890625, -0.3021888732910156, -0.28404998779296875, -0.2659111022949219, -0.247772216796875, -0.22963333129882812, -0.21149444580078125, -0.19335556030273438, -0.1752166748046875, -0.15707778930664062, -0.13893890380859375, -0.12080001831054688, -0.1026611328125, -0.08452224731445312, -0.06638336181640625, -0.048244476318359375, -0.0301055908203125, -0.011966705322265625, 0.00617218017578125, 0.024311065673828125, 0.042449951171875, 0.060588836669921875, 0.07872772216796875, 0.09686660766601562, 0.1150054931640625, 0.13314437866210938, 0.15128326416015625, 0.16942214965820312, 0.18756103515625, 0.20569992065429688, 0.22383880615234375, 0.24197769165039062, 0.2601165771484375, 0.2782554626464844, 0.29639434814453125, 0.3145332336425781, 0.332672119140625, 0.3508110046386719, 0.36894989013671875, 0.3870887756347656, 0.4052276611328125, 0.4233665466308594, 0.44150543212890625, 0.4596443176269531, 0.477783203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 20.0, 23.0, 17.0, 30.0, 39.0, 67.0, 116.0, 155.0, 225.0, 415.0, 654.0, 1108.0, 1925.0, 3547.0, 6771.0, 14688.0, 40185.0, 139074.0, 411374.0, 296270.0, 82834.0, 26318.0, 10687.0, 5323.0, 2692.0, 1526.0, 907.0, 518.0, 350.0, 221.0, 153.0, 89.0, 70.0, 48.0, 34.0, 15.0, 16.0, 10.0, 3.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0], "bins": [-0.1866455078125, -0.18143272399902344, -0.17621994018554688, -0.1710071563720703, -0.16579437255859375, -0.1605815887451172, -0.15536880493164062, -0.15015602111816406, -0.1449432373046875, -0.13973045349121094, -0.13451766967773438, -0.1293048858642578, -0.12409210205078125, -0.11887931823730469, -0.11366653442382812, -0.10845375061035156, -0.103240966796875, -0.09802818298339844, -0.09281539916992188, -0.08760261535644531, -0.08238983154296875, -0.07717704772949219, -0.07196426391601562, -0.06675148010253906, -0.0615386962890625, -0.05632591247558594, -0.051113128662109375, -0.04590034484863281, -0.04068756103515625, -0.03547477722167969, -0.030261993408203125, -0.025049209594726562, -0.01983642578125, -0.014623641967773438, -0.009410858154296875, -0.0041980743408203125, 0.00101470947265625, 0.0062274932861328125, 0.011440277099609375, 0.016653060913085938, 0.0218658447265625, 0.027078628540039062, 0.032291412353515625, 0.03750419616699219, 0.04271697998046875, 0.04792976379394531, 0.053142547607421875, 0.05835533142089844, 0.063568115234375, 0.06878089904785156, 0.07399368286132812, 0.07920646667480469, 0.08441925048828125, 0.08963203430175781, 0.09484481811523438, 0.10005760192871094, 0.1052703857421875, 0.11048316955566406, 0.11569595336914062, 0.12090873718261719, 0.12612152099609375, 0.1313343048095703, 0.13654708862304688, 0.14175987243652344, 0.14697265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 15.0, 21.0, 20.0, 18.0, 18.0, 21.0, 30.0, 35.0, 33.0, 53.0, 55.0, 49.0, 45.0, 53.0, 54.0, 46.0, 41.0, 42.0, 41.0, 29.0, 29.0, 34.0, 29.0, 24.0, 26.0, 15.0, 18.0, 11.0, 12.0, 7.0, 10.0, 9.0, 7.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8232421875, -0.79400634765625, -0.7647705078125, -0.73553466796875, -0.706298828125, -0.67706298828125, -0.6478271484375, -0.61859130859375, -0.58935546875, -0.56011962890625, -0.5308837890625, -0.50164794921875, -0.472412109375, -0.44317626953125, -0.4139404296875, -0.38470458984375, -0.35546875, -0.32623291015625, -0.2969970703125, -0.26776123046875, -0.238525390625, -0.20928955078125, -0.1800537109375, -0.15081787109375, -0.12158203125, -0.09234619140625, -0.0631103515625, -0.03387451171875, -0.004638671875, 0.02459716796875, 0.0538330078125, 0.08306884765625, 0.1123046875, 0.14154052734375, 0.1707763671875, 0.20001220703125, 0.229248046875, 0.25848388671875, 0.2877197265625, 0.31695556640625, 0.34619140625, 0.37542724609375, 0.4046630859375, 0.43389892578125, 0.463134765625, 0.49237060546875, 0.5216064453125, 0.55084228515625, 0.580078125, 0.60931396484375, 0.6385498046875, 0.66778564453125, 0.697021484375, 0.72625732421875, 0.7554931640625, 0.78472900390625, 0.81396484375, 0.84320068359375, 0.8724365234375, 0.90167236328125, 0.930908203125, 0.96014404296875, 0.9893798828125, 1.01861572265625, 1.0478515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 10.0, 12.0, 24.0, 47.0, 94.0, 171.0, 395.0, 891.0, 2400.0, 7796.0, 38238.0, 383037.0, 545593.0, 55090.0, 9898.0, 2934.0, 1036.0, 444.0, 220.0, 93.0, 59.0, 22.0, 24.0, 12.0, 5.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09906005859375, -0.09526348114013672, -0.09146690368652344, -0.08767032623291016, -0.08387374877929688, -0.0800771713256836, -0.07628059387207031, -0.07248401641845703, -0.06868743896484375, -0.06489086151123047, -0.06109428405761719, -0.057297706604003906, -0.053501129150390625, -0.049704551696777344, -0.04590797424316406, -0.04211139678955078, -0.0383148193359375, -0.03451824188232422, -0.030721664428710938, -0.026925086975097656, -0.023128509521484375, -0.019331932067871094, -0.015535354614257812, -0.011738777160644531, -0.00794219970703125, -0.004145622253417969, -0.0003490447998046875, 0.0034475326538085938, 0.007244110107421875, 0.011040687561035156, 0.014837265014648438, 0.01863384246826172, 0.022430419921875, 0.02622699737548828, 0.030023574829101562, 0.033820152282714844, 0.037616729736328125, 0.041413307189941406, 0.04520988464355469, 0.04900646209716797, 0.05280303955078125, 0.05659961700439453, 0.06039619445800781, 0.0641927719116211, 0.06798934936523438, 0.07178592681884766, 0.07558250427246094, 0.07937908172607422, 0.0831756591796875, 0.08697223663330078, 0.09076881408691406, 0.09456539154052734, 0.09836196899414062, 0.1021585464477539, 0.10595512390136719, 0.10975170135498047, 0.11354827880859375, 0.11734485626220703, 0.12114143371582031, 0.1249380111694336, 0.12873458862304688, 0.13253116607666016, 0.13632774353027344, 0.14012432098388672, 0.1439208984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 9.0, 6.0, 18.0, 17.0, 46.0, 69.0, 166.0, 222.0, 203.0, 103.0, 55.0, 33.0, 24.0, 12.0, 2.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.936094284057617e-05, -9.67998057603836e-05, -9.423866868019104e-05, -9.167753159999847e-05, -8.911639451980591e-05, -8.655525743961334e-05, -8.399412035942078e-05, -8.143298327922821e-05, -7.887184619903564e-05, -7.631070911884308e-05, -7.374957203865051e-05, -7.118843495845795e-05, -6.862729787826538e-05, -6.606616079807281e-05, -6.350502371788025e-05, -6.094388663768768e-05, -5.838274955749512e-05, -5.582161247730255e-05, -5.3260475397109985e-05, -5.069933831691742e-05, -4.8138201236724854e-05, -4.557706415653229e-05, -4.301592707633972e-05, -4.0454789996147156e-05, -3.789365291595459e-05, -3.5332515835762024e-05, -3.277137875556946e-05, -3.0210241675376892e-05, -2.7649104595184326e-05, -2.508796751499176e-05, -2.2526830434799194e-05, -1.996569335460663e-05, -1.7404556274414062e-05, -1.4843419194221497e-05, -1.228228211402893e-05, -9.721145033836365e-06, -7.160007953643799e-06, -4.598870873451233e-06, -2.037733793258667e-06, 5.234032869338989e-07, 3.084540367126465e-06, 5.645677447319031e-06, 8.206814527511597e-06, 1.0767951607704163e-05, 1.3329088687896729e-05, 1.5890225768089294e-05, 1.845136284828186e-05, 2.1012499928474426e-05, 2.3573637008666992e-05, 2.6134774088859558e-05, 2.8695911169052124e-05, 3.125704824924469e-05, 3.3818185329437256e-05, 3.637932240962982e-05, 3.894045948982239e-05, 4.1501596570014954e-05, 4.406273365020752e-05, 4.6623870730400085e-05, 4.918500781059265e-05, 5.174614489078522e-05, 5.430728197097778e-05, 5.686841905117035e-05, 5.9429556131362915e-05, 6.199069321155548e-05, 6.455183029174805e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 6.0, 16.0, 35.0, 44.0, 76.0, 151.0, 255.0, 530.0, 1037.0, 2539.0, 6975.0, 22303.0, 94417.0, 476392.0, 352882.0, 64707.0, 16814.0, 5426.0, 2060.0, 893.0, 444.0, 236.0, 137.0, 59.0, 36.0, 23.0, 17.0, 14.0, 7.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.12469863891601562, -0.12122344970703125, -0.11774826049804688, -0.1142730712890625, -0.11079788208007812, -0.10732269287109375, -0.10384750366210938, -0.100372314453125, -0.09689712524414062, -0.09342193603515625, -0.08994674682617188, -0.0864715576171875, -0.08299636840820312, -0.07952117919921875, -0.07604598999023438, -0.07257080078125, -0.06909561157226562, -0.06562042236328125, -0.062145233154296875, -0.0586700439453125, -0.055194854736328125, -0.05171966552734375, -0.048244476318359375, -0.044769287109375, -0.041294097900390625, -0.03781890869140625, -0.034343719482421875, -0.0308685302734375, -0.027393341064453125, -0.02391815185546875, -0.020442962646484375, -0.0169677734375, -0.013492584228515625, -0.01001739501953125, -0.006542205810546875, -0.0030670166015625, 0.000408172607421875, 0.00388336181640625, 0.007358551025390625, 0.010833740234375, 0.014308929443359375, 0.01778411865234375, 0.021259307861328125, 0.0247344970703125, 0.028209686279296875, 0.03168487548828125, 0.035160064697265625, 0.03863525390625, 0.042110443115234375, 0.04558563232421875, 0.049060821533203125, 0.0525360107421875, 0.056011199951171875, 0.05948638916015625, 0.06296157836914062, 0.066436767578125, 0.06991195678710938, 0.07338714599609375, 0.07686233520507812, 0.0803375244140625, 0.08381271362304688, 0.08728790283203125, 0.09076309204101562, 0.09423828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 5.0, 8.0, 9.0, 18.0, 18.0, 27.0, 49.0, 51.0, 90.0, 82.0, 115.0, 98.0, 117.0, 75.0, 59.0, 43.0, 37.0, 28.0, 11.0, 9.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244598388671875, -0.023560762405395508, -0.022661685943603516, -0.021762609481811523, -0.02086353302001953, -0.01996445655822754, -0.019065380096435547, -0.018166303634643555, -0.017267227172851562, -0.01636815071105957, -0.015469074249267578, -0.014569997787475586, -0.013670921325683594, -0.012771844863891602, -0.01187276840209961, -0.010973691940307617, -0.010074615478515625, -0.009175539016723633, -0.00827646255493164, -0.0073773860931396484, -0.006478309631347656, -0.005579233169555664, -0.004680156707763672, -0.0037810802459716797, -0.0028820037841796875, -0.0019829273223876953, -0.0010838508605957031, -0.00018477439880371094, 0.0007143020629882812, 0.0016133785247802734, 0.0025124549865722656, 0.003411531448364258, 0.00431060791015625, 0.005209684371948242, 0.006108760833740234, 0.0070078372955322266, 0.007906913757324219, 0.008805990219116211, 0.009705066680908203, 0.010604143142700195, 0.011503219604492188, 0.01240229606628418, 0.013301372528076172, 0.014200448989868164, 0.015099525451660156, 0.01599860191345215, 0.01689767837524414, 0.017796754837036133, 0.018695831298828125, 0.019594907760620117, 0.02049398422241211, 0.0213930606842041, 0.022292137145996094, 0.023191213607788086, 0.024090290069580078, 0.02498936653137207, 0.025888442993164062, 0.026787519454956055, 0.027686595916748047, 0.02858567237854004, 0.02948474884033203, 0.030383825302124023, 0.031282901763916016, 0.03218197822570801, 0.0330810546875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 14.0, 19.0, 28.0, 60.0, 94.0, 130.0, 158.0, 168.0, 126.0, 73.0, 56.0, 28.0, 17.0, 9.0, 5.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6006691455841064, -1.5624265670776367, -1.5241841077804565, -1.4859415292739868, -1.447698950767517, -1.4094563722610474, -1.3712139129638672, -1.3329713344573975, -1.2947287559509277, -1.256486177444458, -1.2182437181472778, -1.180001139640808, -1.1417585611343384, -1.1035159826278687, -1.0652735233306885, -1.0270309448242188, -0.9887884259223938, -0.9505459070205688, -0.9123033285140991, -0.8740608096122742, -0.8358182311058044, -0.7975757122039795, -0.7593331336975098, -0.7210906147956848, -0.6828480958938599, -0.6446055769920349, -0.6063629984855652, -0.5681204795837402, -0.5298779010772705, -0.49163538217544556, -0.4533928334712982, -0.4151502847671509, -0.3769076466560364, -0.33866509795188904, -0.3004225492477417, -0.26218003034591675, -0.22393746674060822, -0.18569491803646088, -0.14745238423347473, -0.10920983552932739, -0.07096728682518005, -0.03272474184632301, 0.005517803132534027, 0.04376034438610077, 0.08200289309024811, 0.12024544179439545, 0.1584879755973816, 0.19673052430152893, 0.23497307300567627, 0.2732156217098236, 0.31145817041397095, 0.3497006893157959, 0.3879432678222656, 0.4261857867240906, 0.4644283354282379, 0.5026708841323853, 0.540913462638855, 0.5791559815406799, 0.6173985600471497, 0.6556410789489746, 0.6938836574554443, 0.7321261763572693, 0.7703686952590942, 0.808611273765564, 0.8468537926673889]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 8.0, 8.0, 6.0, 19.0, 13.0, 17.0, 19.0, 17.0, 34.0, 30.0, 42.0, 48.0, 49.0, 54.0, 61.0, 51.0, 41.0, 52.0, 44.0, 54.0, 51.0, 39.0, 42.0, 34.0, 35.0, 23.0, 19.0, 21.0, 19.0, 9.0, 6.0, 5.0, 5.0, 4.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6077475547790527, -0.5911387801170349, -0.5745299458503723, -0.5579211711883545, -0.5413123369216919, -0.5247035622596741, -0.5080947875976562, -0.49148598313331604, -0.47487717866897583, -0.4582683742046356, -0.4416595697402954, -0.4250507950782776, -0.4084419906139374, -0.39183318614959717, -0.37522441148757935, -0.35861560702323914, -0.3420068025588989, -0.3253979980945587, -0.3087891936302185, -0.2921804189682007, -0.2755716145038605, -0.25896281003952026, -0.24235402047634125, -0.22574523091316223, -0.20913642644882202, -0.1925276219844818, -0.1759188324213028, -0.15931004285812378, -0.14270123839378357, -0.12609243392944336, -0.10948364436626434, -0.09287484735250473, -0.07626610994338989, -0.05965731292963028, -0.043048515915870667, -0.026439718902111053, -0.00983092188835144, 0.006777875125408173, 0.023386672139167786, 0.0399954691529274, 0.05660426616668701, 0.07321306318044662, 0.08982186019420624, 0.10643065720796585, 0.12303945422172546, 0.13964825868606567, 0.1562570482492447, 0.1728658378124237, 0.18947464227676392, 0.20608344674110413, 0.22269223630428314, 0.23930102586746216, 0.25590983033180237, 0.2725186347961426, 0.2891274094581604, 0.3057362139225006, 0.3223450183868408, 0.33895382285118103, 0.35556262731552124, 0.37217140197753906, 0.3887802064418793, 0.4053890109062195, 0.4219977855682373, 0.4386065900325775, 0.4552153944969177]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 21.0, 26.0, 41.0, 80.0, 161.0, 270.0, 565.0, 1143.0, 2494.0, 6392.0, 20757.0, 103645.0, 589174.0, 264020.0, 41895.0, 10759.0, 3826.0, 1621.0, 781.0, 408.0, 179.0, 102.0, 66.0, 45.0, 23.0, 16.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7534408569335938, -0.7241668701171875, -0.6948928833007812, -0.665618896484375, -0.6363449096679688, -0.6070709228515625, -0.5777969360351562, -0.54852294921875, -0.5192489624023438, -0.4899749755859375, -0.46070098876953125, -0.431427001953125, -0.40215301513671875, -0.3728790283203125, -0.34360504150390625, -0.3143310546875, -0.28505706787109375, -0.2557830810546875, -0.22650909423828125, -0.197235107421875, -0.16796112060546875, -0.1386871337890625, -0.10941314697265625, -0.08013916015625, -0.05086517333984375, -0.0215911865234375, 0.00768280029296875, 0.036956787109375, 0.06623077392578125, 0.0955047607421875, 0.12477874755859375, 0.154052734375, 0.18332672119140625, 0.2126007080078125, 0.24187469482421875, 0.271148681640625, 0.30042266845703125, 0.3296966552734375, 0.35897064208984375, 0.38824462890625, 0.41751861572265625, 0.4467926025390625, 0.47606658935546875, 0.505340576171875, 0.5346145629882812, 0.5638885498046875, 0.5931625366210938, 0.6224365234375, 0.6517105102539062, 0.6809844970703125, 0.7102584838867188, 0.739532470703125, 0.7688064575195312, 0.7980804443359375, 0.8273544311523438, 0.85662841796875, 0.8859024047851562, 0.9151763916015625, 0.9444503784179688, 0.973724365234375, 1.0029983520507812, 1.0322723388671875, 1.0615463256835938, 1.0908203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 13.0, 10.0, 25.0, 22.0, 25.0, 41.0, 27.0, 52.0, 59.0, 76.0, 72.0, 65.0, 78.0, 64.0, 67.0, 60.0, 43.0, 41.0, 44.0, 27.0, 21.0, 21.0, 14.0, 8.0, 5.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7900390625, -1.7443389892578125, -1.698638916015625, -1.6529388427734375, -1.60723876953125, -1.5615386962890625, -1.515838623046875, -1.4701385498046875, -1.4244384765625, -1.3787384033203125, -1.333038330078125, -1.2873382568359375, -1.24163818359375, -1.1959381103515625, -1.150238037109375, -1.1045379638671875, -1.058837890625, -1.0131378173828125, -0.967437744140625, -0.9217376708984375, -0.87603759765625, -0.8303375244140625, -0.784637451171875, -0.7389373779296875, -0.6932373046875, -0.6475372314453125, -0.601837158203125, -0.5561370849609375, -0.51043701171875, -0.4647369384765625, -0.419036865234375, -0.3733367919921875, -0.32763671875, -0.2819366455078125, -0.236236572265625, -0.1905364990234375, -0.14483642578125, -0.0991363525390625, -0.053436279296875, -0.0077362060546875, 0.0379638671875, 0.0836639404296875, 0.129364013671875, 0.1750640869140625, 0.22076416015625, 0.2664642333984375, 0.312164306640625, 0.3578643798828125, 0.403564453125, 0.4492645263671875, 0.494964599609375, 0.5406646728515625, 0.58636474609375, 0.6320648193359375, 0.677764892578125, 0.7234649658203125, 0.7691650390625, 0.8148651123046875, 0.860565185546875, 0.9062652587890625, 0.95196533203125, 0.9976654052734375, 1.043365478515625, 1.0890655517578125, 1.134765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 5.0, 11.0, 7.0, 15.0, 14.0, 30.0, 24.0, 33.0, 48.0, 79.0, 90.0, 136.0, 236.0, 448.0, 993.0, 2216.0, 6943.0, 29488.0, 250370.0, 659935.0, 76861.0, 13644.0, 3863.0, 1455.0, 633.0, 344.0, 187.0, 126.0, 76.0, 60.0, 49.0, 38.0, 28.0, 17.0, 17.0, 10.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8524703979492188, -0.8187103271484375, -0.7849502563476562, -0.751190185546875, -0.7174301147460938, -0.6836700439453125, -0.6499099731445312, -0.61614990234375, -0.5823898315429688, -0.5486297607421875, -0.5148696899414062, -0.481109619140625, -0.44734954833984375, -0.4135894775390625, -0.37982940673828125, -0.3460693359375, -0.31230926513671875, -0.2785491943359375, -0.24478912353515625, -0.211029052734375, -0.17726898193359375, -0.1435089111328125, -0.10974884033203125, -0.07598876953125, -0.04222869873046875, -0.0084686279296875, 0.02529144287109375, 0.059051513671875, 0.09281158447265625, 0.1265716552734375, 0.16033172607421875, 0.194091796875, 0.22785186767578125, 0.2616119384765625, 0.29537200927734375, 0.329132080078125, 0.36289215087890625, 0.3966522216796875, 0.43041229248046875, 0.46417236328125, 0.49793243408203125, 0.5316925048828125, 0.5654525756835938, 0.599212646484375, 0.6329727172851562, 0.6667327880859375, 0.7004928588867188, 0.7342529296875, 0.7680130004882812, 0.8017730712890625, 0.8355331420898438, 0.869293212890625, 0.9030532836914062, 0.9368133544921875, 0.9705734252929688, 1.00433349609375, 1.0380935668945312, 1.0718536376953125, 1.1056137084960938, 1.139373779296875, 1.1731338500976562, 1.2068939208984375, 1.2406539916992188, 1.2744140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 17.0, 9.0, 16.0, 13.0, 15.0, 29.0, 14.0, 30.0, 33.0, 32.0, 54.0, 52.0, 53.0, 66.0, 61.0, 56.0, 58.0, 52.0, 50.0, 41.0, 34.0, 32.0, 18.0, 29.0, 19.0, 17.0, 23.0, 12.0, 12.0, 5.0, 7.0, 1.0, 3.0, 7.0, 4.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.30078125, -1.262359619140625, -1.22393798828125, -1.185516357421875, -1.1470947265625, -1.108673095703125, -1.07025146484375, -1.031829833984375, -0.993408203125, -0.954986572265625, -0.91656494140625, -0.878143310546875, -0.8397216796875, -0.801300048828125, -0.76287841796875, -0.724456787109375, -0.68603515625, -0.647613525390625, -0.60919189453125, -0.570770263671875, -0.5323486328125, -0.493927001953125, -0.45550537109375, -0.417083740234375, -0.378662109375, -0.340240478515625, -0.30181884765625, -0.263397216796875, -0.2249755859375, -0.186553955078125, -0.14813232421875, -0.109710693359375, -0.0712890625, -0.032867431640625, 0.00555419921875, 0.043975830078125, 0.0823974609375, 0.120819091796875, 0.15924072265625, 0.197662353515625, 0.236083984375, 0.274505615234375, 0.31292724609375, 0.351348876953125, 0.3897705078125, 0.428192138671875, 0.46661376953125, 0.505035400390625, 0.54345703125, 0.581878662109375, 0.62030029296875, 0.658721923828125, 0.6971435546875, 0.735565185546875, 0.77398681640625, 0.812408447265625, 0.850830078125, 0.889251708984375, 0.92767333984375, 0.966094970703125, 1.0045166015625, 1.042938232421875, 1.08135986328125, 1.119781494140625, 1.158203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 9.0, 10.0, 17.0, 31.0, 36.0, 46.0, 103.0, 233.0, 493.0, 1425.0, 5066.0, 28683.0, 321141.0, 617878.0, 61596.0, 8382.0, 2055.0, 682.0, 317.0, 133.0, 76.0, 49.0, 28.0, 19.0, 8.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.33349609375, -0.324981689453125, -0.31646728515625, -0.307952880859375, -0.2994384765625, -0.290924072265625, -0.28240966796875, -0.273895263671875, -0.265380859375, -0.256866455078125, -0.24835205078125, -0.239837646484375, -0.2313232421875, -0.222808837890625, -0.21429443359375, -0.205780029296875, -0.197265625, -0.188751220703125, -0.18023681640625, -0.171722412109375, -0.1632080078125, -0.154693603515625, -0.14617919921875, -0.137664794921875, -0.129150390625, -0.120635986328125, -0.11212158203125, -0.103607177734375, -0.0950927734375, -0.086578369140625, -0.07806396484375, -0.069549560546875, -0.06103515625, -0.052520751953125, -0.04400634765625, -0.035491943359375, -0.0269775390625, -0.018463134765625, -0.00994873046875, -0.001434326171875, 0.007080078125, 0.015594482421875, 0.02410888671875, 0.032623291015625, 0.0411376953125, 0.049652099609375, 0.05816650390625, 0.066680908203125, 0.0751953125, 0.083709716796875, 0.09222412109375, 0.100738525390625, 0.1092529296875, 0.117767333984375, 0.12628173828125, 0.134796142578125, 0.143310546875, 0.151824951171875, 0.16033935546875, 0.168853759765625, 0.1773681640625, 0.185882568359375, 0.19439697265625, 0.202911376953125, 0.21142578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 6.0, 12.0, 7.0, 20.0, 23.0, 30.0, 50.0, 38.0, 44.0, 72.0, 72.0, 78.0, 78.0, 77.0, 71.0, 48.0, 46.0, 43.0, 29.0, 20.0, 27.0, 18.0, 15.0, 16.0, 12.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7239322662353516e-05, -2.6467256247997284e-05, -2.5695189833641052e-05, -2.492312341928482e-05, -2.415105700492859e-05, -2.3378990590572357e-05, -2.2606924176216125e-05, -2.1834857761859894e-05, -2.1062791347503662e-05, -2.029072493314743e-05, -1.95186585187912e-05, -1.8746592104434967e-05, -1.7974525690078735e-05, -1.7202459275722504e-05, -1.6430392861366272e-05, -1.565832644701004e-05, -1.4886260032653809e-05, -1.4114193618297577e-05, -1.3342127203941345e-05, -1.2570060789585114e-05, -1.1797994375228882e-05, -1.102592796087265e-05, -1.0253861546516418e-05, -9.481795132160187e-06, -8.709728717803955e-06, -7.937662303447723e-06, -7.165595889091492e-06, -6.39352947473526e-06, -5.621463060379028e-06, -4.849396646022797e-06, -4.077330231666565e-06, -3.3052638173103333e-06, -2.5331974029541016e-06, -1.7611309885978699e-06, -9.890645742416382e-07, -2.169981598854065e-07, 5.550682544708252e-07, 1.3271346688270569e-06, 2.0992010831832886e-06, 2.8712674975395203e-06, 3.643333911895752e-06, 4.415400326251984e-06, 5.187466740608215e-06, 5.959533154964447e-06, 6.731599569320679e-06, 7.50366598367691e-06, 8.275732398033142e-06, 9.047798812389374e-06, 9.819865226745605e-06, 1.0591931641101837e-05, 1.1363998055458069e-05, 1.21360644698143e-05, 1.2908130884170532e-05, 1.3680197298526764e-05, 1.4452263712882996e-05, 1.5224330127239227e-05, 1.599639654159546e-05, 1.676846295595169e-05, 1.7540529370307922e-05, 1.8312595784664154e-05, 1.9084662199020386e-05, 1.9856728613376617e-05, 2.062879502773285e-05, 2.140086144208908e-05, 2.2172927856445312e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 7.0, 13.0, 17.0, 40.0, 49.0, 65.0, 96.0, 166.0, 284.0, 396.0, 711.0, 1226.0, 2207.0, 4652.0, 11770.0, 39644.0, 172976.0, 518579.0, 220557.0, 49509.0, 14335.0, 5312.0, 2650.0, 1300.0, 754.0, 459.0, 288.0, 167.0, 109.0, 72.0, 44.0, 33.0, 20.0, 10.0, 8.0, 2.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.181396484375, -0.1752643585205078, -0.16913223266601562, -0.16300010681152344, -0.15686798095703125, -0.15073585510253906, -0.14460372924804688, -0.1384716033935547, -0.1323394775390625, -0.1262073516845703, -0.12007522583007812, -0.11394309997558594, -0.10781097412109375, -0.10167884826660156, -0.09554672241210938, -0.08941459655761719, -0.083282470703125, -0.07715034484863281, -0.07101821899414062, -0.06488609313964844, -0.05875396728515625, -0.05262184143066406, -0.046489715576171875, -0.04035758972167969, -0.0342254638671875, -0.028093338012695312, -0.021961212158203125, -0.015829086303710938, -0.00969696044921875, -0.0035648345947265625, 0.002567291259765625, 0.008699417114257812, 0.01483154296875, 0.020963668823242188, 0.027095794677734375, 0.03322792053222656, 0.03936004638671875, 0.04549217224121094, 0.051624298095703125, 0.05775642395019531, 0.0638885498046875, 0.07002067565917969, 0.07615280151367188, 0.08228492736816406, 0.08841705322265625, 0.09454917907714844, 0.10068130493164062, 0.10681343078613281, 0.112945556640625, 0.11907768249511719, 0.12520980834960938, 0.13134193420410156, 0.13747406005859375, 0.14360618591308594, 0.14973831176757812, 0.1558704376220703, 0.1620025634765625, 0.1681346893310547, 0.17426681518554688, 0.18039894104003906, 0.18653106689453125, 0.19266319274902344, 0.19879531860351562, 0.2049274444580078, 0.2110595703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 10.0, 7.0, 15.0, 15.0, 16.0, 23.0, 28.0, 45.0, 40.0, 61.0, 74.0, 73.0, 78.0, 94.0, 68.0, 57.0, 38.0, 53.0, 38.0, 24.0, 20.0, 26.0, 15.0, 16.0, 17.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08807373046875, -0.08568096160888672, -0.08328819274902344, -0.08089542388916016, -0.07850265502929688, -0.0761098861694336, -0.07371711730957031, -0.07132434844970703, -0.06893157958984375, -0.06653881072998047, -0.06414604187011719, -0.061753273010253906, -0.059360504150390625, -0.056967735290527344, -0.05457496643066406, -0.05218219757080078, -0.0497894287109375, -0.04739665985107422, -0.04500389099121094, -0.042611122131347656, -0.040218353271484375, -0.037825584411621094, -0.03543281555175781, -0.03304004669189453, -0.03064727783203125, -0.02825450897216797, -0.025861740112304688, -0.023468971252441406, -0.021076202392578125, -0.018683433532714844, -0.016290664672851562, -0.013897895812988281, -0.011505126953125, -0.009112358093261719, -0.0067195892333984375, -0.004326820373535156, -0.001934051513671875, 0.00045871734619140625, 0.0028514862060546875, 0.005244255065917969, 0.00763702392578125, 0.010029792785644531, 0.012422561645507812, 0.014815330505371094, 0.017208099365234375, 0.019600868225097656, 0.021993637084960938, 0.02438640594482422, 0.0267791748046875, 0.02917194366455078, 0.03156471252441406, 0.033957481384277344, 0.036350250244140625, 0.038743019104003906, 0.04113578796386719, 0.04352855682373047, 0.04592132568359375, 0.04831409454345703, 0.05070686340332031, 0.053099632263183594, 0.055492401123046875, 0.057885169982910156, 0.06027793884277344, 0.06267070770263672, 0.0650634765625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 11.0, 33.0, 112.0, 261.0, 330.0, 195.0, 47.0, 14.0, 5.0, 6.0], "bins": [-10.385149955749512, -10.206710815429688, -10.028271675109863, -9.849832534790039, -9.671394348144531, -9.492955207824707, -9.314516067504883, -9.136076927185059, -8.957637786865234, -8.77919864654541, -8.600759506225586, -8.422320365905762, -8.243882179260254, -8.06544303894043, -7.8870038986206055, -7.708564758300781, -7.530125617980957, -7.351686477661133, -7.173247814178467, -6.994808673858643, -6.816369533538818, -6.637930393218994, -6.459491729736328, -6.281052589416504, -6.102613925933838, -5.924174785614014, -5.745736122131348, -5.567296981811523, -5.388857841491699, -5.210418701171875, -5.031980037689209, -4.853540897369385, -4.6751017570495605, -4.496662616729736, -4.31822395324707, -4.139784812927246, -3.961345672607422, -3.7829067707061768, -3.6044678688049316, -3.4260287284851074, -3.247589588165283, -3.069150686264038, -2.890711545944214, -2.7122726440429688, -2.5338335037231445, -2.3553946018218994, -2.1769556999206543, -1.99851655960083, -1.8200775384902954, -1.6416385173797607, -1.463199496269226, -1.2847604751586914, -1.1063215732574463, -0.9278824925422668, -0.749443531036377, -0.5710045099258423, -0.3925654888153076, -0.21412648260593414, -0.03568747639656067, 0.1427515149116516, 0.3211905360221863, 0.49962955713272095, 0.6780685186386108, 0.8565075397491455, 1.0349465608596802]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 8.0, 9.0, 10.0, 16.0, 24.0, 12.0, 26.0, 27.0, 22.0, 16.0, 37.0, 33.0, 24.0, 46.0, 33.0, 47.0, 54.0, 35.0, 50.0, 38.0, 29.0, 35.0, 41.0, 49.0, 23.0, 27.0, 31.0, 23.0, 21.0, 29.0, 14.0, 17.0, 13.0, 10.0, 10.0, 8.0, 7.0, 8.0, 10.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7313416004180908, -1.680737853050232, -1.6301339864730835, -1.5795302391052246, -1.5289264917373657, -1.4783227443695068, -1.4277188777923584, -1.3771151304244995, -1.3265113830566406, -1.2759076356887817, -1.2253037691116333, -1.1747000217437744, -1.1240962743759155, -1.0734925270080566, -1.0228886604309082, -0.9722849130630493, -0.9216810464859009, -0.8710772395133972, -0.8204734921455383, -0.7698696851730347, -0.7192659378051758, -0.6686621308326721, -0.6180583238601685, -0.5674545764923096, -0.5168507695198059, -0.46624699234962463, -0.41564321517944336, -0.3650394082069397, -0.3144356310367584, -0.26383185386657715, -0.2132280468940735, -0.1626242697238922, -0.11202049255371094, -0.061416707932949066, -0.010812923312187195, 0.03979086875915527, 0.09039464592933655, 0.14099842309951782, 0.19160223007202148, 0.24220600724220276, 0.29280978441238403, 0.3434135615825653, 0.3940173387527466, 0.44462114572525024, 0.4952249228954315, 0.5458287000656128, 0.5964325070381165, 0.6470363140106201, 0.697640061378479, 0.7482438683509827, 0.7988476157188416, 0.8494514226913452, 0.9000551700592041, 0.9506589770317078, 1.0012627840042114, 1.0518665313720703, 1.1024703979492188, 1.1530741453170776, 1.203678011894226, 1.254281759262085, 1.3048855066299438, 1.3554892539978027, 1.4060931205749512, 1.45669686794281, 1.507300615310669]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 11.0, 13.0, 18.0, 24.0, 32.0, 48.0, 91.0, 137.0, 211.0, 417.0, 849.0, 1644.0, 3578.0, 10609.0, 70164.0, 2287188.0, 1748843.0, 52943.0, 9908.0, 3959.0, 1741.0, 762.0, 457.0, 224.0, 155.0, 82.0, 48.0, 37.0, 20.0, 8.0, 10.0, 10.0, 6.0, 2.0, 0.0, 5.0], "bins": [-2.150390625, -2.1014633178710938, -2.0525360107421875, -2.0036087036132812, -1.954681396484375, -1.9057540893554688, -1.8568267822265625, -1.8078994750976562, -1.75897216796875, -1.7100448608398438, -1.6611175537109375, -1.6121902465820312, -1.563262939453125, -1.5143356323242188, -1.4654083251953125, -1.4164810180664062, -1.3675537109375, -1.3186264038085938, -1.2696990966796875, -1.2207717895507812, -1.171844482421875, -1.1229171752929688, -1.0739898681640625, -1.0250625610351562, -0.97613525390625, -0.9272079467773438, -0.8782806396484375, -0.8293533325195312, -0.780426025390625, -0.7314987182617188, -0.6825714111328125, -0.6336441040039062, -0.584716796875, -0.5357894897460938, -0.4868621826171875, -0.43793487548828125, -0.389007568359375, -0.34008026123046875, -0.2911529541015625, -0.24222564697265625, -0.19329833984375, -0.14437103271484375, -0.0954437255859375, -0.04651641845703125, 0.002410888671875, 0.05133819580078125, 0.1002655029296875, 0.14919281005859375, 0.1981201171875, 0.24704742431640625, 0.2959747314453125, 0.34490203857421875, 0.393829345703125, 0.44275665283203125, 0.4916839599609375, 0.5406112670898438, 0.58953857421875, 0.6384658813476562, 0.6873931884765625, 0.7363204956054688, 0.785247802734375, 0.8341751098632812, 0.8831024169921875, 0.9320297241210938, 0.98095703125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 17.0, 22.0, 24.0, 42.0, 47.0, 68.0, 58.0, 71.0, 79.0, 91.0, 72.0, 71.0, 76.0, 53.0, 41.0, 48.0, 30.0, 27.0, 19.0, 14.0, 11.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0], "bins": [-1.3115234375, -1.2834930419921875, -1.255462646484375, -1.2274322509765625, -1.19940185546875, -1.1713714599609375, -1.143341064453125, -1.1153106689453125, -1.0872802734375, -1.0592498779296875, -1.031219482421875, -1.0031890869140625, -0.97515869140625, -0.9471282958984375, -0.919097900390625, -0.8910675048828125, -0.863037109375, -0.8350067138671875, -0.806976318359375, -0.7789459228515625, -0.75091552734375, -0.7228851318359375, -0.694854736328125, -0.6668243408203125, -0.6387939453125, -0.6107635498046875, -0.582733154296875, -0.5547027587890625, -0.52667236328125, -0.4986419677734375, -0.470611572265625, -0.4425811767578125, -0.41455078125, -0.3865203857421875, -0.358489990234375, -0.3304595947265625, -0.30242919921875, -0.2743988037109375, -0.246368408203125, -0.2183380126953125, -0.1903076171875, -0.1622772216796875, -0.134246826171875, -0.1062164306640625, -0.07818603515625, -0.0501556396484375, -0.022125244140625, 0.0059051513671875, 0.033935546875, 0.0619659423828125, 0.089996337890625, 0.1180267333984375, 0.14605712890625, 0.1740875244140625, 0.202117919921875, 0.2301483154296875, 0.2581787109375, 0.2862091064453125, 0.314239501953125, 0.3422698974609375, 0.37030029296875, 0.3983306884765625, 0.426361083984375, 0.4543914794921875, 0.482421875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 8.0, 10.0, 23.0, 35.0, 44.0, 69.0, 160.0, 335.0, 752.0, 2673.0, 16870.0, 1680109.0, 2469099.0, 19446.0, 3005.0, 917.0, 385.0, 159.0, 79.0, 44.0, 20.0, 10.0, 8.0, 6.0, 4.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.96875, -2.8863525390625, -2.803955078125, -2.7215576171875, -2.63916015625, -2.5567626953125, -2.474365234375, -2.3919677734375, -2.3095703125, -2.2271728515625, -2.144775390625, -2.0623779296875, -1.97998046875, -1.8975830078125, -1.815185546875, -1.7327880859375, -1.650390625, -1.5679931640625, -1.485595703125, -1.4031982421875, -1.32080078125, -1.2384033203125, -1.156005859375, -1.0736083984375, -0.9912109375, -0.9088134765625, -0.826416015625, -0.7440185546875, -0.66162109375, -0.5792236328125, -0.496826171875, -0.4144287109375, -0.33203125, -0.2496337890625, -0.167236328125, -0.0848388671875, -0.00244140625, 0.0799560546875, 0.162353515625, 0.2447509765625, 0.3271484375, 0.4095458984375, 0.491943359375, 0.5743408203125, 0.65673828125, 0.7391357421875, 0.821533203125, 0.9039306640625, 0.986328125, 1.0687255859375, 1.151123046875, 1.2335205078125, 1.31591796875, 1.3983154296875, 1.480712890625, 1.5631103515625, 1.6455078125, 1.7279052734375, 1.810302734375, 1.8927001953125, 1.97509765625, 2.0574951171875, 2.139892578125, 2.2222900390625, 2.3046875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 1.0, 8.0, 9.0, 16.0, 21.0, 43.0, 74.0, 130.0, 258.0, 532.0, 855.0, 938.0, 597.0, 274.0, 123.0, 74.0, 44.0, 23.0, 20.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4546318054199219, -0.43782806396484375, -0.4210243225097656, -0.4042205810546875, -0.3874168395996094, -0.37061309814453125, -0.3538093566894531, -0.337005615234375, -0.3202018737792969, -0.30339813232421875, -0.2865943908691406, -0.2697906494140625, -0.2529869079589844, -0.23618316650390625, -0.21937942504882812, -0.20257568359375, -0.18577194213867188, -0.16896820068359375, -0.15216445922851562, -0.1353607177734375, -0.11855697631835938, -0.10175323486328125, -0.08494949340820312, -0.068145751953125, -0.051342010498046875, -0.03453826904296875, -0.017734527587890625, -0.0009307861328125, 0.015872955322265625, 0.03267669677734375, 0.049480438232421875, 0.0662841796875, 0.08308792114257812, 0.09989166259765625, 0.11669540405273438, 0.1334991455078125, 0.15030288696289062, 0.16710662841796875, 0.18391036987304688, 0.200714111328125, 0.21751785278320312, 0.23432159423828125, 0.2511253356933594, 0.2679290771484375, 0.2847328186035156, 0.30153656005859375, 0.3183403015136719, 0.33514404296875, 0.3519477844238281, 0.36875152587890625, 0.3855552673339844, 0.4023590087890625, 0.4191627502441406, 0.43596649169921875, 0.4527702331542969, 0.469573974609375, 0.4863777160644531, 0.5031814575195312, 0.5199851989746094, 0.5367889404296875, 0.5535926818847656, 0.5703964233398438, 0.5872001647949219, 0.60400390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 12.0, 18.0, 25.0, 30.0, 36.0, 47.0, 40.0, 46.0, 51.0, 60.0, 65.0, 50.0, 71.0, 57.0, 69.0, 53.0, 57.0, 42.0, 33.0, 28.0, 22.0, 17.0, 5.0, 10.0, 6.0, 12.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9081579446792603, -0.8820516467094421, -0.8559452891349792, -0.8298389911651611, -0.8037326335906982, -0.7776263356208801, -0.751520037651062, -0.7254136800765991, -0.699307382106781, -0.6732010841369629, -0.6470947265625, -0.6209884285926819, -0.594882071018219, -0.5687757730484009, -0.542669415473938, -0.5165631175041199, -0.49045678973197937, -0.46435046195983887, -0.43824413418769836, -0.41213780641555786, -0.38603150844573975, -0.35992518067359924, -0.33381885290145874, -0.3077125549316406, -0.28160619735717773, -0.25549986958503723, -0.22939355671405792, -0.20328722894191742, -0.1771809160709381, -0.1510745882987976, -0.1249682605266571, -0.0988619476556778, -0.07275563478469849, -0.04664931446313858, -0.020542990416288376, 0.005563333630561829, 0.031669653952121735, 0.05777597427368164, 0.08388230204582214, 0.10998861491680145, 0.13609494268894196, 0.16220127046108246, 0.18830758333206177, 0.21441391110420227, 0.24052023887634277, 0.2666265368461609, 0.2927328944206238, 0.3188391923904419, 0.3449455201625824, 0.3710518479347229, 0.3971581757068634, 0.4232645034790039, 0.449370801448822, 0.4754771292209625, 0.501583456993103, 0.5276897549629211, 0.553796112537384, 0.5799024105072021, 0.606008768081665, 0.6321150660514832, 0.658221423625946, 0.6843277215957642, 0.710434079170227, 0.7365403771400452, 0.7626466751098633]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 6.0, 10.0, 12.0, 13.0, 11.0, 19.0, 15.0, 20.0, 29.0, 16.0, 24.0, 23.0, 39.0, 32.0, 44.0, 29.0, 43.0, 41.0, 51.0, 40.0, 36.0, 38.0, 36.0, 38.0, 28.0, 30.0, 33.0, 28.0, 22.0, 24.0, 22.0, 29.0, 12.0, 18.0, 15.0, 10.0, 8.0, 11.0, 11.0, 3.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5380727648735046, -0.5195364952087402, -0.5010002851486206, -0.4824640452861786, -0.4639278054237366, -0.44539153575897217, -0.42685529589653015, -0.40831905603408813, -0.3897828161716461, -0.3712465763092041, -0.3527103364467621, -0.33417409658432007, -0.31563782691955566, -0.29710161685943604, -0.27856534719467163, -0.2600291073322296, -0.2414928674697876, -0.22295662760734558, -0.20442038774490356, -0.18588413298130035, -0.16734789311885834, -0.14881165325641632, -0.1302753984928131, -0.1117391586303711, -0.09320291876792908, -0.07466667890548706, -0.05613043159246445, -0.03759418800473213, -0.019057944416999817, -0.0005217045545578003, 0.018014542758464813, 0.03655079007148743, 0.05508708953857422, 0.07362332940101624, 0.09215957671403885, 0.11069582402706146, 0.12923206388950348, 0.1477683037519455, 0.1663045585155487, 0.18484079837799072, 0.20337703824043274, 0.22191327810287476, 0.24044951796531677, 0.2589857578277588, 0.2775220274925232, 0.2960582375526428, 0.3145945072174072, 0.33313074707984924, 0.35166698694229126, 0.3702032268047333, 0.3887394666671753, 0.4072757065296173, 0.4258119463920593, 0.44434821605682373, 0.46288445591926575, 0.48142069578170776, 0.4999569356441498, 0.5184931755065918, 0.5370294451713562, 0.5555656552314758, 0.5741019248962402, 0.5926381349563599, 0.6111744046211243, 0.6297106742858887, 0.6482468843460083]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 10.0, 14.0, 17.0, 24.0, 34.0, 41.0, 43.0, 79.0, 110.0, 132.0, 173.0, 238.0, 383.0, 490.0, 764.0, 1232.0, 1968.0, 3618.0, 6829.0, 14772.0, 38835.0, 167058.0, 536770.0, 197954.0, 43645.0, 15947.0, 7439.0, 3904.0, 2202.0, 1260.0, 767.0, 524.0, 351.0, 254.0, 182.0, 127.0, 94.0, 72.0, 51.0, 29.0, 24.0, 18.0, 16.0, 15.0, 9.0, 5.0, 4.0, 3.0, 2.0, 8.0, 3.0, 1.0, 4.0], "bins": [-0.22216796875, -0.215545654296875, -0.20892333984375, -0.202301025390625, -0.1956787109375, -0.189056396484375, -0.18243408203125, -0.175811767578125, -0.169189453125, -0.162567138671875, -0.15594482421875, -0.149322509765625, -0.1427001953125, -0.136077880859375, -0.12945556640625, -0.122833251953125, -0.1162109375, -0.109588623046875, -0.10296630859375, -0.096343994140625, -0.0897216796875, -0.083099365234375, -0.07647705078125, -0.069854736328125, -0.063232421875, -0.056610107421875, -0.04998779296875, -0.043365478515625, -0.0367431640625, -0.030120849609375, -0.02349853515625, -0.016876220703125, -0.01025390625, -0.003631591796875, 0.00299072265625, 0.009613037109375, 0.0162353515625, 0.022857666015625, 0.02947998046875, 0.036102294921875, 0.042724609375, 0.049346923828125, 0.05596923828125, 0.062591552734375, 0.0692138671875, 0.075836181640625, 0.08245849609375, 0.089080810546875, 0.095703125, 0.102325439453125, 0.10894775390625, 0.115570068359375, 0.1221923828125, 0.128814697265625, 0.13543701171875, 0.142059326171875, 0.148681640625, 0.155303955078125, 0.16192626953125, 0.168548583984375, 0.1751708984375, 0.181793212890625, 0.18841552734375, 0.195037841796875, 0.20166015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 11.0, 13.0, 12.0, 8.0, 11.0, 20.0, 21.0, 17.0, 29.0, 26.0, 22.0, 24.0, 37.0, 38.0, 39.0, 34.0, 47.0, 44.0, 54.0, 40.0, 35.0, 40.0, 35.0, 40.0, 29.0, 29.0, 24.0, 29.0, 31.0, 28.0, 14.0, 22.0, 14.0, 16.0, 8.0, 11.0, 8.0, 6.0, 8.0, 4.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.369140625, -0.3572273254394531, -0.34531402587890625, -0.3334007263183594, -0.3214874267578125, -0.3095741271972656, -0.29766082763671875, -0.2857475280761719, -0.273834228515625, -0.2619209289550781, -0.25000762939453125, -0.23809432983398438, -0.2261810302734375, -0.21426773071289062, -0.20235443115234375, -0.19044113159179688, -0.17852783203125, -0.16661453247070312, -0.15470123291015625, -0.14278793334960938, -0.1308746337890625, -0.11896133422851562, -0.10704803466796875, -0.09513473510742188, -0.083221435546875, -0.07130813598632812, -0.05939483642578125, -0.047481536865234375, -0.0355682373046875, -0.023654937744140625, -0.01174163818359375, 0.000171661376953125, 0.0120849609375, 0.023998260498046875, 0.03591156005859375, 0.047824859619140625, 0.0597381591796875, 0.07165145874023438, 0.08356475830078125, 0.09547805786132812, 0.107391357421875, 0.11930465698242188, 0.13121795654296875, 0.14313125610351562, 0.1550445556640625, 0.16695785522460938, 0.17887115478515625, 0.19078445434570312, 0.20269775390625, 0.21461105346679688, 0.22652435302734375, 0.23843765258789062, 0.2503509521484375, 0.2622642517089844, 0.27417755126953125, 0.2860908508300781, 0.298004150390625, 0.3099174499511719, 0.32183074951171875, 0.3337440490722656, 0.3456573486328125, 0.3575706481933594, 0.36948394775390625, 0.3813972473144531, 0.393310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 14.0, 12.0, 23.0, 33.0, 44.0, 56.0, 105.0, 126.0, 176.0, 246.0, 381.0, 638.0, 1037.0, 1656.0, 2764.0, 4873.0, 9424.0, 19402.0, 46043.0, 132112.0, 356005.0, 299072.0, 101660.0, 37235.0, 16474.0, 8215.0, 4440.0, 2389.0, 1362.0, 877.0, 534.0, 322.0, 251.0, 167.0, 104.0, 87.0, 56.0, 44.0, 17.0, 25.0, 11.0, 14.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.10904216766357422, -0.10498619079589844, -0.10093021392822266, -0.09687423706054688, -0.0928182601928711, -0.08876228332519531, -0.08470630645751953, -0.08065032958984375, -0.07659435272216797, -0.07253837585449219, -0.0684823989868164, -0.06442642211914062, -0.060370445251464844, -0.05631446838378906, -0.05225849151611328, -0.0482025146484375, -0.04414653778076172, -0.04009056091308594, -0.036034584045410156, -0.031978607177734375, -0.027922630310058594, -0.023866653442382812, -0.01981067657470703, -0.01575469970703125, -0.011698722839355469, -0.0076427459716796875, -0.0035867691040039062, 0.000469207763671875, 0.004525184631347656, 0.008581161499023438, 0.012637138366699219, 0.016693115234375, 0.02074909210205078, 0.024805068969726562, 0.028861045837402344, 0.032917022705078125, 0.036972999572753906, 0.04102897644042969, 0.04508495330810547, 0.04914093017578125, 0.05319690704345703, 0.05725288391113281, 0.061308860778808594, 0.06536483764648438, 0.06942081451416016, 0.07347679138183594, 0.07753276824951172, 0.0815887451171875, 0.08564472198486328, 0.08970069885253906, 0.09375667572021484, 0.09781265258789062, 0.1018686294555664, 0.10592460632324219, 0.10998058319091797, 0.11403656005859375, 0.11809253692626953, 0.12214851379394531, 0.1262044906616211, 0.13026046752929688, 0.13431644439697266, 0.13837242126464844, 0.14242839813232422, 0.146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 10.0, 3.0, 6.0, 7.0, 16.0, 17.0, 12.0, 22.0, 16.0, 21.0, 32.0, 30.0, 38.0, 36.0, 40.0, 48.0, 39.0, 37.0, 40.0, 35.0, 55.0, 41.0, 34.0, 45.0, 34.0, 30.0, 34.0, 28.0, 29.0, 24.0, 24.0, 23.0, 24.0, 11.0, 14.0, 16.0, 4.0, 4.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.0390625, -1.009063720703125, -0.97906494140625, -0.949066162109375, -0.9190673828125, -0.889068603515625, -0.85906982421875, -0.829071044921875, -0.799072265625, -0.769073486328125, -0.73907470703125, -0.709075927734375, -0.6790771484375, -0.649078369140625, -0.61907958984375, -0.589080810546875, -0.55908203125, -0.529083251953125, -0.49908447265625, -0.469085693359375, -0.4390869140625, -0.409088134765625, -0.37908935546875, -0.349090576171875, -0.319091796875, -0.289093017578125, -0.25909423828125, -0.229095458984375, -0.1990966796875, -0.169097900390625, -0.13909912109375, -0.109100341796875, -0.0791015625, -0.049102783203125, -0.01910400390625, 0.010894775390625, 0.0408935546875, 0.070892333984375, 0.10089111328125, 0.130889892578125, 0.160888671875, 0.190887451171875, 0.22088623046875, 0.250885009765625, 0.2808837890625, 0.310882568359375, 0.34088134765625, 0.370880126953125, 0.40087890625, 0.430877685546875, 0.46087646484375, 0.490875244140625, 0.5208740234375, 0.550872802734375, 0.58087158203125, 0.610870361328125, 0.640869140625, 0.670867919921875, 0.70086669921875, 0.730865478515625, 0.7608642578125, 0.790863037109375, 0.82086181640625, 0.850860595703125, 0.880859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 26.0, 34.0, 58.0, 101.0, 198.0, 360.0, 766.0, 1639.0, 3747.0, 11103.0, 51442.0, 401430.0, 490133.0, 66628.0, 13164.0, 4231.0, 1765.0, 756.0, 408.0, 238.0, 109.0, 75.0, 50.0, 33.0, 14.0, 9.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07635498046875, -0.0730447769165039, -0.06973457336425781, -0.06642436981201172, -0.06311416625976562, -0.05980396270751953, -0.05649375915527344, -0.053183555603027344, -0.04987335205078125, -0.046563148498535156, -0.04325294494628906, -0.03994274139404297, -0.036632537841796875, -0.03332233428955078, -0.030012130737304688, -0.026701927185058594, -0.0233917236328125, -0.020081520080566406, -0.016771316528320312, -0.013461112976074219, -0.010150909423828125, -0.006840705871582031, -0.0035305023193359375, -0.00022029876708984375, 0.00308990478515625, 0.006400108337402344, 0.009710311889648438, 0.013020515441894531, 0.016330718994140625, 0.01964092254638672, 0.022951126098632812, 0.026261329650878906, 0.029571533203125, 0.032881736755371094, 0.03619194030761719, 0.03950214385986328, 0.042812347412109375, 0.04612255096435547, 0.04943275451660156, 0.052742958068847656, 0.05605316162109375, 0.059363365173339844, 0.06267356872558594, 0.06598377227783203, 0.06929397583007812, 0.07260417938232422, 0.07591438293457031, 0.0792245864868164, 0.0825347900390625, 0.0858449935913086, 0.08915519714355469, 0.09246540069580078, 0.09577560424804688, 0.09908580780029297, 0.10239601135253906, 0.10570621490478516, 0.10901641845703125, 0.11232662200927734, 0.11563682556152344, 0.11894702911376953, 0.12225723266601562, 0.12556743621826172, 0.1288776397705078, 0.1321878433227539, 0.135498046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 8.0, 7.0, 13.0, 19.0, 21.0, 31.0, 42.0, 81.0, 96.0, 140.0, 90.0, 116.0, 93.0, 70.0, 60.0, 27.0, 27.0, 15.0, 10.0, 3.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.054473876953125e-05, -4.915613681077957e-05, -4.776753485202789e-05, -4.6378932893276215e-05, -4.4990330934524536e-05, -4.360172897577286e-05, -4.221312701702118e-05, -4.08245250582695e-05, -3.943592309951782e-05, -3.8047321140766144e-05, -3.6658719182014465e-05, -3.527011722326279e-05, -3.388151526451111e-05, -3.249291330575943e-05, -3.110431134700775e-05, -2.9715709388256073e-05, -2.8327107429504395e-05, -2.6938505470752716e-05, -2.5549903512001038e-05, -2.416130155324936e-05, -2.277269959449768e-05, -2.1384097635746002e-05, -1.9995495676994324e-05, -1.8606893718242645e-05, -1.7218291759490967e-05, -1.582968980073929e-05, -1.444108784198761e-05, -1.3052485883235931e-05, -1.1663883924484253e-05, -1.0275281965732574e-05, -8.886680006980896e-06, -7.4980780482292175e-06, -6.109476089477539e-06, -4.720874130725861e-06, -3.332272171974182e-06, -1.9436702132225037e-06, -5.550682544708252e-07, 8.335337042808533e-07, 2.2221356630325317e-06, 3.61073762178421e-06, 4.999339580535889e-06, 6.387941539287567e-06, 7.776543498039246e-06, 9.165145456790924e-06, 1.0553747415542603e-05, 1.1942349374294281e-05, 1.333095133304596e-05, 1.4719553291797638e-05, 1.6108155250549316e-05, 1.7496757209300995e-05, 1.8885359168052673e-05, 2.0273961126804352e-05, 2.166256308555603e-05, 2.305116504430771e-05, 2.4439767003059387e-05, 2.5828368961811066e-05, 2.7216970920562744e-05, 2.8605572879314423e-05, 2.99941748380661e-05, 3.138277679681778e-05, 3.277137875556946e-05, 3.4159980714321136e-05, 3.5548582673072815e-05, 3.6937184631824493e-05, 3.832578659057617e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 11.0, 1.0, 12.0, 14.0, 10.0, 20.0, 26.0, 51.0, 67.0, 110.0, 136.0, 228.0, 348.0, 619.0, 1067.0, 2063.0, 3955.0, 8755.0, 21627.0, 58307.0, 170260.0, 359548.0, 266352.0, 96740.0, 33740.0, 12894.0, 5646.0, 2679.0, 1336.0, 754.0, 420.0, 239.0, 176.0, 103.0, 71.0, 52.0, 37.0, 27.0, 13.0, 14.0, 10.0, 5.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06231689453125, -0.06035327911376953, -0.05838966369628906, -0.056426048278808594, -0.054462432861328125, -0.052498817443847656, -0.05053520202636719, -0.04857158660888672, -0.04660797119140625, -0.04464435577392578, -0.04268074035644531, -0.040717124938964844, -0.038753509521484375, -0.036789894104003906, -0.03482627868652344, -0.03286266326904297, -0.0308990478515625, -0.02893543243408203, -0.026971817016601562, -0.025008201599121094, -0.023044586181640625, -0.021080970764160156, -0.019117355346679688, -0.01715373992919922, -0.01519012451171875, -0.013226509094238281, -0.011262893676757812, -0.009299278259277344, -0.007335662841796875, -0.005372047424316406, -0.0034084320068359375, -0.0014448165893554688, 0.000518798828125, 0.0024824142456054688, 0.0044460296630859375, 0.006409645080566406, 0.008373260498046875, 0.010336875915527344, 0.012300491333007812, 0.014264106750488281, 0.01622772216796875, 0.01819133758544922, 0.020154953002929688, 0.022118568420410156, 0.024082183837890625, 0.026045799255371094, 0.028009414672851562, 0.02997303009033203, 0.0319366455078125, 0.03390026092529297, 0.03586387634277344, 0.037827491760253906, 0.039791107177734375, 0.041754722595214844, 0.04371833801269531, 0.04568195343017578, 0.04764556884765625, 0.04960918426513672, 0.05157279968261719, 0.053536415100097656, 0.055500030517578125, 0.057463645935058594, 0.05942726135253906, 0.06139087677001953, 0.0633544921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 1.0, 7.0, 5.0, 7.0, 11.0, 3.0, 13.0, 16.0, 15.0, 23.0, 36.0, 43.0, 53.0, 57.0, 58.0, 87.0, 72.0, 78.0, 72.0, 52.0, 61.0, 43.0, 38.0, 36.0, 24.0, 24.0, 17.0, 10.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.023773193359375, -0.02312636375427246, -0.022479534149169922, -0.021832704544067383, -0.021185874938964844, -0.020539045333862305, -0.019892215728759766, -0.019245386123657227, -0.018598556518554688, -0.01795172691345215, -0.01730489730834961, -0.01665806770324707, -0.01601123809814453, -0.015364408493041992, -0.014717578887939453, -0.014070749282836914, -0.013423919677734375, -0.012777090072631836, -0.012130260467529297, -0.011483430862426758, -0.010836601257324219, -0.01018977165222168, -0.00954294204711914, -0.008896112442016602, -0.008249282836914062, -0.0076024532318115234, -0.006955623626708984, -0.006308794021606445, -0.005661964416503906, -0.005015134811401367, -0.004368305206298828, -0.003721475601196289, -0.00307464599609375, -0.002427816390991211, -0.0017809867858886719, -0.0011341571807861328, -0.00048732757568359375, 0.0001595020294189453, 0.0008063316345214844, 0.0014531612396240234, 0.0020999908447265625, 0.0027468204498291016, 0.0033936500549316406, 0.00404047966003418, 0.004687309265136719, 0.005334138870239258, 0.005980968475341797, 0.006627798080444336, 0.007274627685546875, 0.007921457290649414, 0.008568286895751953, 0.009215116500854492, 0.009861946105957031, 0.01050877571105957, 0.01115560531616211, 0.011802434921264648, 0.012449264526367188, 0.013096094131469727, 0.013742923736572266, 0.014389753341674805, 0.015036582946777344, 0.015683412551879883, 0.016330242156982422, 0.01697707176208496, 0.0176239013671875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 4.0, 12.0, 17.0, 15.0, 19.0, 34.0, 25.0, 34.0, 37.0, 52.0, 41.0, 63.0, 61.0, 64.0, 57.0, 51.0, 63.0, 62.0, 48.0, 53.0, 36.0, 36.0, 19.0, 16.0, 13.0, 16.0, 8.0, 11.0, 6.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5047309398651123, -0.4899222254753113, -0.47511351108551025, -0.46030479669570923, -0.4454961121082306, -0.43068739771842957, -0.41587868332862854, -0.4010699689388275, -0.3862612843513489, -0.37145256996154785, -0.3566438555717468, -0.3418351411819458, -0.32702645659446716, -0.31221774220466614, -0.2974090278148651, -0.2826003134250641, -0.26779159903526306, -0.25298288464546204, -0.2381741851568222, -0.22336547076702118, -0.20855677127838135, -0.19374805688858032, -0.1789393424987793, -0.16413062810897827, -0.14932192862033844, -0.13451321423053741, -0.11970451474189758, -0.10489580035209656, -0.09008709341287613, -0.0752783864736557, -0.060469672083854675, -0.04566096514463425, -0.03085225820541382, -0.01604354940354824, -0.001234840601682663, 0.013573870062828064, 0.028382577002048492, 0.04319128394126892, 0.057999998331069946, 0.07280870527029037, 0.0876174122095108, 0.10242611914873123, 0.11723482608795166, 0.13204354047775269, 0.1468522548675537, 0.16166095435619354, 0.17646966874599457, 0.1912783682346344, 0.20608708262443542, 0.22089579701423645, 0.23570449650287628, 0.2505131959915161, 0.26532191038131714, 0.28013062477111816, 0.2949393391609192, 0.3097480535507202, 0.32455676794052124, 0.33936548233032227, 0.3541741967201233, 0.3689829111099243, 0.38379159569740295, 0.398600310087204, 0.413409024477005, 0.42821773886680603, 0.44302642345428467]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 11.0, 5.0, 8.0, 11.0, 16.0, 16.0, 13.0, 24.0, 17.0, 16.0, 25.0, 24.0, 30.0, 25.0, 37.0, 37.0, 37.0, 50.0, 43.0, 39.0, 42.0, 46.0, 36.0, 41.0, 27.0, 36.0, 34.0, 27.0, 19.0, 27.0, 25.0, 28.0, 21.0, 14.0, 13.0, 12.0, 18.0, 9.0, 6.0, 10.0, 7.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35974112153053284, -0.34840232133865356, -0.3370634913444519, -0.32572469115257263, -0.31438586115837097, -0.3030470609664917, -0.29170823097229004, -0.28036943078041077, -0.2690306007862091, -0.25769180059432983, -0.24635297060012817, -0.2350141555070877, -0.22367534041404724, -0.21233652532100677, -0.2009977102279663, -0.18965891003608704, -0.17832009494304657, -0.1669812798500061, -0.15564246475696564, -0.14430364966392517, -0.1329648345708847, -0.12162601947784424, -0.11028721183538437, -0.0989483967423439, -0.08760958164930344, -0.07627076655626297, -0.0649319514632225, -0.053593140095472336, -0.04225432500243187, -0.030915509909391403, -0.019576698541641235, -0.008237883448600769, 0.0031009316444396973, 0.014439745806157589, 0.02577855996787548, 0.0371173731982708, 0.048456188291311264, 0.05979500338435173, 0.0711338147521019, 0.08247262984514236, 0.09381144493818283, 0.1051502600312233, 0.11648907512426376, 0.12782788276672363, 0.1391666978597641, 0.15050551295280457, 0.16184432804584503, 0.1731831431388855, 0.18452195823192596, 0.19586077332496643, 0.2071995884180069, 0.21853840351104736, 0.22987721860408783, 0.2412160336971283, 0.25255483388900757, 0.26389366388320923, 0.2752324640750885, 0.2865712642669678, 0.29791009426116943, 0.3092488944530487, 0.32058772444725037, 0.33192652463912964, 0.3432653546333313, 0.35460415482521057, 0.36594298481941223]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 12.0, 22.0, 37.0, 51.0, 94.0, 168.0, 322.0, 507.0, 1003.0, 2147.0, 4441.0, 10508.0, 28622.0, 94114.0, 342733.0, 393104.0, 115104.0, 33433.0, 12242.0, 5086.0, 2340.0, 1115.0, 583.0, 327.0, 189.0, 90.0, 42.0, 42.0, 16.0, 19.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84228515625, -0.8160247802734375, -0.789764404296875, -0.7635040283203125, -0.73724365234375, -0.7109832763671875, -0.684722900390625, -0.6584625244140625, -0.6322021484375, -0.6059417724609375, -0.579681396484375, -0.5534210205078125, -0.52716064453125, -0.5009002685546875, -0.474639892578125, -0.4483795166015625, -0.422119140625, -0.3958587646484375, -0.369598388671875, -0.3433380126953125, -0.31707763671875, -0.2908172607421875, -0.264556884765625, -0.2382965087890625, -0.2120361328125, -0.1857757568359375, -0.159515380859375, -0.1332550048828125, -0.10699462890625, -0.0807342529296875, -0.054473876953125, -0.0282135009765625, -0.001953125, 0.0243072509765625, 0.050567626953125, 0.0768280029296875, 0.10308837890625, 0.1293487548828125, 0.155609130859375, 0.1818695068359375, 0.2081298828125, 0.2343902587890625, 0.260650634765625, 0.2869110107421875, 0.31317138671875, 0.3394317626953125, 0.365692138671875, 0.3919525146484375, 0.418212890625, 0.4444732666015625, 0.470733642578125, 0.4969940185546875, 0.52325439453125, 0.5495147705078125, 0.575775146484375, 0.6020355224609375, 0.6282958984375, 0.6545562744140625, 0.680816650390625, 0.7070770263671875, 0.73333740234375, 0.7595977783203125, 0.785858154296875, 0.8121185302734375, 0.83837890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 5.0, 4.0, 8.0, 22.0, 10.0, 23.0, 16.0, 17.0, 14.0, 17.0, 36.0, 30.0, 45.0, 42.0, 49.0, 54.0, 59.0, 38.0, 65.0, 48.0, 44.0, 45.0, 34.0, 45.0, 31.0, 36.0, 27.0, 25.0, 26.0, 20.0, 10.0, 10.0, 7.0, 10.0, 13.0, 7.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6061172485351562, -0.5808868408203125, -0.5556564331054688, -0.530426025390625, -0.5051956176757812, -0.4799652099609375, -0.45473480224609375, -0.42950439453125, -0.40427398681640625, -0.3790435791015625, -0.35381317138671875, -0.328582763671875, -0.30335235595703125, -0.2781219482421875, -0.25289154052734375, -0.2276611328125, -0.20243072509765625, -0.1772003173828125, -0.15196990966796875, -0.126739501953125, -0.10150909423828125, -0.0762786865234375, -0.05104827880859375, -0.02581787109375, -0.00058746337890625, 0.0246429443359375, 0.04987335205078125, 0.075103759765625, 0.10033416748046875, 0.1255645751953125, 0.15079498291015625, 0.176025390625, 0.20125579833984375, 0.2264862060546875, 0.25171661376953125, 0.276947021484375, 0.30217742919921875, 0.3274078369140625, 0.35263824462890625, 0.37786865234375, 0.40309906005859375, 0.4283294677734375, 0.45355987548828125, 0.478790283203125, 0.5040206909179688, 0.5292510986328125, 0.5544815063476562, 0.5797119140625, 0.6049423217773438, 0.6301727294921875, 0.6554031372070312, 0.680633544921875, 0.7058639526367188, 0.7310943603515625, 0.7563247680664062, 0.78155517578125, 0.8067855834960938, 0.8320159912109375, 0.8572463989257812, 0.882476806640625, 0.9077072143554688, 0.9329376220703125, 0.9581680297851562, 0.9833984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 10.0, 9.0, 11.0, 6.0, 18.0, 18.0, 36.0, 56.0, 65.0, 94.0, 153.0, 251.0, 397.0, 756.0, 1402.0, 3297.0, 8570.0, 25908.0, 97204.0, 398488.0, 380667.0, 91633.0, 25190.0, 8020.0, 3084.0, 1411.0, 682.0, 407.0, 240.0, 151.0, 85.0, 68.0, 53.0, 33.0, 16.0, 16.0, 9.0, 11.0, 12.0, 9.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1307525634765625, -1.096466064453125, -1.0621795654296875, -1.02789306640625, -0.9936065673828125, -0.959320068359375, -0.9250335693359375, -0.8907470703125, -0.8564605712890625, -0.822174072265625, -0.7878875732421875, -0.75360107421875, -0.7193145751953125, -0.685028076171875, -0.6507415771484375, -0.616455078125, -0.5821685791015625, -0.547882080078125, -0.5135955810546875, -0.47930908203125, -0.4450225830078125, -0.410736083984375, -0.3764495849609375, -0.3421630859375, -0.3078765869140625, -0.273590087890625, -0.2393035888671875, -0.20501708984375, -0.1707305908203125, -0.136444091796875, -0.1021575927734375, -0.06787109375, -0.0335845947265625, 0.000701904296875, 0.0349884033203125, 0.06927490234375, 0.1035614013671875, 0.137847900390625, 0.1721343994140625, 0.2064208984375, 0.2407073974609375, 0.274993896484375, 0.3092803955078125, 0.34356689453125, 0.3778533935546875, 0.412139892578125, 0.4464263916015625, 0.480712890625, 0.5149993896484375, 0.549285888671875, 0.5835723876953125, 0.61785888671875, 0.6521453857421875, 0.686431884765625, 0.7207183837890625, 0.7550048828125, 0.7892913818359375, 0.823577880859375, 0.8578643798828125, 0.89215087890625, 0.9264373779296875, 0.960723876953125, 0.9950103759765625, 1.029296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 7.0, 5.0, 8.0, 15.0, 15.0, 16.0, 21.0, 23.0, 17.0, 27.0, 28.0, 25.0, 36.0, 38.0, 35.0, 42.0, 47.0, 53.0, 47.0, 49.0, 37.0, 49.0, 49.0, 38.0, 35.0, 32.0, 27.0, 27.0, 26.0, 17.0, 16.0, 14.0, 10.0, 8.0, 14.0, 8.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.73486328125, -0.7114181518554688, -0.6879730224609375, -0.6645278930664062, -0.641082763671875, -0.6176376342773438, -0.5941925048828125, -0.5707473754882812, -0.54730224609375, -0.5238571166992188, -0.5004119873046875, -0.47696685791015625, -0.453521728515625, -0.43007659912109375, -0.4066314697265625, -0.38318634033203125, -0.3597412109375, -0.33629608154296875, -0.3128509521484375, -0.28940582275390625, -0.265960693359375, -0.24251556396484375, -0.2190704345703125, -0.19562530517578125, -0.17218017578125, -0.14873504638671875, -0.1252899169921875, -0.10184478759765625, -0.078399658203125, -0.05495452880859375, -0.0315093994140625, -0.00806427001953125, 0.015380859375, 0.03882598876953125, 0.0622711181640625, 0.08571624755859375, 0.109161376953125, 0.13260650634765625, 0.1560516357421875, 0.17949676513671875, 0.20294189453125, 0.22638702392578125, 0.2498321533203125, 0.27327728271484375, 0.296722412109375, 0.32016754150390625, 0.3436126708984375, 0.36705780029296875, 0.3905029296875, 0.41394805908203125, 0.4373931884765625, 0.46083831787109375, 0.484283447265625, 0.5077285766601562, 0.5311737060546875, 0.5546188354492188, 0.57806396484375, 0.6015090942382812, 0.6249542236328125, 0.6483993530273438, 0.671844482421875, 0.6952896118164062, 0.7187347412109375, 0.7421798706054688, 0.765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 5.0, 5.0, 7.0, 7.0, 25.0, 28.0, 34.0, 83.0, 94.0, 163.0, 247.0, 464.0, 883.0, 1671.0, 3846.0, 9619.0, 26978.0, 79703.0, 220315.0, 414998.0, 186967.0, 65242.0, 22313.0, 8210.0, 3353.0, 1447.0, 773.0, 417.0, 233.0, 120.0, 100.0, 61.0, 49.0, 29.0, 17.0, 13.0, 9.0, 7.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.1112680435180664, -0.10748481750488281, -0.10370159149169922, -0.09991836547851562, -0.09613513946533203, -0.09235191345214844, -0.08856868743896484, -0.08478546142578125, -0.08100223541259766, -0.07721900939941406, -0.07343578338623047, -0.06965255737304688, -0.06586933135986328, -0.06208610534667969, -0.058302879333496094, -0.0545196533203125, -0.050736427307128906, -0.04695320129394531, -0.04316997528076172, -0.039386749267578125, -0.03560352325439453, -0.03182029724121094, -0.028037071228027344, -0.02425384521484375, -0.020470619201660156, -0.016687393188476562, -0.012904167175292969, -0.009120941162109375, -0.005337715148925781, -0.0015544891357421875, 0.0022287368774414062, 0.006011962890625, 0.009795188903808594, 0.013578414916992188, 0.01736164093017578, 0.021144866943359375, 0.02492809295654297, 0.028711318969726562, 0.032494544982910156, 0.03627777099609375, 0.040060997009277344, 0.04384422302246094, 0.04762744903564453, 0.051410675048828125, 0.05519390106201172, 0.05897712707519531, 0.0627603530883789, 0.0665435791015625, 0.0703268051147461, 0.07411003112792969, 0.07789325714111328, 0.08167648315429688, 0.08545970916748047, 0.08924293518066406, 0.09302616119384766, 0.09680938720703125, 0.10059261322021484, 0.10437583923339844, 0.10815906524658203, 0.11194229125976562, 0.11572551727294922, 0.11950874328613281, 0.1232919692993164, 0.1270751953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 8.0, 13.0, 12.0, 20.0, 23.0, 28.0, 32.0, 30.0, 58.0, 55.0, 64.0, 102.0, 124.0, 80.0, 76.0, 52.0, 50.0, 38.0, 27.0, 20.0, 25.0, 12.0, 11.0, 11.0, 2.0, 7.0, 7.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.8411857783794403e-05, -2.755783498287201e-05, -2.6703812181949615e-05, -2.584978938102722e-05, -2.4995766580104828e-05, -2.4141743779182434e-05, -2.328772097826004e-05, -2.2433698177337646e-05, -2.1579675376415253e-05, -2.072565257549286e-05, -1.9871629774570465e-05, -1.901760697364807e-05, -1.8163584172725677e-05, -1.7309561371803284e-05, -1.645553857088089e-05, -1.5601515769958496e-05, -1.4747492969036102e-05, -1.3893470168113708e-05, -1.3039447367191315e-05, -1.2185424566268921e-05, -1.1331401765346527e-05, -1.0477378964424133e-05, -9.62335616350174e-06, -8.769333362579346e-06, -7.915310561656952e-06, -7.061287760734558e-06, -6.207264959812164e-06, -5.3532421588897705e-06, -4.499219357967377e-06, -3.645196557044983e-06, -2.791173756122589e-06, -1.9371509552001953e-06, -1.0831281542778015e-06, -2.2910535335540771e-07, 6.249174475669861e-07, 1.4789402484893799e-06, 2.3329630494117737e-06, 3.1869858503341675e-06, 4.041008651256561e-06, 4.895031452178955e-06, 5.749054253101349e-06, 6.603077054023743e-06, 7.4570998549461365e-06, 8.31112265586853e-06, 9.165145456790924e-06, 1.0019168257713318e-05, 1.0873191058635712e-05, 1.1727213859558105e-05, 1.25812366604805e-05, 1.3435259461402893e-05, 1.4289282262325287e-05, 1.514330506324768e-05, 1.5997327864170074e-05, 1.6851350665092468e-05, 1.7705373466014862e-05, 1.8559396266937256e-05, 1.941341906785965e-05, 2.0267441868782043e-05, 2.1121464669704437e-05, 2.197548747062683e-05, 2.2829510271549225e-05, 2.368353307247162e-05, 2.4537555873394012e-05, 2.5391578674316406e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 8.0, 13.0, 13.0, 23.0, 24.0, 45.0, 51.0, 73.0, 101.0, 118.0, 169.0, 250.0, 391.0, 551.0, 888.0, 1505.0, 2554.0, 5523.0, 13613.0, 41016.0, 136053.0, 435163.0, 278178.0, 86187.0, 26800.0, 9545.0, 4057.0, 2098.0, 1220.0, 747.0, 466.0, 289.0, 224.0, 163.0, 110.0, 96.0, 77.0, 49.0, 28.0, 35.0, 11.0, 10.0, 12.0, 2.0, 8.0, 0.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16015625, -0.1552753448486328, -0.15039443969726562, -0.14551353454589844, -0.14063262939453125, -0.13575172424316406, -0.13087081909179688, -0.1259899139404297, -0.1211090087890625, -0.11622810363769531, -0.11134719848632812, -0.10646629333496094, -0.10158538818359375, -0.09670448303222656, -0.09182357788085938, -0.08694267272949219, -0.082061767578125, -0.07718086242675781, -0.07229995727539062, -0.06741905212402344, -0.06253814697265625, -0.05765724182128906, -0.052776336669921875, -0.04789543151855469, -0.0430145263671875, -0.03813362121582031, -0.033252716064453125, -0.028371810913085938, -0.02349090576171875, -0.018610000610351562, -0.013729095458984375, -0.008848190307617188, -0.00396728515625, 0.0009136199951171875, 0.005794525146484375, 0.010675430297851562, 0.01555633544921875, 0.020437240600585938, 0.025318145751953125, 0.030199050903320312, 0.0350799560546875, 0.03996086120605469, 0.044841766357421875, 0.04972267150878906, 0.05460357666015625, 0.05948448181152344, 0.06436538696289062, 0.06924629211425781, 0.074127197265625, 0.07900810241699219, 0.08388900756835938, 0.08876991271972656, 0.09365081787109375, 0.09853172302246094, 0.10341262817382812, 0.10829353332519531, 0.1131744384765625, 0.11805534362792969, 0.12293624877929688, 0.12781715393066406, 0.13269805908203125, 0.13757896423339844, 0.14245986938476562, 0.1473407745361328, 0.1522216796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 16.0, 16.0, 33.0, 40.0, 65.0, 77.0, 95.0, 179.0, 114.0, 110.0, 75.0, 54.0, 47.0, 29.0, 10.0, 10.0, 7.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1370849609375, -0.13301849365234375, -0.1289520263671875, -0.12488555908203125, -0.120819091796875, -0.11675262451171875, -0.1126861572265625, -0.10861968994140625, -0.10455322265625, -0.10048675537109375, -0.0964202880859375, -0.09235382080078125, -0.088287353515625, -0.08422088623046875, -0.0801544189453125, -0.07608795166015625, -0.072021484375, -0.06795501708984375, -0.0638885498046875, -0.05982208251953125, -0.055755615234375, -0.05168914794921875, -0.0476226806640625, -0.04355621337890625, -0.03948974609375, -0.03542327880859375, -0.0313568115234375, -0.02729034423828125, -0.023223876953125, -0.01915740966796875, -0.0150909423828125, -0.01102447509765625, -0.0069580078125, -0.00289154052734375, 0.0011749267578125, 0.00524139404296875, 0.009307861328125, 0.01337432861328125, 0.0174407958984375, 0.02150726318359375, 0.02557373046875, 0.02964019775390625, 0.0337066650390625, 0.03777313232421875, 0.041839599609375, 0.04590606689453125, 0.0499725341796875, 0.05403900146484375, 0.05810546875, 0.06217193603515625, 0.0662384033203125, 0.07030487060546875, 0.074371337890625, 0.07843780517578125, 0.0825042724609375, 0.08657073974609375, 0.09063720703125, 0.09470367431640625, 0.0987701416015625, 0.10283660888671875, 0.106903076171875, 0.11096954345703125, 0.1150360107421875, 0.11910247802734375, 0.1231689453125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 38.0, 97.0, 200.0, 263.0, 190.0, 119.0, 49.0, 19.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1071416139602661, -0.9914671778678894, -0.8757927417755127, -0.7601182460784912, -0.6444438695907593, -0.5287693738937378, -0.4130949378013611, -0.2974205017089844, -0.18174606561660767, -0.06607162207365036, 0.049602821469306946, 0.16527727246284485, 0.28095170855522156, 0.39662617444992065, 0.5123006105422974, 0.6279750466346741, 0.7436494827270508, 0.8593239188194275, 0.9749983549118042, 1.0906728506088257, 1.2063472270965576, 1.322021722793579, 1.4376962184906006, 1.5533705949783325, 1.6690449714660645, 1.784719467163086, 1.9003938436508179, 2.01606822013855, 2.1317427158355713, 2.2474172115325928, 2.3630917072296143, 2.4787659645080566, 2.5944406986236572, 2.7101151943206787, 2.8257896900177, 2.9414639472961426, 3.057138442993164, 3.1728129386901855, 3.288487434387207, 3.4041619300842285, 3.519836187362671, 3.6355106830596924, 3.751185178756714, 3.8668594360351562, 3.9825339317321777, 4.098208427429199, 4.213882923126221, 4.329557418823242, 4.445231914520264, 4.560906410217285, 4.676580905914307, 4.792255401611328, 4.90792989730835, 5.023604393005371, 5.139278411865234, 5.254952907562256, 5.370627403259277, 5.486301898956299, 5.60197639465332, 5.717650890350342, 5.833325386047363, 5.948999404907227, 6.064673900604248, 6.1803483963012695, 6.296022891998291]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 11.0, 7.0, 13.0, 10.0, 20.0, 17.0, 21.0, 29.0, 25.0, 22.0, 25.0, 37.0, 32.0, 34.0, 47.0, 42.0, 46.0, 42.0, 38.0, 40.0, 41.0, 53.0, 26.0, 45.0, 33.0, 39.0, 35.0, 26.0, 18.0, 17.0, 25.0, 15.0, 21.0, 17.0, 9.0, 2.0, 5.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5122652053833008, -1.4709608554840088, -1.4296565055847168, -1.3883522748947144, -1.3470479249954224, -1.3057435750961304, -1.2644392251968384, -1.2231348752975464, -1.181830644607544, -1.140526294708252, -1.09922194480896, -1.0579177141189575, -1.0166133642196655, -0.9753090143203735, -0.9340046644210815, -0.8927003145217896, -0.8513959646224976, -0.8100916147232056, -0.7687873244285583, -0.7274829745292664, -0.6861786842346191, -0.6448743343353271, -0.6035699844360352, -0.5622656345367432, -0.520961344242096, -0.47965702414512634, -0.43835270404815674, -0.39704835414886475, -0.35574403405189514, -0.31443971395492554, -0.27313536405563354, -0.23183104395866394, -0.19052660465240479, -0.14922228455543518, -0.10791794955730438, -0.06661362200975418, -0.02530929446220398, 0.015995025634765625, 0.05729936063289642, 0.09860369563102722, 0.13990801572799683, 0.18121233582496643, 0.22251667082309723, 0.263821005821228, 0.30512532591819763, 0.34642964601516724, 0.38773399591445923, 0.42903831601142883, 0.47034263610839844, 0.5116469860076904, 0.5529512763023376, 0.5942556262016296, 0.6355599164962769, 0.6768642663955688, 0.7181686162948608, 0.7594729661941528, 0.8007772564888, 0.842081606388092, 0.8833858966827393, 0.9246902465820312, 0.9659945964813232, 1.0072989463806152, 1.0486031770706177, 1.0899075269699097, 1.1312118768692017]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 15.0, 16.0, 16.0, 27.0, 31.0, 50.0, 62.0, 119.0, 224.0, 357.0, 631.0, 1460.0, 4112.0, 13847.0, 1021078.0, 5064.0, 1687.0, 751.0, 430.0, 225.0, 123.0, 87.0, 49.0, 39.0, 23.0, 16.0, 11.0, 10.0, 6.0, 6.0, 6.0, 2.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4936835765838623, -2.4205307960510254, -2.3473782539367676, -2.2742257118225098, -2.201072931289673, -2.127920150756836, -2.054767608642578, -1.9816149473190308, -1.9084622859954834, -1.835309624671936, -1.7621569633483887, -1.6890043020248413, -1.615851640701294, -1.5426989793777466, -1.4695463180541992, -1.3963936567306519, -1.3232409954071045, -1.2500883340835571, -1.1769356727600098, -1.1037830114364624, -1.030630350112915, -0.9574776887893677, -0.8843250274658203, -0.811172366142273, -0.7380197048187256, -0.6648670434951782, -0.5917143821716309, -0.5185617208480835, -0.44540905952453613, -0.37225639820098877, -0.2991037368774414, -0.22595107555389404, -0.15279841423034668, -0.07964575290679932, -0.006493091583251953, 0.06665956974029541, 0.13981223106384277, 0.21296489238739014, 0.2861175537109375, 0.35927021503448486, 0.4324228763580322, 0.5055755376815796, 0.578728199005127, 0.6518808603286743, 0.7250335216522217, 0.798186182975769, 0.8713388442993164, 0.9444915056228638, 1.0176441669464111, 1.0907968282699585, 1.1639494895935059, 1.2371021509170532, 1.3102548122406006, 1.383407473564148, 1.4565601348876953, 1.5297127962112427, 1.60286545753479, 1.6760181188583374, 1.7491707801818848, 1.8223234415054321, 1.8954761028289795, 1.9686287641525269, 2.041781425476074, 2.114933967590332, 2.188086748123169]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 15.0, 26.0, 31.0, 50.0, 88.0, 153.0, 239.0, 337.0, 532.0, 957.0, 1885.0, 4371.0, 51436176.0, 18969.0, 3005.0, 1434.0, 764.0, 447.0, 293.0, 182.0, 123.0, 74.0, 58.0, 32.0, 20.0, 14.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.352810859680176, -10.995879173278809, -10.638947486877441, -10.282015800476074, -9.925085067749023, -9.568153381347656, -9.211221694946289, -8.854290008544922, -8.497358322143555, -8.140426635742188, -7.78349494934082, -7.426563739776611, -7.069632053375244, -6.712700366973877, -6.355769157409668, -5.998837471008301, -5.641905784606934, -5.284974098205566, -4.928042411804199, -4.57111120223999, -4.214179515838623, -3.857247829437256, -3.5003163814544678, -3.1433849334716797, -2.7864532470703125, -2.4295215606689453, -2.0725901126861572, -1.7156585454940796, -1.358726978302002, -1.0017954111099243, -0.6448638439178467, -0.2879323959350586, 0.069000244140625, 0.42593181133270264, 0.7828633785247803, 1.139794945716858, 1.4967265129089355, 1.8536580801010132, 2.210589647293091, 2.567521095275879, 2.924452781677246, 3.2813844680786133, 3.6383159160614014, 3.9952473640441895, 4.352179050445557, 4.709110736846924, 5.066041946411133, 5.4229736328125, 5.779905319213867, 6.136837005615234, 6.493768692016602, 6.8506999015808105, 7.207631587982178, 7.564563274383545, 7.921494483947754, 8.278426170349121, 8.635357856750488, 8.992289543151855, 9.349221229553223, 9.70615291595459, 10.06308364868164, 10.420015335083008, 10.776947021484375, 11.133878707885742, 11.49081039428711]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 8.0, 3.0, 12.0, 10.0, 27.0, 38.0, 67.0, 108.0, 210.0, 344.0, 480.0, 852.0, 1513.0, 2668.0, 4711.0, 8792.0, 16680.0, 32671.0, 64602.0, 125280.0, 232551.0, 387165.0, 748690.0, 3455405.0, 505303.0, 319696.0, 183115.0, 96828.0, 49413.0, 25049.0, 13124.0, 7046.0, 3950.0, 2031.0, 1212.0, 731.0, 439.0, 249.0, 146.0, 80.0, 54.0, 36.0, 19.0, 8.0, 13.0, 10.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.99169921875, -0.9600143432617188, -0.9283294677734375, -0.8966445922851562, -0.864959716796875, -0.8332748413085938, -0.8015899658203125, -0.7699050903320312, -0.73822021484375, -0.7065353393554688, -0.6748504638671875, -0.6431655883789062, -0.611480712890625, -0.5797958374023438, -0.5481109619140625, -0.5164260864257812, -0.4847412109375, -0.45305633544921875, -0.4213714599609375, -0.38968658447265625, -0.358001708984375, -0.32631683349609375, -0.2946319580078125, -0.26294708251953125, -0.23126220703125, -0.19957733154296875, -0.1678924560546875, -0.13620758056640625, -0.104522705078125, -0.07283782958984375, -0.0411529541015625, -0.00946807861328125, 0.022216796875, 0.05390167236328125, 0.0855865478515625, 0.11727142333984375, 0.148956298828125, 0.18064117431640625, 0.2123260498046875, 0.24401092529296875, 0.27569580078125, 0.30738067626953125, 0.3390655517578125, 0.37075042724609375, 0.402435302734375, 0.43412017822265625, 0.4658050537109375, 0.49748992919921875, 0.5291748046875, 0.5608596801757812, 0.5925445556640625, 0.6242294311523438, 0.655914306640625, 0.6875991821289062, 0.7192840576171875, 0.7509689331054688, 0.78265380859375, 0.8143386840820312, 0.8460235595703125, 0.8777084350585938, 0.909393310546875, 0.9410781860351562, 0.9727630615234375, 1.0044479370117188, 1.0361328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 8.0, 11.0, 15.0, 18.0, 16.0, 13.0, 20.0, 23.0, 36.0, 39.0, 31.0, 29.0, 37.0, 38.0, 31.0, 62.0, 200.0, 871.0, 100.0, 46.0, 43.0, 36.0, 31.0, 39.0, 31.0, 28.0, 28.0, 27.0, 19.0, 19.0, 14.0, 9.0, 7.0, 7.0, 10.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.13671875, -6.9013671875, -6.666015625, -6.4306640625, -6.1953125, -5.9599609375, -5.724609375, -5.4892578125, -5.25390625, -5.0185546875, -4.783203125, -4.5478515625, -4.3125, -4.0771484375, -3.841796875, -3.6064453125, -3.37109375, -3.1357421875, -2.900390625, -2.6650390625, -2.4296875, -2.1943359375, -1.958984375, -1.7236328125, -1.48828125, -1.2529296875, -1.017578125, -0.7822265625, -0.546875, -0.3115234375, -0.076171875, 0.1591796875, 0.39453125, 0.6298828125, 0.865234375, 1.1005859375, 1.3359375, 1.5712890625, 1.806640625, 2.0419921875, 2.27734375, 2.5126953125, 2.748046875, 2.9833984375, 3.21875, 3.4541015625, 3.689453125, 3.9248046875, 4.16015625, 4.3955078125, 4.630859375, 4.8662109375, 5.1015625, 5.3369140625, 5.572265625, 5.8076171875, 6.04296875, 6.2783203125, 6.513671875, 6.7490234375, 6.984375, 7.2197265625, 7.455078125, 7.6904296875, 7.92578125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 10.0, 5.0, 13.0, 25.0, 46.0, 44.0, 101.0, 138.0, 204.0, 329.0, 517.0, 828.0, 1280.0, 1871.0, 2976.0, 4693.0, 7404.0, 11253.0, 17983.0, 28303.0, 43888.0, 66366.0, 99190.0, 141712.0, 193871.0, 249595.0, 307774.0, 1071633.0, 2705785.0, 350135.0, 271931.0, 215431.0, 160706.0, 113821.0, 77652.0, 51324.0, 33133.0, 21346.0, 13609.0, 8942.0, 5483.0, 3567.0, 2268.0, 1441.0, 1017.0, 687.0, 380.0, 263.0, 183.0, 112.0, 72.0, 37.0, 23.0, 19.0, 13.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.468505859375, -0.4534873962402344, -0.43846893310546875, -0.4234504699707031, -0.4084320068359375, -0.3934135437011719, -0.37839508056640625, -0.3633766174316406, -0.348358154296875, -0.3333396911621094, -0.31832122802734375, -0.3033027648925781, -0.2882843017578125, -0.2732658386230469, -0.25824737548828125, -0.24322891235351562, -0.22821044921875, -0.21319198608398438, -0.19817352294921875, -0.18315505981445312, -0.1681365966796875, -0.15311813354492188, -0.13809967041015625, -0.12308120727539062, -0.108062744140625, -0.09304428100585938, -0.07802581787109375, -0.06300735473632812, -0.0479888916015625, -0.032970428466796875, -0.01795196533203125, -0.002933502197265625, 0.0120849609375, 0.027103424072265625, 0.04212188720703125, 0.057140350341796875, 0.0721588134765625, 0.08717727661132812, 0.10219573974609375, 0.11721420288085938, 0.132232666015625, 0.14725112915039062, 0.16226959228515625, 0.17728805541992188, 0.1923065185546875, 0.20732498168945312, 0.22234344482421875, 0.23736190795898438, 0.25238037109375, 0.2673988342285156, 0.28241729736328125, 0.2974357604980469, 0.3124542236328125, 0.3274726867675781, 0.34249114990234375, 0.3575096130371094, 0.372528076171875, 0.3875465393066406, 0.40256500244140625, 0.4175834655761719, 0.4326019287109375, 0.4476203918457031, 0.46263885498046875, 0.4776573181152344, 0.49267578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 17.0, 5.0, 11.0, 13.0, 13.0, 18.0, 19.0, 28.0, 24.0, 16.0, 30.0, 45.0, 35.0, 45.0, 47.0, 61.0, 635.0, 465.0, 46.0, 42.0, 45.0, 35.0, 35.0, 30.0, 29.0, 40.0, 18.0, 24.0, 27.0, 20.0, 18.0, 11.0, 12.0, 16.0, 7.0, 4.0, 4.0, 9.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.328125, -6.14666748046875, -5.9652099609375, -5.78375244140625, -5.602294921875, -5.42083740234375, -5.2393798828125, -5.05792236328125, -4.87646484375, -4.69500732421875, -4.5135498046875, -4.33209228515625, -4.150634765625, -3.96917724609375, -3.7877197265625, -3.60626220703125, -3.4248046875, -3.24334716796875, -3.0618896484375, -2.88043212890625, -2.698974609375, -2.51751708984375, -2.3360595703125, -2.15460205078125, -1.97314453125, -1.79168701171875, -1.6102294921875, -1.42877197265625, -1.247314453125, -1.06585693359375, -0.8843994140625, -0.70294189453125, -0.521484375, -0.34002685546875, -0.1585693359375, 0.02288818359375, 0.204345703125, 0.38580322265625, 0.5672607421875, 0.74871826171875, 0.93017578125, 1.11163330078125, 1.2930908203125, 1.47454833984375, 1.656005859375, 1.83746337890625, 2.0189208984375, 2.20037841796875, 2.3818359375, 2.56329345703125, 2.7447509765625, 2.92620849609375, 3.107666015625, 3.28912353515625, 3.4705810546875, 3.65203857421875, 3.83349609375, 4.01495361328125, 4.1964111328125, 4.37786865234375, 4.559326171875, 4.74078369140625, 4.9222412109375, 5.10369873046875, 5.28515625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 17.0, 11.0, 28.0, 28.0, 45.0, 52.0, 81.0, 110.0, 135.0, 156.0, 214.0, 328.0, 423.0, 589.0, 841.0, 1318.0, 1902.0, 3015.0, 5546.0, 10888.0, 23024.0, 51172.0, 108644.0, 965297.0, 4893232.0, 116614.0, 55231.0, 25013.0, 11674.0, 5889.0, 3298.0, 1995.0, 1339.0, 947.0, 621.0, 458.0, 341.0, 226.0, 155.0, 124.0, 81.0, 81.0, 52.0, 52.0, 38.0, 27.0, 18.0, 14.0, 13.0, 6.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0], "bins": [-1.6728515625, -1.62066650390625, -1.5684814453125, -1.51629638671875, -1.464111328125, -1.41192626953125, -1.3597412109375, -1.30755615234375, -1.25537109375, -1.20318603515625, -1.1510009765625, -1.09881591796875, -1.046630859375, -0.99444580078125, -0.9422607421875, -0.89007568359375, -0.837890625, -0.78570556640625, -0.7335205078125, -0.68133544921875, -0.629150390625, -0.57696533203125, -0.5247802734375, -0.47259521484375, -0.42041015625, -0.36822509765625, -0.3160400390625, -0.26385498046875, -0.211669921875, -0.15948486328125, -0.1072998046875, -0.05511474609375, -0.0029296875, 0.04925537109375, 0.1014404296875, 0.15362548828125, 0.205810546875, 0.25799560546875, 0.3101806640625, 0.36236572265625, 0.41455078125, 0.46673583984375, 0.5189208984375, 0.57110595703125, 0.623291015625, 0.67547607421875, 0.7276611328125, 0.77984619140625, 0.83203125, 0.88421630859375, 0.9364013671875, 0.98858642578125, 1.040771484375, 1.09295654296875, 1.1451416015625, 1.19732666015625, 1.24951171875, 1.30169677734375, 1.3538818359375, 1.40606689453125, 1.458251953125, 1.51043701171875, 1.5626220703125, 1.61480712890625, 1.6669921875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 8.0, 8.0, 5.0, 14.0, 17.0, 14.0, 22.0, 33.0, 29.0, 21.0, 42.0, 36.0, 28.0, 35.0, 41.0, 50.0, 113.0, 884.0, 160.0, 48.0, 34.0, 40.0, 30.0, 33.0, 32.0, 39.0, 25.0, 27.0, 24.0, 15.0, 10.0, 17.0, 14.0, 15.0, 4.0, 4.0, 6.0, 2.0, 11.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.69140625, -5.52655029296875, -5.3616943359375, -5.19683837890625, -5.031982421875, -4.86712646484375, -4.7022705078125, -4.53741455078125, -4.37255859375, -4.20770263671875, -4.0428466796875, -3.87799072265625, -3.713134765625, -3.54827880859375, -3.3834228515625, -3.21856689453125, -3.0537109375, -2.88885498046875, -2.7239990234375, -2.55914306640625, -2.394287109375, -2.22943115234375, -2.0645751953125, -1.89971923828125, -1.73486328125, -1.57000732421875, -1.4051513671875, -1.24029541015625, -1.075439453125, -0.91058349609375, -0.7457275390625, -0.58087158203125, -0.416015625, -0.25115966796875, -0.0863037109375, 0.07855224609375, 0.243408203125, 0.40826416015625, 0.5731201171875, 0.73797607421875, 0.90283203125, 1.06768798828125, 1.2325439453125, 1.39739990234375, 1.562255859375, 1.72711181640625, 1.8919677734375, 2.05682373046875, 2.2216796875, 2.38653564453125, 2.5513916015625, 2.71624755859375, 2.881103515625, 3.04595947265625, 3.2108154296875, 3.37567138671875, 3.54052734375, 3.70538330078125, 3.8702392578125, 4.03509521484375, 4.199951171875, 4.36480712890625, 4.5296630859375, 4.69451904296875, 4.859375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 13.0, 20.0, 15.0, 23.0, 32.0, 43.0, 48.0, 58.0, 123.0, 183.0, 111.0, 66.0, 58.0, 46.0, 34.0, 28.0, 11.0, 20.0, 13.0, 13.0, 3.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.38465881347656, -37.480552673339844, -36.57645034790039, -35.67234420776367, -34.76824188232422, -33.8641357421875, -32.96003341674805, -32.05592727661133, -31.151823043823242, -30.247718811035156, -29.34361457824707, -28.439510345458984, -27.535404205322266, -26.631301879882812, -25.727195739746094, -24.823091506958008, -23.918987274169922, -23.014883041381836, -22.11077880859375, -21.206674575805664, -20.302570343017578, -19.39846420288086, -18.494359970092773, -17.590255737304688, -16.6861515045166, -15.782047271728516, -14.87794303894043, -13.973837852478027, -13.069733619689941, -12.165629386901855, -11.261524200439453, -10.357419967651367, -9.453313827514648, -8.549209594726562, -7.645104885101318, -6.741000175476074, -5.836895942687988, -4.932791709899902, -4.028687000274658, -3.124582290649414, -2.220478057861328, -1.316373586654663, -0.41226911544799805, 0.491835355758667, 1.395939826965332, 2.300044059753418, 3.204148769378662, 4.108253479003906, 5.012357711791992, 5.916461944580078, 6.820566654205322, 7.724671363830566, 8.628775596618652, 9.532879829406738, 10.43698501586914, 11.341089248657227, 12.245193481445312, 13.149297714233398, 14.053401947021484, 14.957507133483887, 15.861611366271973, 16.765716552734375, 17.66982078552246, 18.573925018310547, 19.478029251098633]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 7.0, 5.0, 5.0, 4.0, 10.0, 15.0, 11.0, 22.0, 19.0, 17.0, 19.0, 31.0, 31.0, 34.0, 48.0, 73.0, 88.0, 115.0, 92.0, 51.0, 48.0, 41.0, 36.0, 26.0, 24.0, 22.0, 14.0, 14.0, 7.0, 13.0, 10.0, 4.0, 9.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.30535125732422, -64.30560302734375, -62.30585861206055, -60.306114196777344, -58.306365966796875, -56.30662155151367, -54.30687713623047, -52.30712890625, -50.3073844909668, -48.307640075683594, -46.307891845703125, -44.30814743041992, -42.30840301513672, -40.30865478515625, -38.30891036987305, -36.309165954589844, -34.309417724609375, -32.30967330932617, -30.309925079345703, -28.3101806640625, -26.310434341430664, -24.310688018798828, -22.310943603515625, -20.31119728088379, -18.311450958251953, -16.311704635620117, -14.311959266662598, -12.312213897705078, -10.312467575073242, -8.312721252441406, -6.312975883483887, -4.313230514526367, -2.313488006591797, -0.31374216079711914, 1.6860036849975586, 3.6857495307922363, 5.685495376586914, 7.68524169921875, 9.68498706817627, 11.684732437133789, 13.684478759765625, 15.684225082397461, 17.683971405029297, 19.6837158203125, 21.683462142944336, 23.683208465576172, 25.682952880859375, 27.68269920349121, 29.682445526123047, 31.682191848754883, 33.68193817138672, 35.68168258666992, 37.681427001953125, 39.681175231933594, 41.6809196472168, 43.6806640625, 45.68041229248047, 47.68015670776367, 49.67990493774414, 51.679649353027344, 53.67939758300781, 55.679141998291016, 57.67888641357422, 59.67863464355469, 61.67837905883789]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 1.0, 5.0, 9.0, 17.0, 14.0, 21.0, 34.0, 61.0, 95.0, 115.0, 168.0, 245.0, 406.0, 694.0, 1116.0, 1969.0, 3681.0, 7889.0, 19253.0, 68017.0, 3066853.0, 931969.0, 57839.0, 17726.0, 7268.0, 3715.0, 1980.0, 1141.0, 665.0, 443.0, 273.0, 196.0, 116.0, 86.0, 64.0, 39.0, 24.0, 20.0, 24.0, 8.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11614990234375, -0.11227130889892578, -0.10839271545410156, -0.10451412200927734, -0.10063552856445312, -0.0967569351196289, -0.09287834167480469, -0.08899974822998047, -0.08512115478515625, -0.08124256134033203, -0.07736396789550781, -0.0734853744506836, -0.06960678100585938, -0.06572818756103516, -0.06184959411621094, -0.05797100067138672, -0.0540924072265625, -0.05021381378173828, -0.04633522033691406, -0.042456626892089844, -0.038578033447265625, -0.034699440002441406, -0.030820846557617188, -0.02694225311279297, -0.02306365966796875, -0.01918506622314453, -0.015306472778320312, -0.011427879333496094, -0.007549285888671875, -0.0036706924438476562, 0.0002079010009765625, 0.004086494445800781, 0.007965087890625, 0.011843681335449219, 0.015722274780273438, 0.019600868225097656, 0.023479461669921875, 0.027358055114746094, 0.031236648559570312, 0.03511524200439453, 0.03899383544921875, 0.04287242889404297, 0.04675102233886719, 0.050629615783691406, 0.054508209228515625, 0.058386802673339844, 0.06226539611816406, 0.06614398956298828, 0.0700225830078125, 0.07390117645263672, 0.07777976989746094, 0.08165836334228516, 0.08553695678710938, 0.0894155502319336, 0.09329414367675781, 0.09717273712158203, 0.10105133056640625, 0.10492992401123047, 0.10880851745605469, 0.1126871109008789, 0.11656570434570312, 0.12044429779052734, 0.12432289123535156, 0.12820148468017578, 0.132080078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 1.0, 3.0, 9.0, 8.0, 9.0, 15.0, 20.0, 8.0, 28.0, 35.0, 35.0, 64.0, 110.0, 288.0, 92.0, 69.0, 49.0, 37.0, 23.0, 18.0, 17.0, 10.0, 12.0, 6.0, 8.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056488037109375, -0.054802894592285156, -0.05311775207519531, -0.05143260955810547, -0.049747467041015625, -0.04806232452392578, -0.04637718200683594, -0.044692039489746094, -0.04300689697265625, -0.041321754455566406, -0.03963661193847656, -0.03795146942138672, -0.036266326904296875, -0.03458118438720703, -0.03289604187011719, -0.031210899353027344, -0.0295257568359375, -0.027840614318847656, -0.026155471801757812, -0.02447032928466797, -0.022785186767578125, -0.02110004425048828, -0.019414901733398438, -0.017729759216308594, -0.01604461669921875, -0.014359474182128906, -0.012674331665039062, -0.010989189147949219, -0.009304046630859375, -0.007618904113769531, -0.0059337615966796875, -0.004248619079589844, -0.0025634765625, -0.0008783340454101562, 0.0008068084716796875, 0.0024919509887695312, 0.004177093505859375, 0.005862236022949219, 0.0075473785400390625, 0.009232521057128906, 0.01091766357421875, 0.012602806091308594, 0.014287948608398438, 0.01597309112548828, 0.017658233642578125, 0.01934337615966797, 0.021028518676757812, 0.022713661193847656, 0.0243988037109375, 0.026083946228027344, 0.027769088745117188, 0.02945423126220703, 0.031139373779296875, 0.03282451629638672, 0.03450965881347656, 0.036194801330566406, 0.03787994384765625, 0.039565086364746094, 0.04125022888183594, 0.04293537139892578, 0.044620513916015625, 0.04630565643310547, 0.04799079895019531, 0.049675941467285156, 0.051361083984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 25.0, 22.0, 32.0, 47.0, 88.0, 163.0, 265.0, 564.0, 1149.0, 2682.0, 6895.0, 21692.0, 100490.0, 1060386.0, 2768791.0, 183269.0, 32539.0, 9163.0, 3313.0, 1350.0, 629.0, 336.0, 156.0, 77.0, 44.0, 33.0, 18.0, 14.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.11998748779296875, -0.1162567138671875, -0.11252593994140625, -0.108795166015625, -0.10506439208984375, -0.1013336181640625, -0.09760284423828125, -0.0938720703125, -0.09014129638671875, -0.0864105224609375, -0.08267974853515625, -0.078948974609375, -0.07521820068359375, -0.0714874267578125, -0.06775665283203125, -0.06402587890625, -0.06029510498046875, -0.0565643310546875, -0.05283355712890625, -0.049102783203125, -0.04537200927734375, -0.0416412353515625, -0.03791046142578125, -0.0341796875, -0.03044891357421875, -0.0267181396484375, -0.02298736572265625, -0.019256591796875, -0.01552581787109375, -0.0117950439453125, -0.00806427001953125, -0.00433349609375, -0.00060272216796875, 0.0031280517578125, 0.00685882568359375, 0.010589599609375, 0.01432037353515625, 0.0180511474609375, 0.02178192138671875, 0.0255126953125, 0.02924346923828125, 0.0329742431640625, 0.03670501708984375, 0.040435791015625, 0.04416656494140625, 0.0478973388671875, 0.05162811279296875, 0.05535888671875, 0.05908966064453125, 0.0628204345703125, 0.06655120849609375, 0.070281982421875, 0.07401275634765625, 0.0777435302734375, 0.08147430419921875, 0.085205078125, 0.08893585205078125, 0.0926666259765625, 0.09639739990234375, 0.100128173828125, 0.10385894775390625, 0.1075897216796875, 0.11132049560546875, 0.11505126953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 3.0, 9.0, 6.0, 7.0, 18.0, 11.0, 21.0, 37.0, 50.0, 65.0, 101.0, 154.0, 302.0, 619.0, 1113.0, 714.0, 307.0, 198.0, 120.0, 66.0, 48.0, 32.0, 22.0, 12.0, 8.0, 3.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050994873046875, -0.04938220977783203, -0.04776954650878906, -0.046156883239746094, -0.044544219970703125, -0.042931556701660156, -0.04131889343261719, -0.03970623016357422, -0.03809356689453125, -0.03648090362548828, -0.03486824035644531, -0.033255577087402344, -0.031642913818359375, -0.030030250549316406, -0.028417587280273438, -0.02680492401123047, -0.0251922607421875, -0.02357959747314453, -0.021966934204101562, -0.020354270935058594, -0.018741607666015625, -0.017128944396972656, -0.015516281127929688, -0.013903617858886719, -0.01229095458984375, -0.010678291320800781, -0.009065628051757812, -0.007452964782714844, -0.005840301513671875, -0.004227638244628906, -0.0026149749755859375, -0.0010023117065429688, 0.0006103515625, 0.0022230148315429688, 0.0038356781005859375, 0.005448341369628906, 0.007061004638671875, 0.008673667907714844, 0.010286331176757812, 0.011898994445800781, 0.01351165771484375, 0.015124320983886719, 0.016736984252929688, 0.018349647521972656, 0.019962310791015625, 0.021574974060058594, 0.023187637329101562, 0.02480030059814453, 0.0264129638671875, 0.02802562713623047, 0.029638290405273438, 0.031250953674316406, 0.032863616943359375, 0.034476280212402344, 0.03608894348144531, 0.03770160675048828, 0.03931427001953125, 0.04092693328857422, 0.04253959655761719, 0.044152259826660156, 0.045764923095703125, 0.047377586364746094, 0.04899024963378906, 0.05060291290283203, 0.052215576171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 12.0, 36.0, 186.0, 506.0, 224.0, 26.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5204178690910339, -0.4938589632511139, -0.46730005741119385, -0.4407411217689514, -0.41418221592903137, -0.38762331008911133, -0.3610643744468689, -0.33450546860694885, -0.3079465627670288, -0.28138765692710876, -0.2548287510871887, -0.2282698154449463, -0.20171090960502625, -0.1751520037651062, -0.14859308302402496, -0.12203416228294373, -0.09547525644302368, -0.06891634315252304, -0.0423574298620224, -0.01579851657152176, 0.010760396718978882, 0.037319302558898926, 0.06387822329998016, 0.0904371440410614, 0.11699604988098145, 0.1435549557209015, 0.17011387646198273, 0.19667279720306396, 0.223231703042984, 0.24979060888290405, 0.2763495445251465, 0.30290845036506653, 0.3294672966003418, 0.35602620244026184, 0.3825851082801819, 0.4091440439224243, 0.43570294976234436, 0.4622618556022644, 0.48882079124450684, 0.5153796672821045, 0.5419386029243469, 0.5684975385665894, 0.595056414604187, 0.6216153502464294, 0.6481742858886719, 0.6747331619262695, 0.701292097568512, 0.7278510332107544, 0.754409909248352, 0.7809688448905945, 0.8075277209281921, 0.8340866565704346, 0.8606455326080322, 0.8872044682502747, 0.9137634038925171, 0.9403222799301147, 0.9668812155723572, 0.9934401512145996, 1.0199990272521973, 1.046557903289795, 1.0731168985366821, 1.0996757745742798, 1.1262346506118774, 1.1527936458587646, 1.1793525218963623]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 8.0, 5.0, 8.0, 8.0, 7.0, 12.0, 14.0, 30.0, 37.0, 45.0, 50.0, 73.0, 65.0, 56.0, 82.0, 67.0, 79.0, 67.0, 54.0, 47.0, 47.0, 49.0, 21.0, 10.0, 15.0, 11.0, 5.0, 8.0, 1.0, 4.0, 3.0, 2.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.27869975566864014, -0.2711939811706543, -0.26368820667266846, -0.2561824321746826, -0.24867665767669678, -0.24117088317871094, -0.2336651086807251, -0.22615933418273926, -0.21865355968475342, -0.21114778518676758, -0.20364201068878174, -0.1961362361907959, -0.18863046169281006, -0.18112468719482422, -0.17361891269683838, -0.16611313819885254, -0.1586073487997055, -0.15110157430171967, -0.14359579980373383, -0.13609002530574799, -0.12858425080776215, -0.1210784763097763, -0.11357269436120987, -0.10606691986322403, -0.09856114536523819, -0.09105537086725235, -0.08354959636926651, -0.07604381442070007, -0.06853803992271423, -0.06103226915001869, -0.053526490926742554, -0.046020716428756714, -0.038514941930770874, -0.031009167432785034, -0.023503391072154045, -0.015997614711523056, -0.008491840213537216, -0.0009860657155513763, 0.006519712507724762, 0.014025487005710602, 0.02153126150369644, 0.02903703600168228, 0.03654281049966812, 0.04404858872294426, 0.0515543632209301, 0.05906013771891594, 0.06656591594219208, 0.07407169044017792, 0.08157746493816376, 0.0890832394361496, 0.09658901393413544, 0.10409478843212128, 0.11160056293010712, 0.11910633742809296, 0.12661212682724, 0.13411790132522583, 0.14162367582321167, 0.1491294503211975, 0.15663522481918335, 0.1641409993171692, 0.17164677381515503, 0.17915254831314087, 0.1866583228111267, 0.19416409730911255, 0.2016698718070984]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 16.0, 16.0, 14.0, 26.0, 34.0, 43.0, 62.0, 103.0, 102.0, 156.0, 232.0, 323.0, 455.0, 686.0, 969.0, 1596.0, 2574.0, 4154.0, 7147.0, 12799.0, 24611.0, 55024.0, 172675.0, 568454.0, 108857.0, 41049.0, 19929.0, 10488.0, 5894.0, 3507.0, 2183.0, 1448.0, 903.0, 597.0, 442.0, 288.0, 185.0, 159.0, 96.0, 68.0, 49.0, 36.0, 35.0, 15.0, 18.0, 11.0, 3.0, 11.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0], "bins": [-0.143310546875, -0.13901138305664062, -0.13471221923828125, -0.13041305541992188, -0.1261138916015625, -0.12181472778320312, -0.11751556396484375, -0.11321640014648438, -0.108917236328125, -0.10461807250976562, -0.10031890869140625, -0.09601974487304688, -0.0917205810546875, -0.08742141723632812, -0.08312225341796875, -0.07882308959960938, -0.07452392578125, -0.07022476196289062, -0.06592559814453125, -0.061626434326171875, -0.0573272705078125, -0.053028106689453125, -0.04872894287109375, -0.044429779052734375, -0.040130615234375, -0.035831451416015625, -0.03153228759765625, -0.027233123779296875, -0.0229339599609375, -0.018634796142578125, -0.01433563232421875, -0.010036468505859375, -0.0057373046875, -0.001438140869140625, 0.00286102294921875, 0.007160186767578125, 0.0114593505859375, 0.015758514404296875, 0.02005767822265625, 0.024356842041015625, 0.028656005859375, 0.032955169677734375, 0.03725433349609375, 0.041553497314453125, 0.0458526611328125, 0.050151824951171875, 0.05445098876953125, 0.058750152587890625, 0.06304931640625, 0.06734848022460938, 0.07164764404296875, 0.07594680786132812, 0.0802459716796875, 0.08454513549804688, 0.08884429931640625, 0.09314346313476562, 0.097442626953125, 0.10174179077148438, 0.10604095458984375, 0.11034011840820312, 0.1146392822265625, 0.11893844604492188, 0.12323760986328125, 0.12753677368164062, 0.1318359375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 6.0, 3.0, 3.0, 5.0, 9.0, 14.0, 10.0, 16.0, 18.0, 20.0, 21.0, 34.0, 47.0, 66.0, 177.0, 217.0, 79.0, 61.0, 41.0, 39.0, 17.0, 20.0, 17.0, 12.0, 11.0, 11.0, 8.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0523681640625, -0.05079507827758789, -0.04922199249267578, -0.04764890670776367, -0.04607582092285156, -0.04450273513793945, -0.042929649353027344, -0.041356563568115234, -0.039783477783203125, -0.038210391998291016, -0.036637306213378906, -0.0350642204284668, -0.03349113464355469, -0.03191804885864258, -0.03034496307373047, -0.02877187728881836, -0.02719879150390625, -0.02562570571899414, -0.02405261993408203, -0.022479534149169922, -0.020906448364257812, -0.019333362579345703, -0.017760276794433594, -0.016187191009521484, -0.014614105224609375, -0.013041019439697266, -0.011467933654785156, -0.009894847869873047, -0.008321762084960938, -0.006748676300048828, -0.005175590515136719, -0.0036025047302246094, -0.0020294189453125, -0.0004563331604003906, 0.0011167526245117188, 0.002689838409423828, 0.0042629241943359375, 0.005836009979248047, 0.007409095764160156, 0.008982181549072266, 0.010555267333984375, 0.012128353118896484, 0.013701438903808594, 0.015274524688720703, 0.016847610473632812, 0.018420696258544922, 0.01999378204345703, 0.02156686782836914, 0.02313995361328125, 0.02471303939819336, 0.02628612518310547, 0.027859210968017578, 0.029432296752929688, 0.031005382537841797, 0.032578468322753906, 0.034151554107666016, 0.035724639892578125, 0.037297725677490234, 0.038870811462402344, 0.04044389724731445, 0.04201698303222656, 0.04359006881713867, 0.04516315460205078, 0.04673624038696289, 0.048309326171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 10.0, 11.0, 16.0, 16.0, 29.0, 39.0, 48.0, 90.0, 109.0, 172.0, 327.0, 543.0, 1085.0, 2373.0, 6085.0, 16793.0, 57394.0, 247730.0, 508974.0, 149356.0, 37186.0, 11804.0, 4484.0, 1799.0, 897.0, 433.0, 278.0, 141.0, 102.0, 45.0, 48.0, 29.0, 25.0, 27.0, 14.0, 10.0, 5.0, 8.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11474609375, -0.111083984375, -0.107421875, -0.103759765625, -0.10009765625, -0.096435546875, -0.0927734375, -0.089111328125, -0.08544921875, -0.081787109375, -0.078125, -0.074462890625, -0.07080078125, -0.067138671875, -0.0634765625, -0.059814453125, -0.05615234375, -0.052490234375, -0.048828125, -0.045166015625, -0.04150390625, -0.037841796875, -0.0341796875, -0.030517578125, -0.02685546875, -0.023193359375, -0.01953125, -0.015869140625, -0.01220703125, -0.008544921875, -0.0048828125, -0.001220703125, 0.00244140625, 0.006103515625, 0.009765625, 0.013427734375, 0.01708984375, 0.020751953125, 0.0244140625, 0.028076171875, 0.03173828125, 0.035400390625, 0.0390625, 0.042724609375, 0.04638671875, 0.050048828125, 0.0537109375, 0.057373046875, 0.06103515625, 0.064697265625, 0.068359375, 0.072021484375, 0.07568359375, 0.079345703125, 0.0830078125, 0.086669921875, 0.09033203125, 0.093994140625, 0.09765625, 0.101318359375, 0.10498046875, 0.108642578125, 0.1123046875, 0.115966796875, 0.11962890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 8.0, 19.0, 19.0, 24.0, 30.0, 31.0, 33.0, 27.0, 38.0, 30.0, 28.0, 48.0, 39.0, 47.0, 37.0, 36.0, 52.0, 33.0, 36.0, 30.0, 30.0, 44.0, 44.0, 28.0, 30.0, 18.0, 20.0, 21.0, 17.0, 18.0, 13.0, 6.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15869140625, -0.15356826782226562, -0.14844512939453125, -0.14332199096679688, -0.1381988525390625, -0.13307571411132812, -0.12795257568359375, -0.12282943725585938, -0.117706298828125, -0.11258316040039062, -0.10746002197265625, -0.10233688354492188, -0.0972137451171875, -0.09209060668945312, -0.08696746826171875, -0.08184432983398438, -0.07672119140625, -0.07159805297851562, -0.06647491455078125, -0.061351776123046875, -0.0562286376953125, -0.051105499267578125, -0.04598236083984375, -0.040859222412109375, -0.035736083984375, -0.030612945556640625, -0.02548980712890625, -0.020366668701171875, -0.0152435302734375, -0.010120391845703125, -0.00499725341796875, 0.000125885009765625, 0.0052490234375, 0.010372161865234375, 0.01549530029296875, 0.020618438720703125, 0.0257415771484375, 0.030864715576171875, 0.03598785400390625, 0.041110992431640625, 0.046234130859375, 0.051357269287109375, 0.05648040771484375, 0.061603546142578125, 0.0667266845703125, 0.07184982299804688, 0.07697296142578125, 0.08209609985351562, 0.08721923828125, 0.09234237670898438, 0.09746551513671875, 0.10258865356445312, 0.1077117919921875, 0.11283493041992188, 0.11795806884765625, 0.12308120727539062, 0.128204345703125, 0.13332748413085938, 0.13845062255859375, 0.14357376098632812, 0.1486968994140625, 0.15382003784179688, 0.15894317626953125, 0.16406631469726562, 0.169189453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 13.0, 18.0, 26.0, 45.0, 60.0, 92.0, 176.0, 278.0, 524.0, 1031.0, 2368.0, 6036.0, 20288.0, 121087.0, 670870.0, 186366.0, 26567.0, 7341.0, 2769.0, 1215.0, 570.0, 308.0, 182.0, 100.0, 65.0, 37.0, 30.0, 26.0, 11.0, 10.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10418701171875, -0.10117530822753906, -0.09816360473632812, -0.09515190124511719, -0.09214019775390625, -0.08912849426269531, -0.08611679077148438, -0.08310508728027344, -0.0800933837890625, -0.07708168029785156, -0.07406997680664062, -0.07105827331542969, -0.06804656982421875, -0.06503486633300781, -0.062023162841796875, -0.05901145935058594, -0.055999755859375, -0.05298805236816406, -0.049976348876953125, -0.04696464538574219, -0.04395294189453125, -0.04094123840332031, -0.037929534912109375, -0.03491783142089844, -0.0319061279296875, -0.028894424438476562, -0.025882720947265625, -0.022871017456054688, -0.01985931396484375, -0.016847610473632812, -0.013835906982421875, -0.010824203491210938, -0.0078125, -0.0048007965087890625, -0.001789093017578125, 0.0012226104736328125, 0.00423431396484375, 0.0072460174560546875, 0.010257720947265625, 0.013269424438476562, 0.0162811279296875, 0.019292831420898438, 0.022304534912109375, 0.025316238403320312, 0.02832794189453125, 0.03133964538574219, 0.034351348876953125, 0.03736305236816406, 0.040374755859375, 0.04338645935058594, 0.046398162841796875, 0.04940986633300781, 0.05242156982421875, 0.05543327331542969, 0.058444976806640625, 0.06145668029785156, 0.0644683837890625, 0.06748008728027344, 0.07049179077148438, 0.07350349426269531, 0.07651519775390625, 0.07952690124511719, 0.08253860473632812, 0.08555030822753906, 0.08856201171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 8.0, 18.0, 23.0, 37.0, 41.0, 42.0, 57.0, 73.0, 92.0, 94.0, 63.0, 91.0, 68.0, 64.0, 65.0, 40.0, 31.0, 18.0, 18.0, 12.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6193599700927734e-05, -4.4547952711582184e-05, -4.290230572223663e-05, -4.125665873289108e-05, -3.961101174354553e-05, -3.796536475419998e-05, -3.631971776485443e-05, -3.467407077550888e-05, -3.302842378616333e-05, -3.138277679681778e-05, -2.973712980747223e-05, -2.809148281812668e-05, -2.6445835828781128e-05, -2.4800188839435577e-05, -2.3154541850090027e-05, -2.1508894860744476e-05, -1.9863247871398926e-05, -1.8217600882053375e-05, -1.6571953892707825e-05, -1.4926306903362274e-05, -1.3280659914016724e-05, -1.1635012924671173e-05, -9.989365935325623e-06, -8.343718945980072e-06, -6.6980719566345215e-06, -5.052424967288971e-06, -3.4067779779434204e-06, -1.7611309885978699e-06, -1.1548399925231934e-07, 1.5301629900932312e-06, 3.1758099794387817e-06, 4.821456968784332e-06, 6.467103958129883e-06, 8.112750947475433e-06, 9.758397936820984e-06, 1.1404044926166534e-05, 1.3049691915512085e-05, 1.4695338904857635e-05, 1.6340985894203186e-05, 1.7986632883548737e-05, 1.9632279872894287e-05, 2.1277926862239838e-05, 2.2923573851585388e-05, 2.456922084093094e-05, 2.621486783027649e-05, 2.786051481962204e-05, 2.950616180896759e-05, 3.115180879831314e-05, 3.279745578765869e-05, 3.444310277700424e-05, 3.608874976634979e-05, 3.773439675569534e-05, 3.9380043745040894e-05, 4.1025690734386444e-05, 4.2671337723731995e-05, 4.4316984713077545e-05, 4.5962631702423096e-05, 4.7608278691768646e-05, 4.92539256811142e-05, 5.089957267045975e-05, 5.25452196598053e-05, 5.419086664915085e-05, 5.58365136384964e-05, 5.748216062784195e-05, 5.91278076171875e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 7.0, 7.0, 7.0, 30.0, 14.0, 35.0, 42.0, 67.0, 100.0, 143.0, 239.0, 396.0, 784.0, 1393.0, 3005.0, 7153.0, 19552.0, 67939.0, 306136.0, 468567.0, 123479.0, 30644.0, 10244.0, 4262.0, 1939.0, 985.0, 517.0, 353.0, 180.0, 112.0, 77.0, 35.0, 30.0, 26.0, 18.0, 10.0, 9.0, 5.0, 8.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06182861328125, -0.05963611602783203, -0.05744361877441406, -0.055251121520996094, -0.053058624267578125, -0.050866127014160156, -0.04867362976074219, -0.04648113250732422, -0.04428863525390625, -0.04209613800048828, -0.03990364074707031, -0.037711143493652344, -0.035518646240234375, -0.033326148986816406, -0.031133651733398438, -0.02894115447998047, -0.0267486572265625, -0.02455615997314453, -0.022363662719726562, -0.020171165466308594, -0.017978668212890625, -0.015786170959472656, -0.013593673706054688, -0.011401176452636719, -0.00920867919921875, -0.007016181945800781, -0.0048236846923828125, -0.0026311874389648438, -0.000438690185546875, 0.0017538070678710938, 0.0039463043212890625, 0.006138801574707031, 0.008331298828125, 0.010523796081542969, 0.012716293334960938, 0.014908790588378906, 0.017101287841796875, 0.019293785095214844, 0.021486282348632812, 0.02367877960205078, 0.02587127685546875, 0.02806377410888672, 0.030256271362304688, 0.032448768615722656, 0.034641265869140625, 0.036833763122558594, 0.03902626037597656, 0.04121875762939453, 0.0434112548828125, 0.04560375213623047, 0.04779624938964844, 0.049988746643066406, 0.052181243896484375, 0.054373741149902344, 0.05656623840332031, 0.05875873565673828, 0.06095123291015625, 0.06314373016357422, 0.06533622741699219, 0.06752872467041016, 0.06972122192382812, 0.0719137191772461, 0.07410621643066406, 0.07629871368408203, 0.0784912109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 7.0, 10.0, 10.0, 20.0, 24.0, 39.0, 44.0, 51.0, 65.0, 84.0, 81.0, 63.0, 99.0, 73.0, 75.0, 58.0, 44.0, 25.0, 31.0, 18.0, 15.0, 13.0, 9.0, 7.0, 10.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1080322265625, -0.10537195205688477, -0.10271167755126953, -0.1000514030456543, -0.09739112854003906, -0.09473085403442383, -0.0920705795288086, -0.08941030502319336, -0.08675003051757812, -0.08408975601196289, -0.08142948150634766, -0.07876920700073242, -0.07610893249511719, -0.07344865798950195, -0.07078838348388672, -0.06812810897827148, -0.06546783447265625, -0.06280755996704102, -0.06014728546142578, -0.05748701095581055, -0.05482673645019531, -0.05216646194458008, -0.049506187438964844, -0.04684591293334961, -0.044185638427734375, -0.04152536392211914, -0.038865089416503906, -0.03620481491088867, -0.03354454040527344, -0.030884265899658203, -0.02822399139404297, -0.025563716888427734, -0.0229034423828125, -0.020243167877197266, -0.01758289337158203, -0.014922618865966797, -0.012262344360351562, -0.009602069854736328, -0.006941795349121094, -0.004281520843505859, -0.001621246337890625, 0.0010390281677246094, 0.0036993026733398438, 0.006359577178955078, 0.009019851684570312, 0.011680126190185547, 0.014340400695800781, 0.017000675201416016, 0.01966094970703125, 0.022321224212646484, 0.02498149871826172, 0.027641773223876953, 0.030302047729492188, 0.03296232223510742, 0.035622596740722656, 0.03828287124633789, 0.040943145751953125, 0.04360342025756836, 0.046263694763183594, 0.04892396926879883, 0.05158424377441406, 0.0542445182800293, 0.05690479278564453, 0.059565067291259766, 0.062225341796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 29.0, 75.0, 422.0, 380.0, 65.0, 17.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7165491580963135, -1.6089847087860107, -1.501420259475708, -1.3938559293746948, -1.286291480064392, -1.1787270307540894, -1.0711627006530762, -0.9635982513427734, -0.8560338020324707, -0.748469352722168, -0.64090496301651, -0.533340573310852, -0.4257761240005493, -0.3182116746902466, -0.21064728498458862, -0.10308289527893066, 0.00448155403137207, 0.11204597353935242, 0.21961039304733276, 0.3271748125553131, 0.43473923206329346, 0.5423036813735962, 0.6498680710792542, 0.7574324607849121, 0.8649969100952148, 0.9725613594055176, 1.0801258087158203, 1.1876901388168335, 1.2952545881271362, 1.402819037437439, 1.5103833675384521, 1.6179478168487549, 1.7255125045776367, 1.8330769538879395, 1.9406414031982422, 2.048205852508545, 2.1557703018188477, 2.2633347511291504, 2.370898962020874, 2.4784634113311768, 2.5860278606414795, 2.6935923099517822, 2.801156759262085, 2.9087212085723877, 3.0162854194641113, 3.123849868774414, 3.231414318084717, 3.3389787673950195, 3.4465432167053223, 3.554107666015625, 3.6616721153259277, 3.7692365646362305, 3.876801013946533, 3.984365463256836, 4.091929912567139, 4.199494361877441, 4.307058334350586, 4.414622783660889, 4.522187232971191, 4.629751682281494, 4.737316131591797, 4.8448805809021, 4.952445030212402, 5.060009002685547, 5.167573928833008]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 6.0, 5.0, 8.0, 4.0, 13.0, 18.0, 30.0, 62.0, 106.0, 143.0, 163.0, 145.0, 106.0, 69.0, 32.0, 19.0, 9.0, 13.0, 4.0, 6.0, 6.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9579219818115234, -2.851120710372925, -2.744319438934326, -2.6375181674957275, -2.530716896057129, -2.4239156246185303, -2.3171143531799316, -2.210313320159912, -2.1035118103027344, -1.9967105388641357, -1.889909267425537, -1.7831079959869385, -1.6763067245483398, -1.5695054531097412, -1.4627043008804321, -1.3559030294418335, -1.2491018772125244, -1.1423006057739258, -1.0354993343353271, -0.9286981225013733, -0.8218968510627747, -0.715095579624176, -0.6082943677902222, -0.5014930963516235, -0.3946918249130249, -0.28789055347442627, -0.18108931183815002, -0.07428807020187378, 0.032513201236724854, 0.1393144726753235, 0.24611568450927734, 0.352916955947876, 0.4597184658050537, 0.5665197372436523, 0.673321008682251, 0.7801222205162048, 0.8869234919548035, 0.9937247633934021, 1.100525975227356, 1.2073272466659546, 1.3141285181045532, 1.4209297895431519, 1.5277310609817505, 1.6345322132110596, 1.7413334846496582, 1.8481347560882568, 1.9549360275268555, 2.061737298965454, 2.1685385704040527, 2.2753398418426514, 2.38214111328125, 2.4889423847198486, 2.5957436561584473, 2.702544927597046, 2.8093461990356445, 2.916147232055664, 3.022948741912842, 3.1297500133514404, 3.236551284790039, 3.3433525562286377, 3.4501538276672363, 3.556955099105835, 3.6637563705444336, 3.770557403564453, 3.8773586750030518]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 13.0, 25.0, 11.0, 27.0, 44.0, 75.0, 131.0, 210.0, 348.0, 630.0, 1148.0, 2108.0, 4630.0, 11633.0, 36517.0, 237185.0, 3702418.0, 147026.0, 30372.0, 10406.0, 4423.0, 2157.0, 1123.0, 673.0, 388.0, 204.0, 111.0, 88.0, 45.0, 27.0, 32.0, 12.0, 10.0, 7.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.383544921875, -0.37133026123046875, -0.3591156005859375, -0.34690093994140625, -0.334686279296875, -0.32247161865234375, -0.3102569580078125, -0.29804229736328125, -0.28582763671875, -0.27361297607421875, -0.2613983154296875, -0.24918365478515625, -0.236968994140625, -0.22475433349609375, -0.2125396728515625, -0.20032501220703125, -0.1881103515625, -0.17589569091796875, -0.1636810302734375, -0.15146636962890625, -0.139251708984375, -0.12703704833984375, -0.1148223876953125, -0.10260772705078125, -0.09039306640625, -0.07817840576171875, -0.0659637451171875, -0.05374908447265625, -0.041534423828125, -0.02931976318359375, -0.0171051025390625, -0.00489044189453125, 0.00732421875, 0.01953887939453125, 0.0317535400390625, 0.04396820068359375, 0.056182861328125, 0.06839752197265625, 0.0806121826171875, 0.09282684326171875, 0.10504150390625, 0.11725616455078125, 0.1294708251953125, 0.14168548583984375, 0.153900146484375, 0.16611480712890625, 0.1783294677734375, 0.19054412841796875, 0.2027587890625, 0.21497344970703125, 0.2271881103515625, 0.23940277099609375, 0.251617431640625, 0.26383209228515625, 0.2760467529296875, 0.28826141357421875, 0.30047607421875, 0.31269073486328125, 0.3249053955078125, 0.33712005615234375, 0.349334716796875, 0.36154937744140625, 0.3737640380859375, 0.38597869873046875, 0.398193359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 8.0, 11.0, 7.0, 13.0, 12.0, 17.0, 19.0, 23.0, 31.0, 45.0, 73.0, 89.0, 181.0, 138.0, 75.0, 54.0, 36.0, 26.0, 32.0, 14.0, 16.0, 15.0, 16.0, 5.0, 8.0, 10.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.045745849609375, -0.04431343078613281, -0.042881011962890625, -0.04144859313964844, -0.04001617431640625, -0.03858375549316406, -0.037151336669921875, -0.03571891784667969, -0.0342864990234375, -0.03285408020019531, -0.031421661376953125, -0.029989242553710938, -0.02855682373046875, -0.027124404907226562, -0.025691986083984375, -0.024259567260742188, -0.0228271484375, -0.021394729614257812, -0.019962310791015625, -0.018529891967773438, -0.01709747314453125, -0.015665054321289062, -0.014232635498046875, -0.012800216674804688, -0.0113677978515625, -0.009935379028320312, -0.008502960205078125, -0.0070705413818359375, -0.00563812255859375, -0.0042057037353515625, -0.002773284912109375, -0.0013408660888671875, 9.1552734375e-05, 0.0015239715576171875, 0.002956390380859375, 0.0043888092041015625, 0.00582122802734375, 0.0072536468505859375, 0.008686065673828125, 0.010118484497070312, 0.0115509033203125, 0.012983322143554688, 0.014415740966796875, 0.015848159790039062, 0.01728057861328125, 0.018712997436523438, 0.020145416259765625, 0.021577835083007812, 0.02301025390625, 0.024442672729492188, 0.025875091552734375, 0.027307510375976562, 0.02873992919921875, 0.030172348022460938, 0.031604766845703125, 0.03303718566894531, 0.0344696044921875, 0.03590202331542969, 0.037334442138671875, 0.03876686096191406, 0.04019927978515625, 0.04163169860839844, 0.043064117431640625, 0.04449653625488281, 0.045928955078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 9.0, 11.0, 15.0, 17.0, 24.0, 36.0, 51.0, 72.0, 121.0, 231.0, 441.0, 909.0, 2056.0, 5031.0, 15985.0, 66275.0, 556714.0, 3249499.0, 240684.0, 38746.0, 10647.0, 3668.0, 1553.0, 677.0, 345.0, 155.0, 114.0, 68.0, 39.0, 21.0, 19.0, 18.0, 8.0, 10.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.27099609375, -0.2626152038574219, -0.25423431396484375, -0.24585342407226562, -0.2374725341796875, -0.22909164428710938, -0.22071075439453125, -0.21232986450195312, -0.203948974609375, -0.19556808471679688, -0.18718719482421875, -0.17880630493164062, -0.1704254150390625, -0.16204452514648438, -0.15366363525390625, -0.14528274536132812, -0.13690185546875, -0.12852096557617188, -0.12014007568359375, -0.11175918579101562, -0.1033782958984375, -0.09499740600585938, -0.08661651611328125, -0.07823562622070312, -0.069854736328125, -0.061473846435546875, -0.05309295654296875, -0.044712066650390625, -0.0363311767578125, -0.027950286865234375, -0.01956939697265625, -0.011188507080078125, -0.0028076171875, 0.005573272705078125, 0.01395416259765625, 0.022335052490234375, 0.0307159423828125, 0.039096832275390625, 0.04747772216796875, 0.055858612060546875, 0.064239501953125, 0.07262039184570312, 0.08100128173828125, 0.08938217163085938, 0.0977630615234375, 0.10614395141601562, 0.11452484130859375, 0.12290573120117188, 0.13128662109375, 0.13966751098632812, 0.14804840087890625, 0.15642929077148438, 0.1648101806640625, 0.17319107055664062, 0.18157196044921875, 0.18995285034179688, 0.198333740234375, 0.20671463012695312, 0.21509552001953125, 0.22347640991210938, 0.2318572998046875, 0.24023818969726562, 0.24861907958984375, 0.2569999694824219, 0.265380859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 5.0, 6.0, 11.0, 10.0, 18.0, 31.0, 56.0, 84.0, 109.0, 193.0, 368.0, 773.0, 1320.0, 481.0, 237.0, 118.0, 74.0, 46.0, 26.0, 18.0, 20.0, 12.0, 13.0, 2.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.057159423828125, -0.05538225173950195, -0.053605079650878906, -0.05182790756225586, -0.05005073547363281, -0.048273563385009766, -0.04649639129638672, -0.04471921920776367, -0.042942047119140625, -0.04116487503051758, -0.03938770294189453, -0.037610530853271484, -0.03583335876464844, -0.03405618667602539, -0.032279014587402344, -0.030501842498779297, -0.02872467041015625, -0.026947498321533203, -0.025170326232910156, -0.02339315414428711, -0.021615982055664062, -0.019838809967041016, -0.01806163787841797, -0.016284465789794922, -0.014507293701171875, -0.012730121612548828, -0.010952949523925781, -0.009175777435302734, -0.0073986053466796875, -0.005621433258056641, -0.0038442611694335938, -0.002067089080810547, -0.0002899169921875, 0.0014872550964355469, 0.0032644271850585938, 0.005041599273681641, 0.0068187713623046875, 0.008595943450927734, 0.010373115539550781, 0.012150287628173828, 0.013927459716796875, 0.015704631805419922, 0.01748180389404297, 0.019258975982666016, 0.021036148071289062, 0.02281332015991211, 0.024590492248535156, 0.026367664337158203, 0.02814483642578125, 0.029922008514404297, 0.031699180603027344, 0.03347635269165039, 0.03525352478027344, 0.037030696868896484, 0.03880786895751953, 0.04058504104614258, 0.042362213134765625, 0.04413938522338867, 0.04591655731201172, 0.047693729400634766, 0.04947090148925781, 0.05124807357788086, 0.053025245666503906, 0.05480241775512695, 0.05657958984375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 9.0, 9.0, 22.0, 70.0, 187.0, 332.0, 258.0, 76.0, 29.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2700851559638977, -0.25392162799835205, -0.2377581149339676, -0.22159460186958313, -0.20543107390403748, -0.18926754593849182, -0.17310403287410736, -0.1569405198097229, -0.14077699184417725, -0.12461347132921219, -0.10844995081424713, -0.09228643029928207, -0.07612290978431702, -0.05995938926935196, -0.0437958687543869, -0.027632348239421844, -0.011468827724456787, 0.00469469279050827, 0.020858213305473328, 0.037021733820438385, 0.05318525433540344, 0.0693487748503685, 0.08551229536533356, 0.10167581588029861, 0.11783933639526367, 0.13400286436080933, 0.1501663774251938, 0.16632989048957825, 0.1824934184551239, 0.19865694642066956, 0.21482045948505402, 0.23098397254943848, 0.2471475601196289, 0.26331108808517456, 0.2794746160507202, 0.2956381142139435, 0.31180164217948914, 0.3279651701450348, 0.34412866830825806, 0.3602921962738037, 0.37645572423934937, 0.392619252204895, 0.4087827801704407, 0.42494627833366394, 0.4411098062992096, 0.45727333426475525, 0.4734368324279785, 0.48960036039352417, 0.5057638883590698, 0.5219274163246155, 0.5380909442901611, 0.5542544722557068, 0.5704180002212524, 0.5865814685821533, 0.602744996547699, 0.6189085245132446, 0.6350720524787903, 0.6512355804443359, 0.6673991084098816, 0.6835626363754272, 0.6997261047363281, 0.7158896327018738, 0.7320531606674194, 0.7482166886329651, 0.7643802165985107]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 12.0, 7.0, 16.0, 22.0, 25.0, 20.0, 58.0, 66.0, 69.0, 70.0, 73.0, 104.0, 79.0, 74.0, 70.0, 57.0, 33.0, 33.0, 21.0, 13.0, 11.0, 15.0, 3.0, 6.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.30907267332077026, -0.30069243907928467, -0.2923122048377991, -0.2839319407939911, -0.2755517065525055, -0.2671714723110199, -0.2587912380695343, -0.2504109740257263, -0.24203073978424072, -0.23365050554275513, -0.22527025640010834, -0.21689002215862274, -0.20850977301597595, -0.20012953877449036, -0.19174930453300476, -0.18336905539035797, -0.17498882114887238, -0.16660858690738678, -0.15822833776474, -0.1498481035232544, -0.1414678543806076, -0.133087620139122, -0.12470737844705582, -0.11632713675498962, -0.10794689506292343, -0.09956665337085724, -0.09118641167879105, -0.08280616998672485, -0.07442593574523926, -0.06604568660259247, -0.05766545236110687, -0.04928521066904068, -0.04090496897697449, -0.032524727284908295, -0.02414448745548725, -0.015764247626066208, -0.007384005934000015, 0.0009962357580661774, 0.009376473724842072, 0.017756715416908264, 0.026136957108974457, 0.03451719880104065, 0.04289744049310684, 0.051277678459882736, 0.05965792015194893, 0.06803816556930542, 0.07641839981079102, 0.08479864150285721, 0.0931788831949234, 0.1015591248869896, 0.10993936657905579, 0.11831960082054138, 0.12669984996318817, 0.13508008420467377, 0.14346033334732056, 0.15184056758880615, 0.16022080183029175, 0.16860103607177734, 0.17698128521442413, 0.18536151945590973, 0.19374176859855652, 0.20212200284004211, 0.2105022370815277, 0.2188824862241745, 0.2272627353668213]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 1.0, 3.0, 1.0, 5.0, 8.0, 23.0, 17.0, 24.0, 39.0, 55.0, 78.0, 149.0, 219.0, 305.0, 511.0, 895.0, 1635.0, 3045.0, 6174.0, 13751.0, 34325.0, 108008.0, 545376.0, 237159.0, 57266.0, 21087.0, 8982.0, 4302.0, 2155.0, 1122.0, 677.0, 425.0, 269.0, 154.0, 98.0, 74.0, 46.0, 29.0, 18.0, 11.0, 14.0, 6.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.218017578125, -0.21135902404785156, -0.20470046997070312, -0.1980419158935547, -0.19138336181640625, -0.1847248077392578, -0.17806625366210938, -0.17140769958496094, -0.1647491455078125, -0.15809059143066406, -0.15143203735351562, -0.1447734832763672, -0.13811492919921875, -0.1314563751220703, -0.12479782104492188, -0.11813926696777344, -0.111480712890625, -0.10482215881347656, -0.09816360473632812, -0.09150505065917969, -0.08484649658203125, -0.07818794250488281, -0.07152938842773438, -0.06487083435058594, -0.0582122802734375, -0.05155372619628906, -0.044895172119140625, -0.03823661804199219, -0.03157806396484375, -0.024919509887695312, -0.018260955810546875, -0.011602401733398438, -0.00494384765625, 0.0017147064208984375, 0.008373260498046875, 0.015031814575195312, 0.02169036865234375, 0.028348922729492188, 0.035007476806640625, 0.04166603088378906, 0.0483245849609375, 0.05498313903808594, 0.061641693115234375, 0.06830024719238281, 0.07495880126953125, 0.08161735534667969, 0.08827590942382812, 0.09493446350097656, 0.101593017578125, 0.10825157165527344, 0.11491012573242188, 0.12156867980957031, 0.12822723388671875, 0.1348857879638672, 0.14154434204101562, 0.14820289611816406, 0.1548614501953125, 0.16152000427246094, 0.16817855834960938, 0.1748371124267578, 0.18149566650390625, 0.1881542205810547, 0.19481277465820312, 0.20147132873535156, 0.2081298828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 3.0, 10.0, 8.0, 14.0, 13.0, 19.0, 24.0, 27.0, 36.0, 34.0, 66.0, 125.0, 136.0, 132.0, 79.0, 62.0, 47.0, 29.0, 27.0, 19.0, 19.0, 14.0, 9.0, 13.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.046875, -0.045491695404052734, -0.04410839080810547, -0.0427250862121582, -0.04134178161621094, -0.03995847702026367, -0.038575172424316406, -0.03719186782836914, -0.035808563232421875, -0.03442525863647461, -0.033041954040527344, -0.03165864944458008, -0.030275344848632812, -0.028892040252685547, -0.02750873565673828, -0.026125431060791016, -0.02474212646484375, -0.023358821868896484, -0.02197551727294922, -0.020592212677001953, -0.019208908081054688, -0.017825603485107422, -0.016442298889160156, -0.01505899429321289, -0.013675689697265625, -0.01229238510131836, -0.010909080505371094, -0.009525775909423828, -0.008142471313476562, -0.006759166717529297, -0.005375862121582031, -0.003992557525634766, -0.0026092529296875, -0.0012259483337402344, 0.00015735626220703125, 0.0015406608581542969, 0.0029239654541015625, 0.004307270050048828, 0.005690574645996094, 0.007073879241943359, 0.008457183837890625, 0.00984048843383789, 0.011223793029785156, 0.012607097625732422, 0.013990402221679688, 0.015373706817626953, 0.01675701141357422, 0.018140316009521484, 0.01952362060546875, 0.020906925201416016, 0.02229022979736328, 0.023673534393310547, 0.025056838989257812, 0.026440143585205078, 0.027823448181152344, 0.02920675277709961, 0.030590057373046875, 0.03197336196899414, 0.033356666564941406, 0.03473997116088867, 0.03612327575683594, 0.0375065803527832, 0.03888988494873047, 0.040273189544677734, 0.041656494140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 4.0, 10.0, 19.0, 15.0, 20.0, 36.0, 42.0, 52.0, 74.0, 99.0, 146.0, 228.0, 405.0, 665.0, 1351.0, 2605.0, 5702.0, 13291.0, 39251.0, 159457.0, 523136.0, 219890.0, 51979.0, 16821.0, 6748.0, 2927.0, 1469.0, 769.0, 485.0, 278.0, 173.0, 124.0, 72.0, 51.0, 35.0, 33.0, 15.0, 23.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1353759765625, -0.1312236785888672, -0.12707138061523438, -0.12291908264160156, -0.11876678466796875, -0.11461448669433594, -0.11046218872070312, -0.10630989074707031, -0.1021575927734375, -0.09800529479980469, -0.09385299682617188, -0.08970069885253906, -0.08554840087890625, -0.08139610290527344, -0.07724380493164062, -0.07309150695800781, -0.068939208984375, -0.06478691101074219, -0.060634613037109375, -0.05648231506347656, -0.05233001708984375, -0.04817771911621094, -0.044025421142578125, -0.03987312316894531, -0.0357208251953125, -0.03156852722167969, -0.027416229248046875, -0.023263931274414062, -0.01911163330078125, -0.014959335327148438, -0.010807037353515625, -0.0066547393798828125, -0.00250244140625, 0.0016498565673828125, 0.005802154541015625, 0.009954452514648438, 0.01410675048828125, 0.018259048461914062, 0.022411346435546875, 0.026563644409179688, 0.0307159423828125, 0.03486824035644531, 0.039020538330078125, 0.04317283630371094, 0.04732513427734375, 0.05147743225097656, 0.055629730224609375, 0.05978202819824219, 0.063934326171875, 0.06808662414550781, 0.07223892211914062, 0.07639122009277344, 0.08054351806640625, 0.08469581604003906, 0.08884811401367188, 0.09300041198730469, 0.0971527099609375, 0.10130500793457031, 0.10545730590820312, 0.10960960388183594, 0.11376190185546875, 0.11791419982910156, 0.12206649780273438, 0.1262187957763672, 0.13037109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 7.0, 8.0, 11.0, 7.0, 16.0, 15.0, 12.0, 18.0, 20.0, 38.0, 30.0, 26.0, 51.0, 34.0, 43.0, 45.0, 55.0, 39.0, 56.0, 43.0, 34.0, 49.0, 41.0, 46.0, 23.0, 31.0, 29.0, 26.0, 20.0, 21.0, 26.0, 15.0, 12.0, 12.0, 5.0, 11.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1298828125, -0.12584877014160156, -0.12181472778320312, -0.11778068542480469, -0.11374664306640625, -0.10971260070800781, -0.10567855834960938, -0.10164451599121094, -0.0976104736328125, -0.09357643127441406, -0.08954238891601562, -0.08550834655761719, -0.08147430419921875, -0.07744026184082031, -0.07340621948242188, -0.06937217712402344, -0.065338134765625, -0.06130409240722656, -0.057270050048828125, -0.05323600769042969, -0.04920196533203125, -0.04516792297363281, -0.041133880615234375, -0.03709983825683594, -0.0330657958984375, -0.029031753540039062, -0.024997711181640625, -0.020963668823242188, -0.01692962646484375, -0.012895584106445312, -0.008861541748046875, -0.0048274993896484375, -0.00079345703125, 0.0032405853271484375, 0.007274627685546875, 0.011308670043945312, 0.01534271240234375, 0.019376754760742188, 0.023410797119140625, 0.027444839477539062, 0.0314788818359375, 0.03551292419433594, 0.039546966552734375, 0.04358100891113281, 0.04761505126953125, 0.05164909362792969, 0.055683135986328125, 0.05971717834472656, 0.063751220703125, 0.06778526306152344, 0.07181930541992188, 0.07585334777832031, 0.07988739013671875, 0.08392143249511719, 0.08795547485351562, 0.09198951721191406, 0.0960235595703125, 0.10005760192871094, 0.10409164428710938, 0.10812568664550781, 0.11215972900390625, 0.11619377136230469, 0.12022781372070312, 0.12426185607910156, 0.1282958984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 13.0, 12.0, 27.0, 32.0, 65.0, 96.0, 157.0, 286.0, 512.0, 1155.0, 2701.0, 8122.0, 34641.0, 273251.0, 615854.0, 87862.0, 15842.0, 4549.0, 1627.0, 792.0, 396.0, 210.0, 120.0, 67.0, 44.0, 26.0, 28.0, 19.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.205078125, -0.19890975952148438, -0.19274139404296875, -0.18657302856445312, -0.1804046630859375, -0.17423629760742188, -0.16806793212890625, -0.16189956665039062, -0.155731201171875, -0.14956283569335938, -0.14339447021484375, -0.13722610473632812, -0.1310577392578125, -0.12488937377929688, -0.11872100830078125, -0.11255264282226562, -0.10638427734375, -0.10021591186523438, -0.09404754638671875, -0.08787918090820312, -0.0817108154296875, -0.07554244995117188, -0.06937408447265625, -0.06320571899414062, -0.057037353515625, -0.050868988037109375, -0.04470062255859375, -0.038532257080078125, -0.0323638916015625, -0.026195526123046875, -0.02002716064453125, -0.013858795166015625, -0.0076904296875, -0.001522064208984375, 0.00464630126953125, 0.010814666748046875, 0.0169830322265625, 0.023151397705078125, 0.02931976318359375, 0.035488128662109375, 0.041656494140625, 0.047824859619140625, 0.05399322509765625, 0.060161590576171875, 0.0663299560546875, 0.07249832153320312, 0.07866668701171875, 0.08483505249023438, 0.09100341796875, 0.09717178344726562, 0.10334014892578125, 0.10950851440429688, 0.1156768798828125, 0.12184524536132812, 0.12801361083984375, 0.13418197631835938, 0.140350341796875, 0.14651870727539062, 0.15268707275390625, 0.15885543823242188, 0.1650238037109375, 0.17119216918945312, 0.17736053466796875, 0.18352890014648438, 0.189697265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 12.0, 13.0, 19.0, 27.0, 30.0, 35.0, 60.0, 80.0, 127.0, 100.0, 102.0, 108.0, 86.0, 56.0, 43.0, 30.0, 23.0, 9.0, 12.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013375282287597656, -0.00013048294931650162, -0.00012721307575702667, -0.00012394320219755173, -0.00012067332863807678, -0.00011740345507860184, -0.00011413358151912689, -0.00011086370795965195, -0.000107593834400177, -0.00010432396084070206, -0.00010105408728122711, -9.778421372175217e-05, -9.451434016227722e-05, -9.124446660280228e-05, -8.797459304332733e-05, -8.470471948385239e-05, -8.143484592437744e-05, -7.81649723649025e-05, -7.489509880542755e-05, -7.16252252459526e-05, -6.835535168647766e-05, -6.508547812700272e-05, -6.181560456752777e-05, -5.8545731008052826e-05, -5.527585744857788e-05, -5.2005983889102936e-05, -4.873611032962799e-05, -4.5466236770153046e-05, -4.21963632106781e-05, -3.8926489651203156e-05, -3.565661609172821e-05, -3.2386742532253265e-05, -2.911686897277832e-05, -2.5846995413303375e-05, -2.257712185382843e-05, -1.9307248294353485e-05, -1.603737473487854e-05, -1.2767501175403595e-05, -9.49762761592865e-06, -6.227754056453705e-06, -2.9578804969787598e-06, 3.119930624961853e-07, 3.5818666219711304e-06, 6.8517401814460754e-06, 1.012161374092102e-05, 1.3391487300395966e-05, 1.666136085987091e-05, 1.9931234419345856e-05, 2.32011079788208e-05, 2.6470981538295746e-05, 2.974085509777069e-05, 3.3010728657245636e-05, 3.628060221672058e-05, 3.9550475776195526e-05, 4.282034933567047e-05, 4.6090222895145416e-05, 4.936009645462036e-05, 5.2629970014095306e-05, 5.589984357357025e-05, 5.9169717133045197e-05, 6.243959069252014e-05, 6.570946425199509e-05, 6.897933781147003e-05, 7.224921137094498e-05, 7.551908493041992e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 13.0, 12.0, 19.0, 27.0, 38.0, 73.0, 91.0, 158.0, 228.0, 465.0, 734.0, 1498.0, 3050.0, 6882.0, 18062.0, 58498.0, 226616.0, 459290.0, 192940.0, 51433.0, 16265.0, 6285.0, 2783.0, 1339.0, 722.0, 390.0, 216.0, 136.0, 69.0, 67.0, 36.0, 32.0, 17.0, 11.0, 11.0, 7.0, 9.0, 2.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.131103515625, -0.12750530242919922, -0.12390708923339844, -0.12030887603759766, -0.11671066284179688, -0.1131124496459961, -0.10951423645019531, -0.10591602325439453, -0.10231781005859375, -0.09871959686279297, -0.09512138366699219, -0.0915231704711914, -0.08792495727539062, -0.08432674407958984, -0.08072853088378906, -0.07713031768798828, -0.0735321044921875, -0.06993389129638672, -0.06633567810058594, -0.06273746490478516, -0.059139251708984375, -0.055541038513183594, -0.05194282531738281, -0.04834461212158203, -0.04474639892578125, -0.04114818572998047, -0.03754997253417969, -0.033951759338378906, -0.030353546142578125, -0.026755332946777344, -0.023157119750976562, -0.01955890655517578, -0.015960693359375, -0.012362480163574219, -0.008764266967773438, -0.005166053771972656, -0.001567840576171875, 0.0020303726196289062, 0.0056285858154296875, 0.009226799011230469, 0.01282501220703125, 0.01642322540283203, 0.020021438598632812, 0.023619651794433594, 0.027217864990234375, 0.030816078186035156, 0.03441429138183594, 0.03801250457763672, 0.0416107177734375, 0.04520893096923828, 0.04880714416503906, 0.052405357360839844, 0.056003570556640625, 0.059601783752441406, 0.06319999694824219, 0.06679821014404297, 0.07039642333984375, 0.07399463653564453, 0.07759284973144531, 0.0811910629272461, 0.08478927612304688, 0.08838748931884766, 0.09198570251464844, 0.09558391571044922, 0.09918212890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 7.0, 8.0, 9.0, 18.0, 15.0, 12.0, 19.0, 29.0, 29.0, 62.0, 56.0, 68.0, 59.0, 69.0, 80.0, 72.0, 69.0, 57.0, 42.0, 39.0, 30.0, 34.0, 20.0, 20.0, 16.0, 8.0, 15.0, 6.0, 4.0, 8.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.09743309020996094, -0.09440231323242188, -0.09137153625488281, -0.08834075927734375, -0.08530998229980469, -0.08227920532226562, -0.07924842834472656, -0.0762176513671875, -0.07318687438964844, -0.07015609741210938, -0.06712532043457031, -0.06409454345703125, -0.06106376647949219, -0.058032989501953125, -0.05500221252441406, -0.051971435546875, -0.04894065856933594, -0.045909881591796875, -0.04287910461425781, -0.03984832763671875, -0.03681755065917969, -0.033786773681640625, -0.030755996704101562, -0.0277252197265625, -0.024694442749023438, -0.021663665771484375, -0.018632888793945312, -0.01560211181640625, -0.012571334838867188, -0.009540557861328125, -0.0065097808837890625, -0.00347900390625, -0.0004482269287109375, 0.002582550048828125, 0.0056133270263671875, 0.00864410400390625, 0.011674880981445312, 0.014705657958984375, 0.017736434936523438, 0.0207672119140625, 0.023797988891601562, 0.026828765869140625, 0.029859542846679688, 0.03289031982421875, 0.03592109680175781, 0.038951873779296875, 0.04198265075683594, 0.045013427734375, 0.04804420471191406, 0.051074981689453125, 0.05410575866699219, 0.05713653564453125, 0.06016731262207031, 0.06319808959960938, 0.06622886657714844, 0.0692596435546875, 0.07229042053222656, 0.07532119750976562, 0.07835197448730469, 0.08138275146484375, 0.08441352844238281, 0.08744430541992188, 0.09047508239746094, 0.093505859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 9.0, 28.0, 57.0, 146.0, 232.0, 251.0, 145.0, 65.0, 29.0, 16.0, 8.0, 3.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.541589379310608, -1.4990280866622925, -1.4564666748046875, -1.413905382156372, -1.3713440895080566, -1.3287826776504517, -1.2862213850021362, -1.2436599731445312, -1.2010986804962158, -1.1585373878479004, -1.1159759759902954, -1.07341468334198, -1.030853271484375, -0.9882919788360596, -0.9457306861877441, -0.9031693339347839, -0.8606079816818237, -0.8180466294288635, -0.7754852771759033, -0.7329239845275879, -0.6903626322746277, -0.6478012800216675, -0.605239987373352, -0.5626786351203918, -0.5201172828674316, -0.47755593061447144, -0.4349946081638336, -0.3924332857131958, -0.3498719334602356, -0.3073105812072754, -0.2647492587566376, -0.22218793630599976, -0.17962646484375, -0.137065127491951, -0.09450379014015198, -0.051942452788352966, -0.009381115436553955, 0.033180221915245056, 0.07574155926704407, 0.11830288171768188, 0.1608642339706421, 0.2034255713224411, 0.2459869086742401, 0.28854823112487793, 0.33110958337783813, 0.37367093563079834, 0.41623225808143616, 0.458793580532074, 0.5013549327850342, 0.5439162850379944, 0.5864776372909546, 0.62903892993927, 0.6716002821922302, 0.7141616344451904, 0.7567229270935059, 0.7992842793464661, 0.8418456315994263, 0.8844069838523865, 0.9269683361053467, 0.9695296287536621, 1.0120909214019775, 1.0546523332595825, 1.097213625907898, 1.139775037765503, 1.1823363304138184]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 1.0, 9.0, 4.0, 9.0, 20.0, 20.0, 28.0, 37.0, 48.0, 53.0, 51.0, 76.0, 74.0, 73.0, 87.0, 67.0, 65.0, 52.0, 40.0, 38.0, 34.0, 28.0, 20.0, 8.0, 12.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.2606399059295654, -1.2212210893630981, -1.1818022727966309, -1.1423835754394531, -1.1029647588729858, -1.0635459423065186, -1.0241272449493408, -0.9847084283828735, -0.9452896118164062, -0.905870795249939, -0.8664520382881165, -0.827033281326294, -0.7876144647598267, -0.7481956481933594, -0.7087768912315369, -0.6693581342697144, -0.6299393177032471, -0.5905205011367798, -0.5511017441749573, -0.5116829872131348, -0.4722641706466675, -0.4328453838825226, -0.3934265971183777, -0.3540078103542328, -0.3145890235900879, -0.275170236825943, -0.2357514500617981, -0.1963326632976532, -0.1569138765335083, -0.1174950897693634, -0.0780763030052185, -0.03865751624107361, 0.0007613897323608398, 0.04018017649650574, 0.07959896326065063, 0.11901775002479553, 0.15843653678894043, 0.19785532355308533, 0.23727411031723022, 0.2766928970813751, 0.31611168384552, 0.3555304706096649, 0.3949492573738098, 0.4343680441379547, 0.4737868309020996, 0.5132056474685669, 0.5526244044303894, 0.5920431613922119, 0.6314619779586792, 0.6708807945251465, 0.710299551486969, 0.7497183084487915, 0.7891371250152588, 0.8285559415817261, 0.8679746985435486, 0.9073934555053711, 0.9468122720718384, 0.9862310886383057, 1.0256497859954834, 1.0650686025619507, 1.104487419128418, 1.1439062356948853, 1.1833250522613525, 1.2227437496185303, 1.2621625661849976]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 9.0, 15.0, 15.0, 16.0, 16.0, 36.0, 46.0, 77.0, 98.0, 156.0, 217.0, 343.0, 527.0, 839.0, 1242.0, 2037.0, 3509.0, 7633.0, 19028.0, 79393.0, 3409459.0, 591113.0, 48762.0, 14605.0, 6300.0, 3376.0, 2002.0, 1198.0, 743.0, 440.0, 298.0, 219.0, 160.0, 93.0, 67.0, 45.0, 31.0, 21.0, 18.0, 12.0, 20.0, 5.0, 11.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.416259765625, -0.4023170471191406, -0.38837432861328125, -0.3744316101074219, -0.3604888916015625, -0.3465461730957031, -0.33260345458984375, -0.3186607360839844, -0.304718017578125, -0.2907752990722656, -0.27683258056640625, -0.2628898620605469, -0.2489471435546875, -0.23500442504882812, -0.22106170654296875, -0.20711898803710938, -0.19317626953125, -0.17923355102539062, -0.16529083251953125, -0.15134811401367188, -0.1374053955078125, -0.12346267700195312, -0.10951995849609375, -0.09557723999023438, -0.081634521484375, -0.06769180297851562, -0.05374908447265625, -0.039806365966796875, -0.0258636474609375, -0.011920928955078125, 0.00202178955078125, 0.015964508056640625, 0.0299072265625, 0.043849945068359375, 0.05779266357421875, 0.07173538208007812, 0.0856781005859375, 0.09962081909179688, 0.11356353759765625, 0.12750625610351562, 0.141448974609375, 0.15539169311523438, 0.16933441162109375, 0.18327713012695312, 0.1972198486328125, 0.21116256713867188, 0.22510528564453125, 0.23904800415039062, 0.25299072265625, 0.2669334411621094, 0.28087615966796875, 0.2948188781738281, 0.3087615966796875, 0.3227043151855469, 0.33664703369140625, 0.3505897521972656, 0.364532470703125, 0.3784751892089844, 0.39241790771484375, 0.4063606262207031, 0.4203033447265625, 0.4342460632324219, 0.44818878173828125, 0.4621315002441406, 0.47607421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 3.0, 8.0, 11.0, 9.0, 16.0, 23.0, 17.0, 51.0, 37.0, 71.0, 86.0, 127.0, 136.0, 101.0, 69.0, 38.0, 42.0, 29.0, 22.0, 22.0, 16.0, 19.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04510498046875, -0.04370594024658203, -0.04230690002441406, -0.040907859802246094, -0.039508819580078125, -0.038109779357910156, -0.03671073913574219, -0.03531169891357422, -0.03391265869140625, -0.03251361846923828, -0.031114578247070312, -0.029715538024902344, -0.028316497802734375, -0.026917457580566406, -0.025518417358398438, -0.02411937713623047, -0.0227203369140625, -0.02132129669189453, -0.019922256469726562, -0.018523216247558594, -0.017124176025390625, -0.015725135803222656, -0.014326095581054688, -0.012927055358886719, -0.01152801513671875, -0.010128974914550781, -0.008729934692382812, -0.007330894470214844, -0.005931854248046875, -0.004532814025878906, -0.0031337738037109375, -0.0017347335815429688, -0.000335693359375, 0.0010633468627929688, 0.0024623870849609375, 0.0038614273071289062, 0.005260467529296875, 0.006659507751464844, 0.008058547973632812, 0.009457588195800781, 0.01085662841796875, 0.012255668640136719, 0.013654708862304688, 0.015053749084472656, 0.016452789306640625, 0.017851829528808594, 0.019250869750976562, 0.02064990997314453, 0.0220489501953125, 0.02344799041748047, 0.024847030639648438, 0.026246070861816406, 0.027645111083984375, 0.029044151306152344, 0.030443191528320312, 0.03184223175048828, 0.03324127197265625, 0.03464031219482422, 0.03603935241699219, 0.037438392639160156, 0.038837432861328125, 0.040236473083496094, 0.04163551330566406, 0.04303455352783203, 0.04443359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 15.0, 12.0, 21.0, 26.0, 41.0, 77.0, 157.0, 309.0, 708.0, 1876.0, 5614.0, 20312.0, 131433.0, 3366189.0, 604485.0, 47084.0, 10480.0, 3243.0, 1179.0, 458.0, 209.0, 116.0, 67.0, 38.0, 26.0, 23.0, 11.0, 8.0, 7.0, 7.0, 8.0, 6.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.367919921875, -0.3555564880371094, -0.34319305419921875, -0.3308296203613281, -0.3184661865234375, -0.3061027526855469, -0.29373931884765625, -0.2813758850097656, -0.269012451171875, -0.2566490173339844, -0.24428558349609375, -0.23192214965820312, -0.2195587158203125, -0.20719528198242188, -0.19483184814453125, -0.18246841430664062, -0.17010498046875, -0.15774154663085938, -0.14537811279296875, -0.13301467895507812, -0.1206512451171875, -0.10828781127929688, -0.09592437744140625, -0.08356094360351562, -0.071197509765625, -0.058834075927734375, -0.04647064208984375, -0.034107208251953125, -0.0217437744140625, -0.009380340576171875, 0.00298309326171875, 0.015346527099609375, 0.0277099609375, 0.040073394775390625, 0.05243682861328125, 0.06480026245117188, 0.0771636962890625, 0.08952713012695312, 0.10189056396484375, 0.11425399780273438, 0.126617431640625, 0.13898086547851562, 0.15134429931640625, 0.16370773315429688, 0.1760711669921875, 0.18843460083007812, 0.20079803466796875, 0.21316146850585938, 0.22552490234375, 0.23788833618164062, 0.25025177001953125, 0.2626152038574219, 0.2749786376953125, 0.2873420715332031, 0.29970550537109375, 0.3120689392089844, 0.324432373046875, 0.3367958068847656, 0.34915924072265625, 0.3615226745605469, 0.3738861083984375, 0.3862495422363281, 0.39861297607421875, 0.4109764099121094, 0.42333984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 5.0, 5.0, 6.0, 6.0, 15.0, 19.0, 17.0, 27.0, 47.0, 61.0, 101.0, 163.0, 300.0, 732.0, 1424.0, 502.0, 264.0, 110.0, 79.0, 68.0, 28.0, 18.0, 13.0, 12.0, 7.0, 8.0, 4.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.0666036605834961, -0.06460380554199219, -0.06260395050048828, -0.060604095458984375, -0.05860424041748047, -0.05660438537597656, -0.054604530334472656, -0.05260467529296875, -0.050604820251464844, -0.04860496520996094, -0.04660511016845703, -0.044605255126953125, -0.04260540008544922, -0.04060554504394531, -0.038605690002441406, -0.0366058349609375, -0.034605979919433594, -0.03260612487792969, -0.03060626983642578, -0.028606414794921875, -0.02660655975341797, -0.024606704711914062, -0.022606849670410156, -0.02060699462890625, -0.018607139587402344, -0.016607284545898438, -0.014607429504394531, -0.012607574462890625, -0.010607719421386719, -0.008607864379882812, -0.006608009338378906, -0.004608154296875, -0.0026082992553710938, -0.0006084442138671875, 0.0013914108276367188, 0.003391265869140625, 0.005391120910644531, 0.0073909759521484375, 0.009390830993652344, 0.01139068603515625, 0.013390541076660156, 0.015390396118164062, 0.01739025115966797, 0.019390106201171875, 0.02138996124267578, 0.023389816284179688, 0.025389671325683594, 0.0273895263671875, 0.029389381408691406, 0.03138923645019531, 0.03338909149169922, 0.035388946533203125, 0.03738880157470703, 0.03938865661621094, 0.041388511657714844, 0.04338836669921875, 0.045388221740722656, 0.04738807678222656, 0.04938793182373047, 0.051387786865234375, 0.05338764190673828, 0.05538749694824219, 0.057387351989746094, 0.05938720703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 11.0, 57.0, 175.0, 318.0, 278.0, 112.0, 32.0, 10.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43601012229919434, -0.4150972366333008, -0.3941843807697296, -0.37327152490615845, -0.3523586392402649, -0.33144575357437134, -0.31053289771080017, -0.289620041847229, -0.26870715618133545, -0.2477942854166031, -0.22688141465187073, -0.20596854388713837, -0.185055673122406, -0.16414280235767365, -0.14322993159294128, -0.12231706082820892, -0.10140419006347656, -0.0804913192987442, -0.05957844853401184, -0.03866557776927948, -0.01775270700454712, 0.0031601637601852417, 0.024073034524917603, 0.04498590528964996, 0.06589877605438232, 0.08681164681911469, 0.10772451758384705, 0.1286373883485794, 0.14955025911331177, 0.17046312987804413, 0.1913760006427765, 0.21228887140750885, 0.2332017421722412, 0.25411462783813477, 0.27502748370170593, 0.2959403395652771, 0.31685322523117065, 0.3377661108970642, 0.3586789667606354, 0.37959182262420654, 0.4005047082901001, 0.42141759395599365, 0.4423304498195648, 0.463243305683136, 0.48415619134902954, 0.5050690770149231, 0.5259819030761719, 0.5468947887420654, 0.567807674407959, 0.5887205600738525, 0.6096334457397461, 0.6305462718009949, 0.6514591574668884, 0.672372043132782, 0.6932848691940308, 0.7141977548599243, 0.7351106405258179, 0.7560235261917114, 0.776936411857605, 0.7978492379188538, 0.8187621235847473, 0.8396750092506409, 0.8605878353118896, 0.8815007209777832, 0.9024136066436768]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 9.0, 4.0, 6.0, 8.0, 12.0, 11.0, 17.0, 23.0, 31.0, 29.0, 38.0, 45.0, 49.0, 61.0, 64.0, 70.0, 64.0, 60.0, 61.0, 55.0, 52.0, 39.0, 39.0, 24.0, 27.0, 19.0, 22.0, 21.0, 12.0, 5.0, 3.0, 7.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2592061758041382, -0.251478374004364, -0.24375058710575104, -0.23602278530597687, -0.2282949984073639, -0.22056719660758972, -0.21283939480781555, -0.20511159300804138, -0.1973838061094284, -0.18965600430965424, -0.18192821741104126, -0.1742004156112671, -0.16647261381149292, -0.15874482691287994, -0.15101702511310577, -0.1432892382144928, -0.13556143641471863, -0.12783363461494446, -0.12010584771633148, -0.11237804591655731, -0.10465025156736374, -0.09692245721817017, -0.089194655418396, -0.08146686106920242, -0.07373906672000885, -0.06601127237081528, -0.058283474296331406, -0.050555676221847534, -0.04282788187265396, -0.03510008752346039, -0.027372289448976517, -0.019644491374492645, -0.011916697025299072, -0.00418890081346035, 0.003538895398378372, 0.011266691610217094, 0.018994487822055817, 0.02672228217124939, 0.03445008024573326, 0.04217787832021713, 0.049905672669410706, 0.05763346701860428, 0.06536126136779785, 0.07308906316757202, 0.0808168575167656, 0.08854465186595917, 0.09627245366573334, 0.10400024801492691, 0.11172804236412048, 0.11945583671331406, 0.12718363106250763, 0.1349114328622818, 0.14263921976089478, 0.15036702156066895, 0.15809482336044312, 0.16582262516021729, 0.17355041205883026, 0.18127821385860443, 0.1890060007572174, 0.19673380255699158, 0.20446160435676575, 0.21218939125537872, 0.2199171930551529, 0.22764497995376587, 0.23537278175354004]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 3.0, 7.0, 10.0, 12.0, 14.0, 18.0, 28.0, 31.0, 41.0, 72.0, 108.0, 154.0, 243.0, 376.0, 579.0, 905.0, 1666.0, 3057.0, 6111.0, 13383.0, 33300.0, 101944.0, 397524.0, 345858.0, 88691.0, 29747.0, 12230.0, 5635.0, 2819.0, 1496.0, 881.0, 549.0, 339.0, 223.0, 133.0, 110.0, 81.0, 49.0, 35.0, 19.0, 16.0, 10.0, 7.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.21120834350585938, -0.20391082763671875, -0.19661331176757812, -0.1893157958984375, -0.18201828002929688, -0.17472076416015625, -0.16742324829101562, -0.160125732421875, -0.15282821655273438, -0.14553070068359375, -0.13823318481445312, -0.1309356689453125, -0.12363815307617188, -0.11634063720703125, -0.10904312133789062, -0.10174560546875, -0.09444808959960938, -0.08715057373046875, -0.07985305786132812, -0.0725555419921875, -0.06525802612304688, -0.05796051025390625, -0.050662994384765625, -0.043365478515625, -0.036067962646484375, -0.02877044677734375, -0.021472930908203125, -0.0141754150390625, -0.006877899169921875, 0.00041961669921875, 0.007717132568359375, 0.0150146484375, 0.022312164306640625, 0.02960968017578125, 0.036907196044921875, 0.0442047119140625, 0.051502227783203125, 0.05879974365234375, 0.06609725952148438, 0.073394775390625, 0.08069229125976562, 0.08798980712890625, 0.09528732299804688, 0.1025848388671875, 0.10988235473632812, 0.11717987060546875, 0.12447738647460938, 0.13177490234375, 0.13907241821289062, 0.14636993408203125, 0.15366744995117188, 0.1609649658203125, 0.16826248168945312, 0.17555999755859375, 0.18285751342773438, 0.190155029296875, 0.19745254516601562, 0.20475006103515625, 0.21204757690429688, 0.2193450927734375, 0.22664260864257812, 0.23394012451171875, 0.24123764038085938, 0.24853515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 5.0, 12.0, 10.0, 13.0, 17.0, 20.0, 28.0, 29.0, 42.0, 57.0, 91.0, 95.0, 127.0, 101.0, 71.0, 65.0, 41.0, 44.0, 30.0, 21.0, 17.0, 13.0, 10.0, 11.0, 9.0, 4.0, 0.0, 7.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0361328125, -0.03486919403076172, -0.03360557556152344, -0.032341957092285156, -0.031078338623046875, -0.029814720153808594, -0.028551101684570312, -0.02728748321533203, -0.02602386474609375, -0.02476024627685547, -0.023496627807617188, -0.022233009338378906, -0.020969390869140625, -0.019705772399902344, -0.018442153930664062, -0.01717853546142578, -0.0159149169921875, -0.014651298522949219, -0.013387680053710938, -0.012124061584472656, -0.010860443115234375, -0.009596824645996094, -0.008333206176757812, -0.007069587707519531, -0.00580596923828125, -0.004542350769042969, -0.0032787322998046875, -0.0020151138305664062, -0.000751495361328125, 0.0005121231079101562, 0.0017757415771484375, 0.0030393600463867188, 0.004302978515625, 0.005566596984863281, 0.0068302154541015625, 0.008093833923339844, 0.009357452392578125, 0.010621070861816406, 0.011884689331054688, 0.013148307800292969, 0.01441192626953125, 0.01567554473876953, 0.016939163208007812, 0.018202781677246094, 0.019466400146484375, 0.020730018615722656, 0.021993637084960938, 0.02325725555419922, 0.0245208740234375, 0.02578449249267578, 0.027048110961914062, 0.028311729431152344, 0.029575347900390625, 0.030838966369628906, 0.03210258483886719, 0.03336620330810547, 0.03462982177734375, 0.03589344024658203, 0.03715705871582031, 0.038420677185058594, 0.039684295654296875, 0.040947914123535156, 0.04221153259277344, 0.04347515106201172, 0.04473876953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 7.0, 7.0, 11.0, 8.0, 18.0, 22.0, 35.0, 42.0, 52.0, 86.0, 109.0, 178.0, 296.0, 406.0, 732.0, 1465.0, 3851.0, 13555.0, 60782.0, 313426.0, 502657.0, 116425.0, 23787.0, 6025.0, 2141.0, 917.0, 537.0, 345.0, 190.0, 127.0, 88.0, 60.0, 39.0, 32.0, 25.0, 20.0, 10.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.276123046875, -0.26727294921875, -0.2584228515625, -0.24957275390625, -0.24072265625, -0.23187255859375, -0.2230224609375, -0.21417236328125, -0.205322265625, -0.19647216796875, -0.1876220703125, -0.17877197265625, -0.169921875, -0.16107177734375, -0.1522216796875, -0.14337158203125, -0.134521484375, -0.12567138671875, -0.1168212890625, -0.10797119140625, -0.09912109375, -0.09027099609375, -0.0814208984375, -0.07257080078125, -0.063720703125, -0.05487060546875, -0.0460205078125, -0.03717041015625, -0.0283203125, -0.01947021484375, -0.0106201171875, -0.00177001953125, 0.007080078125, 0.01593017578125, 0.0247802734375, 0.03363037109375, 0.04248046875, 0.05133056640625, 0.0601806640625, 0.06903076171875, 0.077880859375, 0.08673095703125, 0.0955810546875, 0.10443115234375, 0.11328125, 0.12213134765625, 0.1309814453125, 0.13983154296875, 0.148681640625, 0.15753173828125, 0.1663818359375, 0.17523193359375, 0.18408203125, 0.19293212890625, 0.2017822265625, 0.21063232421875, 0.219482421875, 0.22833251953125, 0.2371826171875, 0.24603271484375, 0.2548828125, 0.26373291015625, 0.2725830078125, 0.28143310546875, 0.290283203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 4.0, 6.0, 9.0, 8.0, 10.0, 8.0, 18.0, 15.0, 14.0, 22.0, 28.0, 24.0, 23.0, 31.0, 34.0, 34.0, 49.0, 32.0, 33.0, 37.0, 41.0, 46.0, 47.0, 54.0, 46.0, 48.0, 48.0, 41.0, 28.0, 22.0, 19.0, 17.0, 25.0, 11.0, 11.0, 16.0, 7.0, 13.0, 9.0, 4.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.149169921875, -0.14434814453125, -0.1395263671875, -0.13470458984375, -0.1298828125, -0.12506103515625, -0.1202392578125, -0.11541748046875, -0.110595703125, -0.10577392578125, -0.1009521484375, -0.09613037109375, -0.09130859375, -0.08648681640625, -0.0816650390625, -0.07684326171875, -0.072021484375, -0.06719970703125, -0.0623779296875, -0.05755615234375, -0.052734375, -0.04791259765625, -0.0430908203125, -0.03826904296875, -0.033447265625, -0.02862548828125, -0.0238037109375, -0.01898193359375, -0.01416015625, -0.00933837890625, -0.0045166015625, 0.00030517578125, 0.005126953125, 0.00994873046875, 0.0147705078125, 0.01959228515625, 0.0244140625, 0.02923583984375, 0.0340576171875, 0.03887939453125, 0.043701171875, 0.04852294921875, 0.0533447265625, 0.05816650390625, 0.06298828125, 0.06781005859375, 0.0726318359375, 0.07745361328125, 0.082275390625, 0.08709716796875, 0.0919189453125, 0.09674072265625, 0.1015625, 0.10638427734375, 0.1112060546875, 0.11602783203125, 0.120849609375, 0.12567138671875, 0.1304931640625, 0.13531494140625, 0.14013671875, 0.14495849609375, 0.1497802734375, 0.15460205078125, 0.159423828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 10.0, 10.0, 20.0, 20.0, 30.0, 45.0, 79.0, 148.0, 212.0, 406.0, 787.0, 1517.0, 3633.0, 8838.0, 25182.0, 85201.0, 305035.0, 415140.0, 140361.0, 39441.0, 13031.0, 4951.0, 2238.0, 969.0, 506.0, 279.0, 170.0, 92.0, 56.0, 41.0, 29.0, 25.0, 12.0, 10.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1419677734375, -0.1378154754638672, -0.13366317749023438, -0.12951087951660156, -0.12535858154296875, -0.12120628356933594, -0.11705398559570312, -0.11290168762207031, -0.1087493896484375, -0.10459709167480469, -0.10044479370117188, -0.09629249572753906, -0.09214019775390625, -0.08798789978027344, -0.08383560180664062, -0.07968330383300781, -0.075531005859375, -0.07137870788574219, -0.06722640991210938, -0.06307411193847656, -0.05892181396484375, -0.05476951599121094, -0.050617218017578125, -0.04646492004394531, -0.0423126220703125, -0.03816032409667969, -0.034008026123046875, -0.029855728149414062, -0.02570343017578125, -0.021551132202148438, -0.017398834228515625, -0.013246536254882812, -0.00909423828125, -0.0049419403076171875, -0.000789642333984375, 0.0033626556396484375, 0.00751495361328125, 0.011667251586914062, 0.015819549560546875, 0.019971847534179688, 0.0241241455078125, 0.028276443481445312, 0.032428741455078125, 0.03658103942871094, 0.04073333740234375, 0.04488563537597656, 0.049037933349609375, 0.05319023132324219, 0.057342529296875, 0.06149482727050781, 0.06564712524414062, 0.06979942321777344, 0.07395172119140625, 0.07810401916503906, 0.08225631713867188, 0.08640861511230469, 0.0905609130859375, 0.09471321105957031, 0.09886550903320312, 0.10301780700683594, 0.10717010498046875, 0.11132240295410156, 0.11547470092773438, 0.11962699890136719, 0.123779296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 3.0, 4.0, 11.0, 33.0, 31.0, 42.0, 50.0, 49.0, 73.0, 106.0, 88.0, 85.0, 70.0, 73.0, 65.0, 66.0, 37.0, 28.0, 23.0, 16.0, 11.0, 8.0, 11.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00012218952178955078, -0.00011922325938940048, -0.00011625699698925018, -0.00011329073458909988, -0.00011032447218894958, -0.00010735820978879929, -0.00010439194738864899, -0.00010142568498849869, -9.845942258834839e-05, -9.549316018819809e-05, -9.252689778804779e-05, -8.956063538789749e-05, -8.659437298774719e-05, -8.36281105875969e-05, -8.06618481874466e-05, -7.76955857872963e-05, -7.4729323387146e-05, -7.17630609869957e-05, -6.87967985868454e-05, -6.58305361866951e-05, -6.28642737865448e-05, -5.98980113863945e-05, -5.69317489862442e-05, -5.39654865860939e-05, -5.0999224185943604e-05, -4.8032961785793304e-05, -4.5066699385643005e-05, -4.2100436985492706e-05, -3.913417458534241e-05, -3.616791218519211e-05, -3.320164978504181e-05, -3.023538738489151e-05, -2.726912498474121e-05, -2.4302862584590912e-05, -2.1336600184440613e-05, -1.8370337784290314e-05, -1.5404075384140015e-05, -1.2437812983989716e-05, -9.471550583839417e-06, -6.5052881836891174e-06, -3.5390257835388184e-06, -5.727633833885193e-07, 2.3934990167617798e-06, 5.359761416912079e-06, 8.326023817062378e-06, 1.1292286217212677e-05, 1.4258548617362976e-05, 1.7224811017513275e-05, 2.0191073417663574e-05, 2.3157335817813873e-05, 2.6123598217964172e-05, 2.908986061811447e-05, 3.205612301826477e-05, 3.502238541841507e-05, 3.798864781856537e-05, 4.095491021871567e-05, 4.392117261886597e-05, 4.6887435019016266e-05, 4.9853697419166565e-05, 5.2819959819316864e-05, 5.578622221946716e-05, 5.875248461961746e-05, 6.171874701976776e-05, 6.468500941991806e-05, 6.765127182006836e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 15.0, 10.0, 33.0, 56.0, 67.0, 120.0, 266.0, 432.0, 1054.0, 2957.0, 11421.0, 71307.0, 608955.0, 309265.0, 32699.0, 6485.0, 1897.0, 740.0, 332.0, 181.0, 90.0, 53.0, 40.0, 18.0, 18.0, 11.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2352294921875, -0.2280597686767578, -0.22089004516601562, -0.21372032165527344, -0.20655059814453125, -0.19938087463378906, -0.19221115112304688, -0.1850414276123047, -0.1778717041015625, -0.1707019805908203, -0.16353225708007812, -0.15636253356933594, -0.14919281005859375, -0.14202308654785156, -0.13485336303710938, -0.1276836395263672, -0.120513916015625, -0.11334419250488281, -0.10617446899414062, -0.09900474548339844, -0.09183502197265625, -0.08466529846191406, -0.07749557495117188, -0.07032585144042969, -0.0631561279296875, -0.05598640441894531, -0.048816680908203125, -0.04164695739746094, -0.03447723388671875, -0.027307510375976562, -0.020137786865234375, -0.012968063354492188, -0.00579833984375, 0.0013713836669921875, 0.008541107177734375, 0.015710830688476562, 0.02288055419921875, 0.030050277709960938, 0.037220001220703125, 0.04438972473144531, 0.0515594482421875, 0.05872917175292969, 0.06589889526367188, 0.07306861877441406, 0.08023834228515625, 0.08740806579589844, 0.09457778930664062, 0.10174751281738281, 0.108917236328125, 0.11608695983886719, 0.12325668334960938, 0.13042640686035156, 0.13759613037109375, 0.14476585388183594, 0.15193557739257812, 0.1591053009033203, 0.1662750244140625, 0.1734447479248047, 0.18061447143554688, 0.18778419494628906, 0.19495391845703125, 0.20212364196777344, 0.20929336547851562, 0.2164630889892578, 0.2236328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 15.0, 9.0, 15.0, 25.0, 34.0, 41.0, 53.0, 61.0, 85.0, 99.0, 113.0, 89.0, 93.0, 63.0, 39.0, 39.0, 26.0, 15.0, 14.0, 14.0, 11.0, 9.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.1273193359375, -0.12417125701904297, -0.12102317810058594, -0.1178750991821289, -0.11472702026367188, -0.11157894134521484, -0.10843086242675781, -0.10528278350830078, -0.10213470458984375, -0.09898662567138672, -0.09583854675292969, -0.09269046783447266, -0.08954238891601562, -0.0863943099975586, -0.08324623107910156, -0.08009815216064453, -0.0769500732421875, -0.07380199432373047, -0.07065391540527344, -0.0675058364868164, -0.06435775756835938, -0.061209678649902344, -0.05806159973144531, -0.05491352081298828, -0.05176544189453125, -0.04861736297607422, -0.04546928405761719, -0.042321205139160156, -0.039173126220703125, -0.036025047302246094, -0.03287696838378906, -0.02972888946533203, -0.026580810546875, -0.02343273162841797, -0.020284652709960938, -0.017136573791503906, -0.013988494873046875, -0.010840415954589844, -0.0076923370361328125, -0.004544258117675781, -0.00139617919921875, 0.0017518997192382812, 0.0048999786376953125, 0.008048057556152344, 0.011196136474609375, 0.014344215393066406, 0.017492294311523438, 0.02064037322998047, 0.0237884521484375, 0.02693653106689453, 0.030084609985351562, 0.033232688903808594, 0.036380767822265625, 0.039528846740722656, 0.04267692565917969, 0.04582500457763672, 0.04897308349609375, 0.05212116241455078, 0.05526924133300781, 0.058417320251464844, 0.061565399169921875, 0.0647134780883789, 0.06786155700683594, 0.07100963592529297, 0.07415771484375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 10.0, 18.0, 32.0, 57.0, 146.0, 224.0, 230.0, 141.0, 71.0, 38.0, 12.0, 14.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.209059953689575, -3.1378350257873535, -3.066610097885132, -2.99538516998291, -2.9241602420806885, -2.852935314178467, -2.781710386276245, -2.7104854583740234, -2.6392602920532227, -2.568035364151001, -2.4968104362487793, -2.4255855083465576, -2.354360580444336, -2.2831356525421143, -2.2119107246398926, -2.140685558319092, -2.069460868835449, -1.9982359409332275, -1.9270110130310059, -1.8557860851287842, -1.7845611572265625, -1.7133362293243408, -1.6421111822128296, -1.570886254310608, -1.4996613264083862, -1.4284363985061646, -1.3572114706039429, -1.2859865427017212, -1.21476149559021, -1.1435365676879883, -1.0723116397857666, -1.001086711883545, -0.9298619031906128, -0.8586369752883911, -0.7874120473861694, -0.716187059879303, -0.6449621319770813, -0.5737372040748596, -0.5025122165679932, -0.4312872886657715, -0.3600623607635498, -0.2888374328613281, -0.21761247515678406, -0.14638753235340118, -0.07516258955001831, -0.003937661647796631, 0.06728729605674744, 0.1385122537612915, 0.20973718166351318, 0.28096210956573486, 0.35218706727027893, 0.423412024974823, 0.4946369528770447, 0.5658618807792664, 0.6370868682861328, 0.7083117961883545, 0.7795367240905762, 0.8507616519927979, 0.9219865798950195, 0.993211567401886, 1.064436435699463, 1.1356613636016846, 1.2068864107131958, 1.2781113386154175, 1.3493362665176392]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 11.0, 7.0, 18.0, 13.0, 20.0, 28.0, 31.0, 38.0, 31.0, 44.0, 50.0, 57.0, 61.0, 65.0, 72.0, 78.0, 58.0, 48.0, 43.0, 44.0, 35.0, 32.0, 32.0, 23.0, 17.0, 11.0, 10.0, 3.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.0063319206237793, -1.957811713218689, -1.9092915058135986, -1.8607712984085083, -1.812251091003418, -1.763730764389038, -1.7152105569839478, -1.6666903495788574, -1.618170142173767, -1.5696499347686768, -1.5211297273635864, -1.472609519958496, -1.4240891933441162, -1.3755689859390259, -1.3270487785339355, -1.2785285711288452, -1.2300083637237549, -1.1814881563186646, -1.1329679489135742, -1.0844477415084839, -1.0359275341033936, -0.9874072670936584, -0.9388870000839233, -0.890366792678833, -0.8418465852737427, -0.7933263778686523, -0.744806170463562, -0.6962859034538269, -0.6477656960487366, -0.5992454886436462, -0.5507252216339111, -0.5022050142288208, -0.4536846876144409, -0.4051644802093506, -0.35664424300193787, -0.30812400579452515, -0.2596037983894348, -0.2110835760831833, -0.16256335377693176, -0.11404311656951904, -0.06552290916442871, -0.017002686858177185, 0.03151753544807434, 0.08003775775432587, 0.1285579800605774, 0.17707820236682892, 0.22559842467308044, 0.27411866188049316, 0.3226388692855835, 0.37115907669067383, 0.41967931389808655, 0.46819955110549927, 0.5167197585105896, 0.5652399659156799, 0.613760232925415, 0.6622804403305054, 0.7108006477355957, 0.759320855140686, 0.8078410625457764, 0.8563613295555115, 0.9048815369606018, 0.9534017443656921, 1.0019220113754272, 1.0504422187805176, 1.098962426185608]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 10.0, 14.0, 23.0, 35.0, 66.0, 80.0, 195.0, 331.0, 724.0, 1892.0, 6817.0, 53784.0, 3943837.0, 169734.0, 12035.0, 2717.0, 957.0, 459.0, 214.0, 123.0, 74.0, 41.0, 34.0, 17.0, 10.0, 8.0, 15.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77685546875, -0.75067138671875, -0.7244873046875, -0.69830322265625, -0.672119140625, -0.64593505859375, -0.6197509765625, -0.59356689453125, -0.5673828125, -0.54119873046875, -0.5150146484375, -0.48883056640625, -0.462646484375, -0.43646240234375, -0.4102783203125, -0.38409423828125, -0.35791015625, -0.33172607421875, -0.3055419921875, -0.27935791015625, -0.253173828125, -0.22698974609375, -0.2008056640625, -0.17462158203125, -0.1484375, -0.12225341796875, -0.0960693359375, -0.06988525390625, -0.043701171875, -0.01751708984375, 0.0086669921875, 0.03485107421875, 0.06103515625, 0.08721923828125, 0.1134033203125, 0.13958740234375, 0.165771484375, 0.19195556640625, 0.2181396484375, 0.24432373046875, 0.2705078125, 0.29669189453125, 0.3228759765625, 0.34906005859375, 0.375244140625, 0.40142822265625, 0.4276123046875, 0.45379638671875, 0.47998046875, 0.50616455078125, 0.5323486328125, 0.55853271484375, 0.584716796875, 0.61090087890625, 0.6370849609375, 0.66326904296875, 0.689453125, 0.71563720703125, 0.7418212890625, 0.76800537109375, 0.794189453125, 0.82037353515625, 0.8465576171875, 0.87274169921875, 0.89892578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 4.0, 4.0, 10.0, 8.0, 11.0, 26.0, 20.0, 21.0, 33.0, 43.0, 41.0, 54.0, 64.0, 71.0, 84.0, 79.0, 70.0, 79.0, 53.0, 43.0, 38.0, 27.0, 28.0, 12.0, 21.0, 9.0, 6.0, 6.0, 5.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04052734375, -0.03921318054199219, -0.037899017333984375, -0.03658485412597656, -0.03527069091796875, -0.03395652770996094, -0.032642364501953125, -0.03132820129394531, -0.0300140380859375, -0.028699874877929688, -0.027385711669921875, -0.026071548461914062, -0.02475738525390625, -0.023443222045898438, -0.022129058837890625, -0.020814895629882812, -0.019500732421875, -0.018186569213867188, -0.016872406005859375, -0.015558242797851562, -0.01424407958984375, -0.012929916381835938, -0.011615753173828125, -0.010301589965820312, -0.0089874267578125, -0.0076732635498046875, -0.006359100341796875, -0.0050449371337890625, -0.00373077392578125, -0.0024166107177734375, -0.001102447509765625, 0.0002117156982421875, 0.00152587890625, 0.0028400421142578125, 0.004154205322265625, 0.0054683685302734375, 0.00678253173828125, 0.008096694946289062, 0.009410858154296875, 0.010725021362304688, 0.0120391845703125, 0.013353347778320312, 0.014667510986328125, 0.015981674194335938, 0.01729583740234375, 0.018610000610351562, 0.019924163818359375, 0.021238327026367188, 0.022552490234375, 0.023866653442382812, 0.025180816650390625, 0.026494979858398438, 0.02780914306640625, 0.029123306274414062, 0.030437469482421875, 0.03175163269042969, 0.0330657958984375, 0.03437995910644531, 0.035694122314453125, 0.03700828552246094, 0.03832244873046875, 0.03963661193847656, 0.040950775146484375, 0.04226493835449219, 0.0435791015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 12.0, 15.0, 29.0, 54.0, 112.0, 222.0, 510.0, 1617.0, 5566.0, 26021.0, 216274.0, 3611162.0, 292262.0, 30764.0, 6482.0, 1920.0, 659.0, 275.0, 134.0, 74.0, 45.0, 26.0, 19.0, 16.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344970703125, -0.3314704895019531, -0.31797027587890625, -0.3044700622558594, -0.2909698486328125, -0.2774696350097656, -0.26396942138671875, -0.2504692077636719, -0.236968994140625, -0.22346878051757812, -0.20996856689453125, -0.19646835327148438, -0.1829681396484375, -0.16946792602539062, -0.15596771240234375, -0.14246749877929688, -0.12896728515625, -0.11546707153320312, -0.10196685791015625, -0.08846664428710938, -0.0749664306640625, -0.061466217041015625, -0.04796600341796875, -0.034465789794921875, -0.020965576171875, -0.007465362548828125, 0.00603485107421875, 0.019535064697265625, 0.0330352783203125, 0.046535491943359375, 0.06003570556640625, 0.07353591918945312, 0.0870361328125, 0.10053634643554688, 0.11403656005859375, 0.12753677368164062, 0.1410369873046875, 0.15453720092773438, 0.16803741455078125, 0.18153762817382812, 0.195037841796875, 0.20853805541992188, 0.22203826904296875, 0.23553848266601562, 0.2490386962890625, 0.2625389099121094, 0.27603912353515625, 0.2895393371582031, 0.30303955078125, 0.3165397644042969, 0.33003997802734375, 0.3435401916503906, 0.3570404052734375, 0.3705406188964844, 0.38404083251953125, 0.3975410461425781, 0.411041259765625, 0.4245414733886719, 0.43804168701171875, 0.4515419006347656, 0.4650421142578125, 0.4785423278808594, 0.49204254150390625, 0.5055427551269531, 0.51904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 13.0, 17.0, 20.0, 27.0, 45.0, 89.0, 147.0, 224.0, 576.0, 1771.0, 570.0, 238.0, 130.0, 80.0, 39.0, 27.0, 23.0, 20.0, 9.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06072998046875, -0.05761241912841797, -0.05449485778808594, -0.051377296447753906, -0.048259735107421875, -0.045142173767089844, -0.04202461242675781, -0.03890705108642578, -0.03578948974609375, -0.03267192840576172, -0.029554367065429688, -0.026436805725097656, -0.023319244384765625, -0.020201683044433594, -0.017084121704101562, -0.013966560363769531, -0.0108489990234375, -0.007731437683105469, -0.0046138763427734375, -0.0014963150024414062, 0.001621246337890625, 0.004738807678222656, 0.007856369018554688, 0.010973930358886719, 0.01409149169921875, 0.01720905303955078, 0.020326614379882812, 0.023444175720214844, 0.026561737060546875, 0.029679298400878906, 0.03279685974121094, 0.03591442108154297, 0.039031982421875, 0.04214954376220703, 0.04526710510253906, 0.048384666442871094, 0.051502227783203125, 0.054619789123535156, 0.05773735046386719, 0.06085491180419922, 0.06397247314453125, 0.06709003448486328, 0.07020759582519531, 0.07332515716552734, 0.07644271850585938, 0.0795602798461914, 0.08267784118652344, 0.08579540252685547, 0.0889129638671875, 0.09203052520751953, 0.09514808654785156, 0.0982656478881836, 0.10138320922851562, 0.10450077056884766, 0.10761833190917969, 0.11073589324951172, 0.11385345458984375, 0.11697101593017578, 0.12008857727050781, 0.12320613861083984, 0.12632369995117188, 0.1294412612915039, 0.13255882263183594, 0.13567638397216797, 0.1387939453125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 18.0, 33.0, 82.0, 183.0, 302.0, 233.0, 92.0, 43.0, 12.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2170950323343277, -0.19176141917705536, -0.16642779111862183, -0.1410941779613495, -0.11576056480407715, -0.09042695164680481, -0.06509332358837128, -0.03975971043109894, -0.014426097273826599, 0.010907519608736038, 0.036241136491298676, 0.06157475709915161, 0.08690837025642395, 0.11224198341369629, 0.13757561147212982, 0.16290922462940216, 0.1882428377866745, 0.21357645094394684, 0.23891007900238037, 0.2642436921596527, 0.28957730531692505, 0.3149109184741974, 0.3402445316314697, 0.36557817459106445, 0.3909117579460144, 0.41624537110328674, 0.4415789842605591, 0.4669126272201538, 0.49224621057510376, 0.5175798535346985, 0.5429134368896484, 0.5682470798492432, 0.5935807228088379, 0.6189143657684326, 0.6442479491233826, 0.6695815920829773, 0.6949151754379272, 0.720248818397522, 0.7455824613571167, 0.7709160447120667, 0.7962496280670166, 0.8215832710266113, 0.8469168543815613, 0.872250497341156, 0.897584080696106, 0.9229177236557007, 0.9482513666152954, 0.9735849499702454, 0.9989185929298401, 1.02425217628479, 1.0495858192443848, 1.0749194622039795, 1.1002531051635742, 1.1255866289138794, 1.1509202718734741, 1.1762539148330688, 1.2015875577926636, 1.2269212007522583, 1.252254843711853, 1.2775883674621582, 1.302922010421753, 1.3282556533813477, 1.3535892963409424, 1.378922939300537, 1.4042564630508423]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 7.0, 14.0, 11.0, 9.0, 15.0, 16.0, 13.0, 14.0, 24.0, 40.0, 31.0, 24.0, 40.0, 44.0, 52.0, 38.0, 45.0, 48.0, 36.0, 46.0, 62.0, 37.0, 45.0, 43.0, 32.0, 33.0, 31.0, 20.0, 16.0, 17.0, 16.0, 6.0, 10.0, 12.0, 10.0, 8.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2006056308746338, -0.1934179812669754, -0.1862303465604782, -0.17904269695281982, -0.17185504734516144, -0.16466739773750305, -0.15747976303100586, -0.15029211342334747, -0.1431044638156891, -0.1359168142080307, -0.1287291795015335, -0.12154152989387512, -0.11435388028621674, -0.10716623812913895, -0.09997859597206116, -0.09279094636440277, -0.08560331165790558, -0.07841566950082779, -0.0712280198931694, -0.06404037773609161, -0.056852731853723526, -0.04966508597135544, -0.04247744381427765, -0.03528979793190956, -0.028102152049541473, -0.020914506167173386, -0.013726862147450447, -0.0065392181277275085, 0.0006484277546405792, 0.007836073637008667, 0.015023715794086456, 0.022211361676454544, 0.029399007558822632, 0.03658665344119072, 0.04377429932355881, 0.0509619414806366, 0.058149587363004684, 0.06533723324537277, 0.07252487540245056, 0.07971252501010895, 0.08690016716718674, 0.09408780932426453, 0.10127545893192291, 0.1084631010890007, 0.11565074324607849, 0.12283839285373688, 0.13002604246139526, 0.13721367716789246, 0.14440132677555084, 0.15158897638320923, 0.15877661108970642, 0.1659642606973648, 0.1731519103050232, 0.18033954501152039, 0.18752719461917877, 0.19471484422683716, 0.20190247893333435, 0.20909012854099274, 0.21627776324748993, 0.22346541285514832, 0.2306530624628067, 0.2378407120704651, 0.24502834677696228, 0.2522159814834595, 0.25940364599227905]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 9.0, 15.0, 28.0, 25.0, 34.0, 66.0, 109.0, 160.0, 269.0, 456.0, 849.0, 1660.0, 3403.0, 8192.0, 24305.0, 88347.0, 347761.0, 413087.0, 111932.0, 30023.0, 9744.0, 3993.0, 1823.0, 963.0, 508.0, 269.0, 185.0, 106.0, 73.0, 44.0, 38.0, 16.0, 11.0, 11.0, 8.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2406005859375, -0.2323284149169922, -0.22405624389648438, -0.21578407287597656, -0.20751190185546875, -0.19923973083496094, -0.19096755981445312, -0.1826953887939453, -0.1744232177734375, -0.1661510467529297, -0.15787887573242188, -0.14960670471191406, -0.14133453369140625, -0.13306236267089844, -0.12479019165039062, -0.11651802062988281, -0.108245849609375, -0.09997367858886719, -0.09170150756835938, -0.08342933654785156, -0.07515716552734375, -0.06688499450683594, -0.058612823486328125, -0.05034065246582031, -0.0420684814453125, -0.03379631042480469, -0.025524139404296875, -0.017251968383789062, -0.00897979736328125, -0.0007076263427734375, 0.007564544677734375, 0.015836715698242188, 0.02410888671875, 0.03238105773925781, 0.040653228759765625, 0.04892539978027344, 0.05719757080078125, 0.06546974182128906, 0.07374191284179688, 0.08201408386230469, 0.0902862548828125, 0.09855842590332031, 0.10683059692382812, 0.11510276794433594, 0.12337493896484375, 0.13164710998535156, 0.13991928100585938, 0.1481914520263672, 0.156463623046875, 0.1647357940673828, 0.17300796508789062, 0.18128013610839844, 0.18955230712890625, 0.19782447814941406, 0.20609664916992188, 0.2143688201904297, 0.2226409912109375, 0.2309131622314453, 0.23918533325195312, 0.24745750427246094, 0.25572967529296875, 0.26400184631347656, 0.2722740173339844, 0.2805461883544922, 0.288818359375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 11.0, 9.0, 20.0, 30.0, 25.0, 36.0, 39.0, 44.0, 61.0, 71.0, 86.0, 82.0, 71.0, 81.0, 68.0, 50.0, 41.0, 34.0, 33.0, 13.0, 17.0, 16.0, 12.0, 4.0, 8.0, 10.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0382080078125, -0.03683042526245117, -0.035452842712402344, -0.034075260162353516, -0.03269767761230469, -0.03132009506225586, -0.02994251251220703, -0.028564929962158203, -0.027187347412109375, -0.025809764862060547, -0.02443218231201172, -0.02305459976196289, -0.021677017211914062, -0.020299434661865234, -0.018921852111816406, -0.017544269561767578, -0.01616668701171875, -0.014789104461669922, -0.013411521911621094, -0.012033939361572266, -0.010656356811523438, -0.00927877426147461, -0.007901191711425781, -0.006523609161376953, -0.005146026611328125, -0.003768444061279297, -0.0023908615112304688, -0.0010132789611816406, 0.0003643035888671875, 0.0017418861389160156, 0.0031194686889648438, 0.004497051239013672, 0.0058746337890625, 0.007252216339111328, 0.008629798889160156, 0.010007381439208984, 0.011384963989257812, 0.01276254653930664, 0.014140129089355469, 0.015517711639404297, 0.016895294189453125, 0.018272876739501953, 0.01965045928955078, 0.02102804183959961, 0.022405624389648438, 0.023783206939697266, 0.025160789489746094, 0.026538372039794922, 0.02791595458984375, 0.029293537139892578, 0.030671119689941406, 0.032048702239990234, 0.03342628479003906, 0.03480386734008789, 0.03618144989013672, 0.03755903244018555, 0.038936614990234375, 0.0403141975402832, 0.04169178009033203, 0.04306936264038086, 0.04444694519042969, 0.045824527740478516, 0.047202110290527344, 0.04857969284057617, 0.049957275390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 15.0, 13.0, 19.0, 20.0, 39.0, 54.0, 88.0, 103.0, 138.0, 224.0, 350.0, 637.0, 1127.0, 2496.0, 6776.0, 21462.0, 79860.0, 304304.0, 440910.0, 136737.0, 35495.0, 10425.0, 3650.0, 1527.0, 770.0, 417.0, 282.0, 172.0, 122.0, 88.0, 56.0, 44.0, 23.0, 16.0, 19.0, 16.0, 8.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.278076171875, -0.2696990966796875, -0.261322021484375, -0.2529449462890625, -0.24456787109375, -0.2361907958984375, -0.227813720703125, -0.2194366455078125, -0.2110595703125, -0.2026824951171875, -0.194305419921875, -0.1859283447265625, -0.17755126953125, -0.1691741943359375, -0.160797119140625, -0.1524200439453125, -0.14404296875, -0.1356658935546875, -0.127288818359375, -0.1189117431640625, -0.11053466796875, -0.1021575927734375, -0.093780517578125, -0.0854034423828125, -0.0770263671875, -0.0686492919921875, -0.060272216796875, -0.0518951416015625, -0.04351806640625, -0.0351409912109375, -0.026763916015625, -0.0183868408203125, -0.010009765625, -0.0016326904296875, 0.006744384765625, 0.0151214599609375, 0.02349853515625, 0.0318756103515625, 0.040252685546875, 0.0486297607421875, 0.0570068359375, 0.0653839111328125, 0.073760986328125, 0.0821380615234375, 0.09051513671875, 0.0988922119140625, 0.107269287109375, 0.1156463623046875, 0.1240234375, 0.1324005126953125, 0.140777587890625, 0.1491546630859375, 0.15753173828125, 0.1659088134765625, 0.174285888671875, 0.1826629638671875, 0.1910400390625, 0.1994171142578125, 0.207794189453125, 0.2161712646484375, 0.22454833984375, 0.2329254150390625, 0.241302490234375, 0.2496795654296875, 0.258056640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 8.0, 12.0, 8.0, 14.0, 16.0, 18.0, 23.0, 23.0, 33.0, 20.0, 39.0, 30.0, 32.0, 35.0, 56.0, 51.0, 35.0, 39.0, 57.0, 47.0, 30.0, 41.0, 49.0, 34.0, 28.0, 30.0, 21.0, 16.0, 18.0, 23.0, 20.0, 11.0, 13.0, 14.0, 8.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20263671875, -0.19637489318847656, -0.19011306762695312, -0.1838512420654297, -0.17758941650390625, -0.1713275909423828, -0.16506576538085938, -0.15880393981933594, -0.1525421142578125, -0.14628028869628906, -0.14001846313476562, -0.1337566375732422, -0.12749481201171875, -0.12123298645019531, -0.11497116088867188, -0.10870933532714844, -0.102447509765625, -0.09618568420410156, -0.08992385864257812, -0.08366203308105469, -0.07740020751953125, -0.07113838195800781, -0.06487655639648438, -0.05861473083496094, -0.0523529052734375, -0.04609107971191406, -0.039829254150390625, -0.03356742858886719, -0.02730560302734375, -0.021043777465820312, -0.014781951904296875, -0.008520126342773438, -0.00225830078125, 0.0040035247802734375, 0.010265350341796875, 0.016527175903320312, 0.02278900146484375, 0.029050827026367188, 0.035312652587890625, 0.04157447814941406, 0.0478363037109375, 0.05409812927246094, 0.060359954833984375, 0.06662178039550781, 0.07288360595703125, 0.07914543151855469, 0.08540725708007812, 0.09166908264160156, 0.097930908203125, 0.10419273376464844, 0.11045455932617188, 0.11671638488769531, 0.12297821044921875, 0.1292400360107422, 0.13550186157226562, 0.14176368713378906, 0.1480255126953125, 0.15428733825683594, 0.16054916381835938, 0.1668109893798828, 0.17307281494140625, 0.1793346405029297, 0.18559646606445312, 0.19185829162597656, 0.1981201171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 10.0, 18.0, 45.0, 62.0, 115.0, 210.0, 440.0, 1042.0, 2387.0, 6565.0, 19922.0, 67071.0, 259503.0, 478583.0, 151099.0, 41298.0, 12717.0, 4306.0, 1679.0, 711.0, 332.0, 193.0, 105.0, 52.0, 30.0, 22.0, 13.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10748291015625, -0.10306072235107422, -0.09863853454589844, -0.09421634674072266, -0.08979415893554688, -0.0853719711303711, -0.08094978332519531, -0.07652759552001953, -0.07210540771484375, -0.06768321990966797, -0.06326103210449219, -0.058838844299316406, -0.054416656494140625, -0.049994468688964844, -0.04557228088378906, -0.04115009307861328, -0.0367279052734375, -0.03230571746826172, -0.027883529663085938, -0.023461341857910156, -0.019039154052734375, -0.014616966247558594, -0.010194778442382812, -0.005772590637207031, -0.00135040283203125, 0.0030717849731445312, 0.0074939727783203125, 0.011916160583496094, 0.016338348388671875, 0.020760536193847656, 0.025182723999023438, 0.02960491180419922, 0.034027099609375, 0.03844928741455078, 0.04287147521972656, 0.047293663024902344, 0.051715850830078125, 0.056138038635253906, 0.06056022644042969, 0.06498241424560547, 0.06940460205078125, 0.07382678985595703, 0.07824897766113281, 0.0826711654663086, 0.08709335327148438, 0.09151554107666016, 0.09593772888183594, 0.10035991668701172, 0.1047821044921875, 0.10920429229736328, 0.11362648010253906, 0.11804866790771484, 0.12247085571289062, 0.1268930435180664, 0.1313152313232422, 0.13573741912841797, 0.14015960693359375, 0.14458179473876953, 0.1490039825439453, 0.1534261703491211, 0.15784835815429688, 0.16227054595947266, 0.16669273376464844, 0.17111492156982422, 0.175537109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 1.0, 7.0, 9.0, 15.0, 24.0, 47.0, 50.0, 54.0, 87.0, 106.0, 90.0, 109.0, 104.0, 75.0, 53.0, 46.0, 36.0, 30.0, 20.0, 12.0, 10.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013554096221923828, -0.00013245176523923874, -0.0001293625682592392, -0.00012627337127923965, -0.0001231841742992401, -0.00012009497731924057, -0.00011700578033924103, -0.00011391658335924149, -0.00011082738637924194, -0.0001077381893992424, -0.00010464899241924286, -0.00010155979543924332, -9.847059845924377e-05, -9.538140147924423e-05, -9.229220449924469e-05, -8.920300751924515e-05, -8.61138105392456e-05, -8.302461355924606e-05, -7.993541657924652e-05, -7.684621959924698e-05, -7.375702261924744e-05, -7.06678256392479e-05, -6.757862865924835e-05, -6.448943167924881e-05, -6.140023469924927e-05, -5.8311037719249725e-05, -5.522184073925018e-05, -5.213264375925064e-05, -4.90434467792511e-05, -4.5954249799251556e-05, -4.2865052819252014e-05, -3.977585583925247e-05, -3.668665885925293e-05, -3.359746187925339e-05, -3.0508264899253845e-05, -2.7419067919254303e-05, -2.432987093925476e-05, -2.124067395925522e-05, -1.8151476979255676e-05, -1.5062279999256134e-05, -1.1973083019256592e-05, -8.88388603925705e-06, -5.794689059257507e-06, -2.705492079257965e-06, 3.8370490074157715e-07, 3.4729018807411194e-06, 6.562098860740662e-06, 9.651295840740204e-06, 1.2740492820739746e-05, 1.582968980073929e-05, 1.891888678073883e-05, 2.2008083760738373e-05, 2.5097280740737915e-05, 2.8186477720737457e-05, 3.1275674700737e-05, 3.436487168073654e-05, 3.7454068660736084e-05, 4.0543265640735626e-05, 4.363246262073517e-05, 4.672165960073471e-05, 4.981085658073425e-05, 5.2900053560733795e-05, 5.598925054073334e-05, 5.907844752073288e-05, 6.216764450073242e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 2.0, 7.0, 8.0, 14.0, 17.0, 26.0, 46.0, 60.0, 63.0, 103.0, 149.0, 201.0, 331.0, 560.0, 1126.0, 2495.0, 6127.0, 18143.0, 59884.0, 233389.0, 518073.0, 145504.0, 40525.0, 12924.0, 4621.0, 1858.0, 933.0, 465.0, 265.0, 175.0, 115.0, 85.0, 77.0, 44.0, 33.0, 26.0, 23.0, 16.0, 12.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1396484375, -0.13519287109375, -0.1307373046875, -0.12628173828125, -0.121826171875, -0.11737060546875, -0.1129150390625, -0.10845947265625, -0.10400390625, -0.09954833984375, -0.0950927734375, -0.09063720703125, -0.086181640625, -0.08172607421875, -0.0772705078125, -0.07281494140625, -0.068359375, -0.06390380859375, -0.0594482421875, -0.05499267578125, -0.050537109375, -0.04608154296875, -0.0416259765625, -0.03717041015625, -0.03271484375, -0.02825927734375, -0.0238037109375, -0.01934814453125, -0.014892578125, -0.01043701171875, -0.0059814453125, -0.00152587890625, 0.0029296875, 0.00738525390625, 0.0118408203125, 0.01629638671875, 0.020751953125, 0.02520751953125, 0.0296630859375, 0.03411865234375, 0.03857421875, 0.04302978515625, 0.0474853515625, 0.05194091796875, 0.056396484375, 0.06085205078125, 0.0653076171875, 0.06976318359375, 0.07421875, 0.07867431640625, 0.0831298828125, 0.08758544921875, 0.092041015625, 0.09649658203125, 0.1009521484375, 0.10540771484375, 0.10986328125, 0.11431884765625, 0.1187744140625, 0.12322998046875, 0.127685546875, 0.13214111328125, 0.1365966796875, 0.14105224609375, 0.1455078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 1.0, 3.0, 9.0, 9.0, 6.0, 8.0, 15.0, 21.0, 13.0, 24.0, 32.0, 35.0, 46.0, 50.0, 73.0, 78.0, 102.0, 75.0, 63.0, 54.0, 54.0, 45.0, 40.0, 34.0, 19.0, 15.0, 12.0, 12.0, 12.0, 8.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.09893798828125, -0.09633350372314453, -0.09372901916503906, -0.0911245346069336, -0.08852005004882812, -0.08591556549072266, -0.08331108093261719, -0.08070659637451172, -0.07810211181640625, -0.07549762725830078, -0.07289314270019531, -0.07028865814208984, -0.06768417358398438, -0.0650796890258789, -0.06247520446777344, -0.05987071990966797, -0.0572662353515625, -0.05466175079345703, -0.05205726623535156, -0.049452781677246094, -0.046848297119140625, -0.044243812561035156, -0.04163932800292969, -0.03903484344482422, -0.03643035888671875, -0.03382587432861328, -0.031221389770507812, -0.028616905212402344, -0.026012420654296875, -0.023407936096191406, -0.020803451538085938, -0.01819896697998047, -0.015594482421875, -0.012989997863769531, -0.010385513305664062, -0.007781028747558594, -0.005176544189453125, -0.0025720596313476562, 3.24249267578125e-05, 0.0026369094848632812, 0.00524139404296875, 0.007845878601074219, 0.010450363159179688, 0.013054847717285156, 0.015659332275390625, 0.018263816833496094, 0.020868301391601562, 0.02347278594970703, 0.0260772705078125, 0.02868175506591797, 0.03128623962402344, 0.033890724182128906, 0.036495208740234375, 0.039099693298339844, 0.04170417785644531, 0.04430866241455078, 0.04691314697265625, 0.04951763153076172, 0.05212211608886719, 0.054726600646972656, 0.057331085205078125, 0.059935569763183594, 0.06254005432128906, 0.06514453887939453, 0.0677490234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 11.0, 8.0, 31.0, 55.0, 105.0, 193.0, 210.0, 170.0, 99.0, 58.0, 24.0, 13.0, 12.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1753957271575928, -1.099431037902832, -1.0234663486480713, -0.9475017189979553, -0.8715370893478394, -0.7955724000930786, -0.7196077108383179, -0.6436430811882019, -0.5676783919334412, -0.4917137324810028, -0.41574907302856445, -0.3397843837738037, -0.26381972432136536, -0.187855064868927, -0.11189037561416626, -0.03592574596405029, 0.04003894329071045, 0.1160036101937294, 0.19196827709674835, 0.2679329514503479, 0.34389761090278625, 0.4198622703552246, 0.49582695960998535, 0.5717915892601013, 0.6477562785148621, 0.7237209677696228, 0.7996855974197388, 0.8756502866744995, 0.9516149759292603, 1.0275795459747314, 1.1035442352294922, 1.179508924484253, 1.2554736137390137, 1.3314383029937744, 1.4074029922485352, 1.483367681503296, 1.559332251548767, 1.6352969408035278, 1.7112616300582886, 1.7872262001037598, 1.8631908893585205, 1.9391555786132812, 2.015120267868042, 2.0910849571228027, 2.1670496463775635, 2.243014335632324, 2.318978786468506, 2.3949434757232666, 2.4709081649780273, 2.546872854232788, 2.622837543487549, 2.6988022327423096, 2.7747669219970703, 2.850731372833252, 2.926696300506592, 3.0026607513427734, 3.0786256790161133, 3.154590368270874, 3.2305550575256348, 3.3065197467803955, 3.3824844360351562, 3.458448886871338, 3.5344138145446777, 3.6103782653808594, 3.68634295463562]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 11.0, 11.0, 10.0, 13.0, 23.0, 14.0, 20.0, 31.0, 26.0, 28.0, 31.0, 30.0, 51.0, 45.0, 41.0, 43.0, 48.0, 45.0, 42.0, 49.0, 45.0, 46.0, 41.0, 40.0, 23.0, 35.0, 18.0, 28.0, 22.0, 8.0, 14.0, 10.0, 16.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4971299171447754, -1.451413869857788, -1.4056979417800903, -1.359981894493103, -1.3142659664154053, -1.268549919128418, -1.2228338718414307, -1.177117943763733, -1.1314020156860352, -1.0856859683990479, -1.03997004032135, -0.9942539930343628, -0.948538064956665, -0.9028220176696777, -0.8571060299873352, -0.8113900423049927, -0.7656739950180054, -0.7199580073356628, -0.6742420196533203, -0.628525972366333, -0.5828100442886353, -0.537093997001648, -0.4913780093193054, -0.4456620216369629, -0.39994603395462036, -0.35423004627227783, -0.3085140585899353, -0.2627980411052704, -0.21708205342292786, -0.17136606574058533, -0.1256500482559204, -0.07993406057357788, -0.03421807289123535, 0.011497922241687775, 0.0572139173746109, 0.10292991995811462, 0.14864590764045715, 0.19436189532279968, 0.2400779128074646, 0.28579390048980713, 0.33150988817214966, 0.3772258758544922, 0.4229418635368347, 0.46865788102149963, 0.5143738985061646, 0.5600898265838623, 0.6058058738708496, 0.6515218615531921, 0.6972378492355347, 0.7429538369178772, 0.7886698246002197, 0.834385871887207, 0.8801017999649048, 0.9258178472518921, 0.9715338349342346, 1.0172498226165771, 1.0629658699035645, 1.1086819171905518, 1.1543978452682495, 1.2001138925552368, 1.2458298206329346, 1.2915458679199219, 1.3372619152069092, 1.382977843284607, 1.4286937713623047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 7.0, 8.0, 12.0, 5.0, 23.0, 30.0, 39.0, 66.0, 98.0, 158.0, 253.0, 446.0, 710.0, 1336.0, 2904.0, 7868.0, 27157.0, 149589.0, 3602473.0, 337017.0, 44224.0, 11450.0, 4181.0, 1844.0, 911.0, 513.0, 293.0, 210.0, 165.0, 75.0, 59.0, 51.0, 23.0, 23.0, 15.0, 10.0, 5.0, 10.0, 2.0, 6.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33544921875, -0.3248558044433594, -0.31426239013671875, -0.3036689758300781, -0.2930755615234375, -0.2824821472167969, -0.27188873291015625, -0.2612953186035156, -0.250701904296875, -0.24010848999023438, -0.22951507568359375, -0.21892166137695312, -0.2083282470703125, -0.19773483276367188, -0.18714141845703125, -0.17654800415039062, -0.16595458984375, -0.15536117553710938, -0.14476776123046875, -0.13417434692382812, -0.1235809326171875, -0.11298751831054688, -0.10239410400390625, -0.09180068969726562, -0.081207275390625, -0.07061386108398438, -0.06002044677734375, -0.049427032470703125, -0.0388336181640625, -0.028240203857421875, -0.01764678955078125, -0.007053375244140625, 0.0035400390625, 0.014133453369140625, 0.02472686767578125, 0.035320281982421875, 0.0459136962890625, 0.056507110595703125, 0.06710052490234375, 0.07769393920898438, 0.088287353515625, 0.09888076782226562, 0.10947418212890625, 0.12006759643554688, 0.1306610107421875, 0.14125442504882812, 0.15184783935546875, 0.16244125366210938, 0.17303466796875, 0.18362808227539062, 0.19422149658203125, 0.20481491088867188, 0.2154083251953125, 0.22600173950195312, 0.23659515380859375, 0.24718856811523438, 0.257781982421875, 0.2683753967285156, 0.27896881103515625, 0.2895622253417969, 0.3001556396484375, 0.3107490539550781, 0.32134246826171875, 0.3319358825683594, 0.342529296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 12.0, 10.0, 14.0, 16.0, 24.0, 29.0, 29.0, 40.0, 46.0, 49.0, 72.0, 77.0, 67.0, 80.0, 81.0, 66.0, 51.0, 45.0, 37.0, 41.0, 22.0, 20.0, 22.0, 10.0, 12.0, 6.0, 3.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.059112548828125, -0.057383060455322266, -0.05565357208251953, -0.0539240837097168, -0.05219459533691406, -0.05046510696411133, -0.048735618591308594, -0.04700613021850586, -0.045276641845703125, -0.04354715347290039, -0.041817665100097656, -0.04008817672729492, -0.03835868835449219, -0.03662919998168945, -0.03489971160888672, -0.033170223236083984, -0.03144073486328125, -0.029711246490478516, -0.02798175811767578, -0.026252269744873047, -0.024522781372070312, -0.022793292999267578, -0.021063804626464844, -0.01933431625366211, -0.017604827880859375, -0.01587533950805664, -0.014145851135253906, -0.012416362762451172, -0.010686874389648438, -0.008957386016845703, -0.007227897644042969, -0.005498409271240234, -0.0037689208984375, -0.0020394325256347656, -0.00030994415283203125, 0.0014195442199707031, 0.0031490325927734375, 0.004878520965576172, 0.006608009338378906, 0.00833749771118164, 0.010066986083984375, 0.01179647445678711, 0.013525962829589844, 0.015255451202392578, 0.016984939575195312, 0.018714427947998047, 0.02044391632080078, 0.022173404693603516, 0.02390289306640625, 0.025632381439208984, 0.02736186981201172, 0.029091358184814453, 0.030820846557617188, 0.03255033493041992, 0.034279823303222656, 0.03600931167602539, 0.037738800048828125, 0.03946828842163086, 0.041197776794433594, 0.04292726516723633, 0.04465675354003906, 0.0463862419128418, 0.04811573028564453, 0.049845218658447266, 0.05157470703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 11.0, 7.0, 20.0, 19.0, 23.0, 45.0, 47.0, 71.0, 137.0, 183.0, 252.0, 380.0, 686.0, 1247.0, 2430.0, 5224.0, 13005.0, 36606.0, 136006.0, 1163850.0, 2581756.0, 180167.0, 44583.0, 15191.0, 6228.0, 2714.0, 1384.0, 787.0, 432.0, 259.0, 183.0, 119.0, 85.0, 46.0, 25.0, 18.0, 17.0, 8.0, 5.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.2047443389892578, -0.19794082641601562, -0.19113731384277344, -0.18433380126953125, -0.17753028869628906, -0.17072677612304688, -0.1639232635498047, -0.1571197509765625, -0.1503162384033203, -0.14351272583007812, -0.13670921325683594, -0.12990570068359375, -0.12310218811035156, -0.11629867553710938, -0.10949516296386719, -0.102691650390625, -0.09588813781738281, -0.08908462524414062, -0.08228111267089844, -0.07547760009765625, -0.06867408752441406, -0.061870574951171875, -0.05506706237792969, -0.0482635498046875, -0.04146003723144531, -0.034656524658203125, -0.027853012084960938, -0.02104949951171875, -0.014245986938476562, -0.007442474365234375, -0.0006389617919921875, 0.00616455078125, 0.012968063354492188, 0.019771575927734375, 0.026575088500976562, 0.03337860107421875, 0.04018211364746094, 0.046985626220703125, 0.05378913879394531, 0.0605926513671875, 0.06739616394042969, 0.07419967651367188, 0.08100318908691406, 0.08780670166015625, 0.09461021423339844, 0.10141372680664062, 0.10821723937988281, 0.115020751953125, 0.12182426452636719, 0.12862777709960938, 0.13543128967285156, 0.14223480224609375, 0.14903831481933594, 0.15584182739257812, 0.1626453399658203, 0.1694488525390625, 0.1762523651123047, 0.18305587768554688, 0.18985939025878906, 0.19666290283203125, 0.20346641540527344, 0.21026992797851562, 0.2170734405517578, 0.223876953125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 7.0, 17.0, 12.0, 17.0, 23.0, 28.0, 50.0, 84.0, 94.0, 194.0, 351.0, 1122.0, 1235.0, 349.0, 162.0, 92.0, 79.0, 39.0, 24.0, 29.0, 19.0, 13.0, 10.0, 6.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.10089111328125, -0.09837007522583008, -0.09584903717041016, -0.09332799911499023, -0.09080696105957031, -0.08828592300415039, -0.08576488494873047, -0.08324384689331055, -0.08072280883789062, -0.0782017707824707, -0.07568073272705078, -0.07315969467163086, -0.07063865661621094, -0.06811761856079102, -0.0655965805053711, -0.06307554244995117, -0.06055450439453125, -0.05803346633911133, -0.055512428283691406, -0.052991390228271484, -0.05047035217285156, -0.04794931411743164, -0.04542827606201172, -0.0429072380065918, -0.040386199951171875, -0.03786516189575195, -0.03534412384033203, -0.03282308578491211, -0.030302047729492188, -0.027781009674072266, -0.025259971618652344, -0.022738933563232422, -0.0202178955078125, -0.017696857452392578, -0.015175819396972656, -0.012654781341552734, -0.010133743286132812, -0.007612705230712891, -0.005091667175292969, -0.002570629119873047, -4.9591064453125e-05, 0.002471446990966797, 0.004992485046386719, 0.007513523101806641, 0.010034561157226562, 0.012555599212646484, 0.015076637268066406, 0.017597675323486328, 0.02011871337890625, 0.022639751434326172, 0.025160789489746094, 0.027681827545166016, 0.030202865600585938, 0.03272390365600586, 0.03524494171142578, 0.0377659797668457, 0.040287017822265625, 0.04280805587768555, 0.04532909393310547, 0.04785013198852539, 0.05037117004394531, 0.052892208099365234, 0.055413246154785156, 0.05793428421020508, 0.060455322265625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 19.0, 47.0, 66.0, 166.0, 246.0, 216.0, 130.0, 57.0, 31.0, 17.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3823726177215576, -0.3583725094795227, -0.3343724012374878, -0.3103722929954529, -0.28637218475341797, -0.26237207651138306, -0.23837193846702576, -0.21437183022499084, -0.19037172198295593, -0.16637161374092102, -0.1423715054988861, -0.11837138235569, -0.09437127411365509, -0.07037116587162018, -0.04637104272842407, -0.02237093448638916, 0.001629173755645752, 0.025629285722970963, 0.04962939769029617, 0.07362951338291168, 0.0976296216249466, 0.1216297298669815, 0.1456298530101776, 0.16962996125221252, 0.19363006949424744, 0.21763017773628235, 0.24163028597831726, 0.26563042402267456, 0.2896305322647095, 0.3136306405067444, 0.3376307487487793, 0.3616308569908142, 0.3856309652328491, 0.40963107347488403, 0.43363118171691895, 0.45763128995895386, 0.48163139820098877, 0.5056315064430237, 0.5296316146850586, 0.5536317825317383, 0.5776318311691284, 0.6016319394111633, 0.6256320476531982, 0.6496321558952332, 0.6736322641372681, 0.697632372379303, 0.7216324806213379, 0.7456326484680176, 0.7696327567100525, 0.7936328649520874, 0.8176329731941223, 0.8416330814361572, 0.8656331896781921, 0.889633297920227, 0.9136334657669067, 0.9376335144042969, 0.9616336822509766, 0.9856337904930115, 1.0096338987350464, 1.033634066581726, 1.0576341152191162, 1.081634283065796, 1.105634331703186, 1.1296344995498657, 1.1536345481872559]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 3.0, 11.0, 5.0, 10.0, 10.0, 14.0, 16.0, 14.0, 27.0, 19.0, 25.0, 29.0, 31.0, 32.0, 36.0, 47.0, 42.0, 48.0, 46.0, 40.0, 37.0, 37.0, 36.0, 29.0, 40.0, 37.0, 36.0, 27.0, 37.0, 21.0, 22.0, 30.0, 16.0, 9.0, 13.0, 14.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.21842819452285767, -0.2109563797712326, -0.20348455011844635, -0.1960127353668213, -0.18854090571403503, -0.18106909096240997, -0.1735972762107849, -0.16612544655799866, -0.1586536318063736, -0.15118181705474854, -0.14370998740196228, -0.13623817265033722, -0.12876635789871216, -0.1212945282459259, -0.11382271349430084, -0.10635089129209518, -0.09887906908988953, -0.09140724688768387, -0.08393542468547821, -0.07646360993385315, -0.06899178773164749, -0.061519965529441833, -0.054048147052526474, -0.046576328575611115, -0.03910450637340546, -0.0316326841711998, -0.02416086569428444, -0.01668904535472393, -0.009217225015163422, -0.0017454028129577637, 0.005726415663957596, 0.013198234140872955, 0.020670056343078613, 0.028141876682639122, 0.03561369702219963, 0.04308551549911499, 0.05055733770132065, 0.058029159903526306, 0.06550097465515137, 0.07297279685735703, 0.08044461905956268, 0.08791644126176834, 0.095388263463974, 0.10286007821559906, 0.11033190041780472, 0.11780372262001038, 0.12527553737163544, 0.1327473521232605, 0.14021918177604675, 0.14769099652767181, 0.15516282618045807, 0.16263464093208313, 0.17010647058486938, 0.17757828533649445, 0.1850501000881195, 0.19252192974090576, 0.19999374449253082, 0.20746555924415588, 0.21493738889694214, 0.2224092036485672, 0.22988101840019226, 0.23735284805297852, 0.24482466280460358, 0.25229647755622864, 0.2597683072090149]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 3.0, 5.0, 9.0, 17.0, 17.0, 37.0, 36.0, 59.0, 81.0, 111.0, 224.0, 321.0, 480.0, 760.0, 1418.0, 2469.0, 4906.0, 9686.0, 19605.0, 42483.0, 94913.0, 208869.0, 316479.0, 186725.0, 84713.0, 37987.0, 17558.0, 8442.0, 4380.0, 2359.0, 1278.0, 775.0, 480.0, 281.0, 202.0, 126.0, 82.0, 59.0, 44.0, 25.0, 17.0, 10.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.1641845703125, -0.15979766845703125, -0.1554107666015625, -0.15102386474609375, -0.146636962890625, -0.14225006103515625, -0.1378631591796875, -0.13347625732421875, -0.12908935546875, -0.12470245361328125, -0.1203155517578125, -0.11592864990234375, -0.111541748046875, -0.10715484619140625, -0.1027679443359375, -0.09838104248046875, -0.093994140625, -0.08960723876953125, -0.0852203369140625, -0.08083343505859375, -0.076446533203125, -0.07205963134765625, -0.0676727294921875, -0.06328582763671875, -0.05889892578125, -0.05451202392578125, -0.0501251220703125, -0.04573822021484375, -0.041351318359375, -0.03696441650390625, -0.0325775146484375, -0.02819061279296875, -0.0238037109375, -0.01941680908203125, -0.0150299072265625, -0.01064300537109375, -0.006256103515625, -0.00186920166015625, 0.0025177001953125, 0.00690460205078125, 0.01129150390625, 0.01567840576171875, 0.0200653076171875, 0.02445220947265625, 0.028839111328125, 0.03322601318359375, 0.0376129150390625, 0.04199981689453125, 0.04638671875, 0.05077362060546875, 0.0551605224609375, 0.05954742431640625, 0.063934326171875, 0.06832122802734375, 0.0727081298828125, 0.07709503173828125, 0.08148193359375, 0.08586883544921875, 0.0902557373046875, 0.09464263916015625, 0.099029541015625, 0.10341644287109375, 0.1078033447265625, 0.11219024658203125, 0.1165771484375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 11.0, 11.0, 19.0, 26.0, 30.0, 32.0, 52.0, 48.0, 40.0, 60.0, 93.0, 68.0, 77.0, 74.0, 64.0, 50.0, 48.0, 41.0, 29.0, 33.0, 18.0, 17.0, 11.0, 10.0, 4.0, 7.0, 7.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06231689453125, -0.06062889099121094, -0.058940887451171875, -0.05725288391113281, -0.05556488037109375, -0.05387687683105469, -0.052188873291015625, -0.05050086975097656, -0.0488128662109375, -0.04712486267089844, -0.045436859130859375, -0.04374885559082031, -0.04206085205078125, -0.04037284851074219, -0.038684844970703125, -0.03699684143066406, -0.035308837890625, -0.03362083435058594, -0.031932830810546875, -0.030244827270507812, -0.02855682373046875, -0.026868820190429688, -0.025180816650390625, -0.023492813110351562, -0.0218048095703125, -0.020116806030273438, -0.018428802490234375, -0.016740798950195312, -0.01505279541015625, -0.013364791870117188, -0.011676788330078125, -0.009988784790039062, -0.00830078125, -0.0066127777099609375, -0.004924774169921875, -0.0032367706298828125, -0.00154876708984375, 0.0001392364501953125, 0.001827239990234375, 0.0035152435302734375, 0.0052032470703125, 0.0068912506103515625, 0.008579254150390625, 0.010267257690429688, 0.01195526123046875, 0.013643264770507812, 0.015331268310546875, 0.017019271850585938, 0.018707275390625, 0.020395278930664062, 0.022083282470703125, 0.023771286010742188, 0.02545928955078125, 0.027147293090820312, 0.028835296630859375, 0.030523300170898438, 0.0322113037109375, 0.03389930725097656, 0.035587310791015625, 0.03727531433105469, 0.03896331787109375, 0.04065132141113281, 0.042339324951171875, 0.04402732849121094, 0.04571533203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 7.0, 8.0, 20.0, 32.0, 35.0, 63.0, 68.0, 93.0, 159.0, 227.0, 393.0, 630.0, 1229.0, 2419.0, 5650.0, 15875.0, 54567.0, 192746.0, 433521.0, 238765.0, 69242.0, 19978.0, 6825.0, 2781.0, 1302.0, 701.0, 396.0, 272.0, 150.0, 114.0, 74.0, 52.0, 43.0, 30.0, 23.0, 13.0, 12.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.228515625, -0.22243690490722656, -0.21635818481445312, -0.2102794647216797, -0.20420074462890625, -0.1981220245361328, -0.19204330444335938, -0.18596458435058594, -0.1798858642578125, -0.17380714416503906, -0.16772842407226562, -0.1616497039794922, -0.15557098388671875, -0.1494922637939453, -0.14341354370117188, -0.13733482360839844, -0.131256103515625, -0.12517738342285156, -0.11909866333007812, -0.11301994323730469, -0.10694122314453125, -0.10086250305175781, -0.09478378295898438, -0.08870506286621094, -0.0826263427734375, -0.07654762268066406, -0.07046890258789062, -0.06439018249511719, -0.05831146240234375, -0.05223274230957031, -0.046154022216796875, -0.04007530212402344, -0.03399658203125, -0.027917861938476562, -0.021839141845703125, -0.015760421752929688, -0.00968170166015625, -0.0036029815673828125, 0.002475738525390625, 0.008554458618164062, 0.0146331787109375, 0.020711898803710938, 0.026790618896484375, 0.03286933898925781, 0.03894805908203125, 0.04502677917480469, 0.051105499267578125, 0.05718421936035156, 0.063262939453125, 0.06934165954589844, 0.07542037963867188, 0.08149909973144531, 0.08757781982421875, 0.09365653991699219, 0.09973526000976562, 0.10581398010253906, 0.1118927001953125, 0.11797142028808594, 0.12405014038085938, 0.1301288604736328, 0.13620758056640625, 0.1422863006591797, 0.14836502075195312, 0.15444374084472656, 0.1605224609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 8.0, 5.0, 16.0, 16.0, 17.0, 23.0, 37.0, 36.0, 33.0, 47.0, 49.0, 51.0, 61.0, 58.0, 56.0, 59.0, 47.0, 57.0, 44.0, 49.0, 42.0, 42.0, 21.0, 20.0, 23.0, 17.0, 13.0, 6.0, 6.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.315185546875, -0.3072471618652344, -0.29930877685546875, -0.2913703918457031, -0.2834320068359375, -0.2754936218261719, -0.26755523681640625, -0.2596168518066406, -0.251678466796875, -0.24374008178710938, -0.23580169677734375, -0.22786331176757812, -0.2199249267578125, -0.21198654174804688, -0.20404815673828125, -0.19610977172851562, -0.18817138671875, -0.18023300170898438, -0.17229461669921875, -0.16435623168945312, -0.1564178466796875, -0.14847946166992188, -0.14054107666015625, -0.13260269165039062, -0.124664306640625, -0.11672592163085938, -0.10878753662109375, -0.10084915161132812, -0.0929107666015625, -0.08497238159179688, -0.07703399658203125, -0.06909561157226562, -0.0611572265625, -0.053218841552734375, -0.04528045654296875, -0.037342071533203125, -0.0294036865234375, -0.021465301513671875, -0.01352691650390625, -0.005588531494140625, 0.002349853515625, 0.010288238525390625, 0.01822662353515625, 0.026165008544921875, 0.0341033935546875, 0.042041778564453125, 0.04998016357421875, 0.057918548583984375, 0.06585693359375, 0.07379531860351562, 0.08173370361328125, 0.08967208862304688, 0.0976104736328125, 0.10554885864257812, 0.11348724365234375, 0.12142562866210938, 0.129364013671875, 0.13730239868164062, 0.14524078369140625, 0.15317916870117188, 0.1611175537109375, 0.16905593872070312, 0.17699432373046875, 0.18493270874023438, 0.19287109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 16.0, 13.0, 16.0, 27.0, 38.0, 65.0, 88.0, 158.0, 201.0, 374.0, 649.0, 1150.0, 2540.0, 5550.0, 13831.0, 38678.0, 125935.0, 401739.0, 317508.0, 90954.0, 29132.0, 10856.0, 4415.0, 2090.0, 1066.0, 586.0, 293.0, 200.0, 120.0, 84.0, 53.0, 37.0, 26.0, 18.0, 16.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0712890625, -0.06863594055175781, -0.06598281860351562, -0.06332969665527344, -0.06067657470703125, -0.05802345275878906, -0.055370330810546875, -0.05271720886230469, -0.0500640869140625, -0.04741096496582031, -0.044757843017578125, -0.04210472106933594, -0.03945159912109375, -0.03679847717285156, -0.034145355224609375, -0.03149223327636719, -0.028839111328125, -0.026185989379882812, -0.023532867431640625, -0.020879745483398438, -0.01822662353515625, -0.015573501586914062, -0.012920379638671875, -0.010267257690429688, -0.0076141357421875, -0.0049610137939453125, -0.002307891845703125, 0.0003452301025390625, 0.00299835205078125, 0.0056514739990234375, 0.008304595947265625, 0.010957717895507812, 0.01361083984375, 0.016263961791992188, 0.018917083740234375, 0.021570205688476562, 0.02422332763671875, 0.026876449584960938, 0.029529571533203125, 0.03218269348144531, 0.0348358154296875, 0.03748893737792969, 0.040142059326171875, 0.04279518127441406, 0.04544830322265625, 0.04810142517089844, 0.050754547119140625, 0.05340766906738281, 0.056060791015625, 0.05871391296386719, 0.061367034912109375, 0.06402015686035156, 0.06667327880859375, 0.06932640075683594, 0.07197952270507812, 0.07463264465332031, 0.0772857666015625, 0.07993888854980469, 0.08259201049804688, 0.08524513244628906, 0.08789825439453125, 0.09055137634277344, 0.09320449829101562, 0.09585762023925781, 0.0985107421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 8.0, 17.0, 17.0, 19.0, 22.0, 36.0, 41.0, 43.0, 54.0, 54.0, 65.0, 68.0, 68.0, 68.0, 58.0, 62.0, 52.0, 51.0, 56.0, 29.0, 25.0, 15.0, 13.0, 13.0, 10.0, 2.0, 8.0, 7.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7578086853027344e-05, -5.5806711316108704e-05, -5.4035335779190063e-05, -5.226396024227142e-05, -5.049258470535278e-05, -4.872120916843414e-05, -4.69498336315155e-05, -4.517845809459686e-05, -4.340708255767822e-05, -4.163570702075958e-05, -3.986433148384094e-05, -3.80929559469223e-05, -3.632158041000366e-05, -3.455020487308502e-05, -3.277882933616638e-05, -3.100745379924774e-05, -2.92360782623291e-05, -2.746470272541046e-05, -2.569332718849182e-05, -2.392195165157318e-05, -2.215057611465454e-05, -2.03792005777359e-05, -1.860782504081726e-05, -1.683644950389862e-05, -1.506507396697998e-05, -1.329369843006134e-05, -1.15223228931427e-05, -9.75094735622406e-06, -7.97957181930542e-06, -6.20819628238678e-06, -4.43682074546814e-06, -2.6654452085494995e-06, -8.940696716308594e-07, 8.773058652877808e-07, 2.648681402206421e-06, 4.420056939125061e-06, 6.191432476043701e-06, 7.962808012962341e-06, 9.734183549880981e-06, 1.1505559086799622e-05, 1.3276934623718262e-05, 1.5048310160636902e-05, 1.6819685697555542e-05, 1.8591061234474182e-05, 2.0362436771392822e-05, 2.2133812308311462e-05, 2.3905187845230103e-05, 2.5676563382148743e-05, 2.7447938919067383e-05, 2.9219314455986023e-05, 3.099068999290466e-05, 3.27620655298233e-05, 3.453344106674194e-05, 3.6304816603660583e-05, 3.8076192140579224e-05, 3.9847567677497864e-05, 4.1618943214416504e-05, 4.3390318751335144e-05, 4.5161694288253784e-05, 4.6933069825172424e-05, 4.8704445362091064e-05, 5.0475820899009705e-05, 5.2247196435928345e-05, 5.4018571972846985e-05, 5.5789947509765625e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 9.0, 14.0, 29.0, 24.0, 43.0, 58.0, 107.0, 121.0, 238.0, 422.0, 735.0, 1563.0, 3191.0, 7762.0, 22279.0, 74866.0, 300314.0, 453042.0, 127706.0, 35368.0, 11663.0, 4616.0, 1968.0, 1001.0, 527.0, 288.0, 196.0, 115.0, 74.0, 63.0, 36.0, 22.0, 20.0, 9.0, 9.0, 6.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0819091796875, -0.07919692993164062, -0.07648468017578125, -0.07377243041992188, -0.0710601806640625, -0.06834793090820312, -0.06563568115234375, -0.06292343139648438, -0.060211181640625, -0.057498931884765625, -0.05478668212890625, -0.052074432373046875, -0.0493621826171875, -0.046649932861328125, -0.04393768310546875, -0.041225433349609375, -0.03851318359375, -0.035800933837890625, -0.03308868408203125, -0.030376434326171875, -0.0276641845703125, -0.024951934814453125, -0.02223968505859375, -0.019527435302734375, -0.016815185546875, -0.014102935791015625, -0.01139068603515625, -0.008678436279296875, -0.0059661865234375, -0.003253936767578125, -0.00054168701171875, 0.002170562744140625, 0.0048828125, 0.007595062255859375, 0.01030731201171875, 0.013019561767578125, 0.0157318115234375, 0.018444061279296875, 0.02115631103515625, 0.023868560791015625, 0.026580810546875, 0.029293060302734375, 0.03200531005859375, 0.034717559814453125, 0.0374298095703125, 0.040142059326171875, 0.04285430908203125, 0.045566558837890625, 0.04827880859375, 0.050991058349609375, 0.05370330810546875, 0.056415557861328125, 0.0591278076171875, 0.061840057373046875, 0.06455230712890625, 0.06726455688476562, 0.069976806640625, 0.07268905639648438, 0.07540130615234375, 0.07811355590820312, 0.0808258056640625, 0.08353805541992188, 0.08625030517578125, 0.08896255493164062, 0.0916748046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 4.0, 1.0, 3.0, 8.0, 8.0, 11.0, 13.0, 21.0, 23.0, 20.0, 30.0, 26.0, 52.0, 55.0, 49.0, 61.0, 83.0, 64.0, 59.0, 79.0, 48.0, 55.0, 41.0, 33.0, 32.0, 28.0, 23.0, 21.0, 16.0, 7.0, 8.0, 7.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0517578125, -0.049953460693359375, -0.04814910888671875, -0.046344757080078125, -0.0445404052734375, -0.042736053466796875, -0.04093170166015625, -0.039127349853515625, -0.037322998046875, -0.035518646240234375, -0.03371429443359375, -0.031909942626953125, -0.0301055908203125, -0.028301239013671875, -0.02649688720703125, -0.024692535400390625, -0.02288818359375, -0.021083831787109375, -0.01927947998046875, -0.017475128173828125, -0.0156707763671875, -0.013866424560546875, -0.01206207275390625, -0.010257720947265625, -0.008453369140625, -0.006649017333984375, -0.00484466552734375, -0.003040313720703125, -0.0012359619140625, 0.000568389892578125, 0.00237274169921875, 0.004177093505859375, 0.0059814453125, 0.007785797119140625, 0.00959014892578125, 0.011394500732421875, 0.0131988525390625, 0.015003204345703125, 0.01680755615234375, 0.018611907958984375, 0.020416259765625, 0.022220611572265625, 0.02402496337890625, 0.025829315185546875, 0.0276336669921875, 0.029438018798828125, 0.03124237060546875, 0.033046722412109375, 0.03485107421875, 0.036655426025390625, 0.03845977783203125, 0.040264129638671875, 0.0420684814453125, 0.043872833251953125, 0.04567718505859375, 0.047481536865234375, 0.049285888671875, 0.051090240478515625, 0.05289459228515625, 0.054698944091796875, 0.0565032958984375, 0.058307647705078125, 0.06011199951171875, 0.061916351318359375, 0.063720703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 9.0, 16.0, 29.0, 46.0, 60.0, 94.0, 117.0, 151.0, 144.0, 103.0, 93.0, 55.0, 36.0, 18.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5754654407501221, -0.5339462757110596, -0.4924270808696747, -0.4509079158306122, -0.4093887209892273, -0.3678695559501648, -0.3263503909111023, -0.2848311960697174, -0.2433120310306549, -0.2017928510904312, -0.16027367115020752, -0.11875450611114502, -0.07723532617092133, -0.03571614623069763, 0.005803018808364868, 0.047322213649749756, 0.08884137868881226, 0.13036055862903595, 0.17187973856925964, 0.21339890360832214, 0.25491809844970703, 0.29643726348876953, 0.33795642852783203, 0.3794756233692169, 0.4209947884082794, 0.4625139534473419, 0.5040331482887268, 0.5455523133277893, 0.5870714783668518, 0.6285907030105591, 0.6701098680496216, 0.7116290330886841, 0.7531481981277466, 0.7946673631668091, 0.8361865282058716, 0.8777056932449341, 0.9192249178886414, 0.9607440829277039, 1.0022633075714111, 1.0437824726104736, 1.0853016376495361, 1.1268208026885986, 1.1683399677276611, 1.2098591327667236, 1.2513782978057861, 1.2928974628448486, 1.3344166278839111, 1.3759359121322632, 1.4174549579620361, 1.4589741230010986, 1.5004932880401611, 1.5420124530792236, 1.5835316181182861, 1.6250507831573486, 1.6665699481964111, 1.7080892324447632, 1.7496083974838257, 1.7911275625228882, 1.8326467275619507, 1.8741658926010132, 1.9156850576400757, 1.9572043418884277, 1.9987235069274902, 2.0402426719665527, 2.0817618370056152]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 7.0, 2.0, 4.0, 10.0, 10.0, 18.0, 17.0, 18.0, 25.0, 27.0, 21.0, 27.0, 32.0, 36.0, 32.0, 35.0, 41.0, 30.0, 45.0, 45.0, 59.0, 53.0, 37.0, 43.0, 32.0, 33.0, 30.0, 25.0, 28.0, 28.0, 14.0, 26.0, 19.0, 15.0, 16.0, 7.0, 13.0, 8.0, 3.0, 7.0, 7.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.980883002281189, -0.9472073316574097, -0.9135316610336304, -0.8798559904098511, -0.846180260181427, -0.8125045895576477, -0.7788289189338684, -0.7451532483100891, -0.711477518081665, -0.6778018474578857, -0.6441261768341064, -0.6104505062103271, -0.5767747759819031, -0.5430991053581238, -0.5094234347343445, -0.4757477641105652, -0.4420720934867859, -0.4083964228630066, -0.3747207224369049, -0.3410450518131256, -0.3073693513870239, -0.27369368076324463, -0.24001801013946533, -0.20634232461452484, -0.17266663908958435, -0.13899095356464386, -0.10531527549028397, -0.07163959741592407, -0.03796391189098358, -0.004288226366043091, 0.029387444257736206, 0.0630631297826767, 0.09673881530761719, 0.13041450083255768, 0.16409018635749817, 0.19776585698127747, 0.23144154250621796, 0.26511722803115845, 0.29879289865493774, 0.33246856927871704, 0.3661442697048187, 0.399819940328598, 0.4334956407546997, 0.467171311378479, 0.5008469820022583, 0.5345226526260376, 0.5681983232498169, 0.601874053478241, 0.6355497241020203, 0.6692253947257996, 0.7029010653495789, 0.7365767955780029, 0.7702524662017822, 0.8039281368255615, 0.8376038074493408, 0.8712794780731201, 0.9049551486968994, 0.9386308193206787, 0.972306489944458, 1.0059821605682373, 1.0396578311920166, 1.073333501815796, 1.1070091724395752, 1.140684962272644, 1.1743606328964233]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 9.0, 12.0, 25.0, 34.0, 46.0, 69.0, 101.0, 160.0, 261.0, 429.0, 729.0, 1259.0, 2512.0, 5346.0, 12686.0, 36858.0, 158277.0, 3417267.0, 456218.0, 66198.0, 20082.0, 7807.0, 3561.0, 1800.0, 976.0, 539.0, 329.0, 209.0, 137.0, 95.0, 71.0, 36.0, 31.0, 26.0, 15.0, 15.0, 13.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18262290954589844, -0.17603683471679688, -0.1694507598876953, -0.16286468505859375, -0.1562786102294922, -0.14969253540039062, -0.14310646057128906, -0.1365203857421875, -0.12993431091308594, -0.12334823608398438, -0.11676216125488281, -0.11017608642578125, -0.10359001159667969, -0.09700393676757812, -0.09041786193847656, -0.083831787109375, -0.07724571228027344, -0.07065963745117188, -0.06407356262207031, -0.05748748779296875, -0.05090141296386719, -0.044315338134765625, -0.03772926330566406, -0.0311431884765625, -0.024557113647460938, -0.017971038818359375, -0.011384963989257812, -0.00479888916015625, 0.0017871856689453125, 0.008373260498046875, 0.014959335327148438, 0.02154541015625, 0.028131484985351562, 0.034717559814453125, 0.04130363464355469, 0.04788970947265625, 0.05447578430175781, 0.061061859130859375, 0.06764793395996094, 0.0742340087890625, 0.08082008361816406, 0.08740615844726562, 0.09399223327636719, 0.10057830810546875, 0.10716438293457031, 0.11375045776367188, 0.12033653259277344, 0.126922607421875, 0.13350868225097656, 0.14009475708007812, 0.1466808319091797, 0.15326690673828125, 0.1598529815673828, 0.16643905639648438, 0.17302513122558594, 0.1796112060546875, 0.18619728088378906, 0.19278335571289062, 0.1993694305419922, 0.20595550537109375, 0.2125415802001953, 0.21912765502929688, 0.22571372985839844, 0.2322998046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 17.0, 24.0, 22.0, 26.0, 29.0, 37.0, 21.0, 37.0, 42.0, 48.0, 59.0, 62.0, 67.0, 51.0, 55.0, 49.0, 54.0, 40.0, 37.0, 42.0, 28.0, 26.0, 22.0, 16.0, 14.0, 13.0, 11.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041259765625, -0.039888858795166016, -0.03851795196533203, -0.03714704513549805, -0.03577613830566406, -0.03440523147583008, -0.033034324645996094, -0.03166341781616211, -0.030292510986328125, -0.02892160415649414, -0.027550697326660156, -0.026179790496826172, -0.024808883666992188, -0.023437976837158203, -0.02206707000732422, -0.020696163177490234, -0.01932525634765625, -0.017954349517822266, -0.01658344268798828, -0.015212535858154297, -0.013841629028320312, -0.012470722198486328, -0.011099815368652344, -0.00972890853881836, -0.008358001708984375, -0.006987094879150391, -0.005616188049316406, -0.004245281219482422, -0.0028743743896484375, -0.0015034675598144531, -0.00013256072998046875, 0.0012383460998535156, 0.0026092529296875, 0.003980159759521484, 0.005351066589355469, 0.006721973419189453, 0.008092880249023438, 0.009463787078857422, 0.010834693908691406, 0.01220560073852539, 0.013576507568359375, 0.01494741439819336, 0.016318321228027344, 0.017689228057861328, 0.019060134887695312, 0.020431041717529297, 0.02180194854736328, 0.023172855377197266, 0.02454376220703125, 0.025914669036865234, 0.02728557586669922, 0.028656482696533203, 0.030027389526367188, 0.03139829635620117, 0.032769203186035156, 0.03414011001586914, 0.035511016845703125, 0.03688192367553711, 0.038252830505371094, 0.03962373733520508, 0.04099464416503906, 0.04236555099487305, 0.04373645782470703, 0.045107364654541016, 0.046478271484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 10.0, 10.0, 30.0, 38.0, 55.0, 82.0, 129.0, 221.0, 338.0, 691.0, 1310.0, 2776.0, 6231.0, 16597.0, 53464.0, 270453.0, 3196294.0, 528099.0, 79623.0, 22145.0, 8180.0, 3654.0, 1733.0, 867.0, 486.0, 266.0, 173.0, 102.0, 60.0, 43.0, 29.0, 23.0, 11.0, 15.0, 12.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.17103195190429688, -0.16506195068359375, -0.15909194946289062, -0.1531219482421875, -0.14715194702148438, -0.14118194580078125, -0.13521194458007812, -0.129241943359375, -0.12327194213867188, -0.11730194091796875, -0.11133193969726562, -0.1053619384765625, -0.09939193725585938, -0.09342193603515625, -0.08745193481445312, -0.08148193359375, -0.07551193237304688, -0.06954193115234375, -0.06357192993164062, -0.0576019287109375, -0.051631927490234375, -0.04566192626953125, -0.039691925048828125, -0.033721923828125, -0.027751922607421875, -0.02178192138671875, -0.015811920166015625, -0.0098419189453125, -0.003871917724609375, 0.00209808349609375, 0.008068084716796875, 0.0140380859375, 0.020008087158203125, 0.02597808837890625, 0.031948089599609375, 0.0379180908203125, 0.043888092041015625, 0.04985809326171875, 0.055828094482421875, 0.061798095703125, 0.06776809692382812, 0.07373809814453125, 0.07970809936523438, 0.0856781005859375, 0.09164810180664062, 0.09761810302734375, 0.10358810424804688, 0.10955810546875, 0.11552810668945312, 0.12149810791015625, 0.12746810913085938, 0.1334381103515625, 0.13940811157226562, 0.14537811279296875, 0.15134811401367188, 0.157318115234375, 0.16328811645507812, 0.16925811767578125, 0.17522811889648438, 0.1811981201171875, 0.18716812133789062, 0.19313812255859375, 0.19910812377929688, 0.205078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 18.0, 21.0, 18.0, 30.0, 50.0, 66.0, 94.0, 174.0, 238.0, 579.0, 1470.0, 588.0, 250.0, 148.0, 106.0, 58.0, 29.0, 30.0, 12.0, 12.0, 9.0, 12.0, 7.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.049163818359375, -0.04730653762817383, -0.045449256896972656, -0.043591976165771484, -0.04173469543457031, -0.03987741470336914, -0.03802013397216797, -0.0361628532409668, -0.034305572509765625, -0.03244829177856445, -0.03059101104736328, -0.02873373031616211, -0.026876449584960938, -0.025019168853759766, -0.023161888122558594, -0.021304607391357422, -0.01944732666015625, -0.017590045928955078, -0.015732765197753906, -0.013875484466552734, -0.012018203735351562, -0.01016092300415039, -0.008303642272949219, -0.006446361541748047, -0.004589080810546875, -0.002731800079345703, -0.0008745193481445312, 0.0009827613830566406, 0.0028400421142578125, 0.004697322845458984, 0.006554603576660156, 0.008411884307861328, 0.0102691650390625, 0.012126445770263672, 0.013983726501464844, 0.015841007232666016, 0.017698287963867188, 0.01955556869506836, 0.02141284942626953, 0.023270130157470703, 0.025127410888671875, 0.026984691619873047, 0.02884197235107422, 0.03069925308227539, 0.03255653381347656, 0.034413814544677734, 0.036271095275878906, 0.03812837600708008, 0.03998565673828125, 0.04184293746948242, 0.043700218200683594, 0.045557498931884766, 0.04741477966308594, 0.04927206039428711, 0.05112934112548828, 0.05298662185668945, 0.054843902587890625, 0.0567011833190918, 0.05855846405029297, 0.06041574478149414, 0.06227302551269531, 0.06413030624389648, 0.06598758697509766, 0.06784486770629883, 0.0697021484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 9.0, 13.0, 36.0, 46.0, 100.0, 129.0, 143.0, 145.0, 138.0, 93.0, 58.0, 42.0, 15.0, 12.0, 14.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25761300325393677, -0.2436131238937378, -0.2296132594347, -0.21561338007450104, -0.20161351561546326, -0.18761363625526428, -0.1736137568950653, -0.15961389243602753, -0.14561402797698975, -0.13161414861679077, -0.11761428415775299, -0.10361440479755402, -0.08961454033851624, -0.07561466097831726, -0.06161478906869888, -0.047614917159080505, -0.03361503779888153, -0.019615165889263153, -0.005615292116999626, 0.0083845816552639, 0.02238445356488228, 0.036384329199790955, 0.05038420110940933, 0.06438407301902771, 0.07838394492864609, 0.09238381683826447, 0.10638368874788284, 0.12038356065750122, 0.1343834400177002, 0.14838331937789917, 0.16238318383693695, 0.17638304829597473, 0.1903829276561737, 0.20438280701637268, 0.21838267147541046, 0.23238255083560944, 0.24638241529464722, 0.2603822946548462, 0.27438217401504517, 0.28838205337524414, 0.3023819029331207, 0.3163817822933197, 0.3303816616535187, 0.34438151121139526, 0.35838139057159424, 0.3723812699317932, 0.3863811492919922, 0.40038102865219116, 0.41438090801239014, 0.4283807873725891, 0.4423806667327881, 0.4563805162906647, 0.47038039565086365, 0.4843802750110626, 0.4983801543712616, 0.5123800039291382, 0.5263798832893372, 0.5403797626495361, 0.5543796420097351, 0.5683795213699341, 0.5823794007301331, 0.596379280090332, 0.6103790998458862, 0.6243789792060852, 0.6383788585662842]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 2.0, 6.0, 5.0, 9.0, 13.0, 6.0, 8.0, 15.0, 13.0, 33.0, 22.0, 30.0, 30.0, 42.0, 32.0, 52.0, 44.0, 45.0, 42.0, 30.0, 44.0, 42.0, 43.0, 35.0, 36.0, 39.0, 33.0, 28.0, 36.0, 32.0, 22.0, 22.0, 19.0, 18.0, 17.0, 16.0, 7.0, 2.0, 9.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.21582037210464478, -0.20919713377952576, -0.20257388055324554, -0.19595062732696533, -0.1893273890018463, -0.1827041506767273, -0.17608089745044708, -0.16945764422416687, -0.16283440589904785, -0.15621116757392883, -0.14958791434764862, -0.1429646611213684, -0.1363414227962494, -0.12971818447113037, -0.12309493124485016, -0.11647168546915054, -0.10984843969345093, -0.10322519391775131, -0.0966019481420517, -0.08997870236635208, -0.08335545659065247, -0.07673221081495285, -0.07010896503925323, -0.06348571926355362, -0.056862473487854004, -0.05023922771215439, -0.04361598193645477, -0.03699273616075516, -0.030369490385055542, -0.023746244609355927, -0.01712299883365631, -0.010499753057956696, -0.00387650728225708, 0.0027467384934425354, 0.009369984269142151, 0.015993230044841766, 0.022616475820541382, 0.029239721596240997, 0.03586296737194061, 0.04248621314764023, 0.049109458923339844, 0.05573270469903946, 0.062355950474739075, 0.06897919625043869, 0.0756024420261383, 0.08222568780183792, 0.08884893357753754, 0.09547217935323715, 0.10209542512893677, 0.10871867090463638, 0.115341916680336, 0.12196516245603561, 0.12858840823173523, 0.13521164655685425, 0.14183489978313446, 0.14845815300941467, 0.1550813913345337, 0.1617046296596527, 0.16832788288593292, 0.17495113611221313, 0.18157437443733215, 0.18819761276245117, 0.19482086598873138, 0.2014441192150116, 0.20806735754013062]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 12.0, 7.0, 11.0, 17.0, 19.0, 23.0, 41.0, 59.0, 115.0, 161.0, 252.0, 391.0, 648.0, 1149.0, 2000.0, 3598.0, 7144.0, 14370.0, 29693.0, 62082.0, 128601.0, 238989.0, 264371.0, 150637.0, 73818.0, 34989.0, 17056.0, 8369.0, 4270.0, 2358.0, 1297.0, 754.0, 400.0, 306.0, 173.0, 117.0, 63.0, 61.0, 32.0, 28.0, 20.0, 16.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.1134796142578125, -0.109832763671875, -0.1061859130859375, -0.1025390625, -0.0988922119140625, -0.095245361328125, -0.0915985107421875, -0.08795166015625, -0.0843048095703125, -0.080657958984375, -0.0770111083984375, -0.0733642578125, -0.0697174072265625, -0.066070556640625, -0.0624237060546875, -0.05877685546875, -0.0551300048828125, -0.051483154296875, -0.0478363037109375, -0.044189453125, -0.0405426025390625, -0.036895751953125, -0.0332489013671875, -0.02960205078125, -0.0259552001953125, -0.022308349609375, -0.0186614990234375, -0.0150146484375, -0.0113677978515625, -0.007720947265625, -0.0040740966796875, -0.00042724609375, 0.0032196044921875, 0.006866455078125, 0.0105133056640625, 0.01416015625, 0.0178070068359375, 0.021453857421875, 0.0251007080078125, 0.02874755859375, 0.0323944091796875, 0.036041259765625, 0.0396881103515625, 0.0433349609375, 0.0469818115234375, 0.050628662109375, 0.0542755126953125, 0.05792236328125, 0.0615692138671875, 0.065216064453125, 0.0688629150390625, 0.072509765625, 0.0761566162109375, 0.079803466796875, 0.0834503173828125, 0.08709716796875, 0.0907440185546875, 0.094390869140625, 0.0980377197265625, 0.1016845703125, 0.1053314208984375, 0.108978271484375, 0.1126251220703125, 0.11627197265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 10.0, 12.0, 22.0, 15.0, 25.0, 30.0, 33.0, 17.0, 35.0, 39.0, 38.0, 42.0, 34.0, 57.0, 56.0, 61.0, 46.0, 47.0, 36.0, 51.0, 49.0, 37.0, 26.0, 29.0, 20.0, 22.0, 17.0, 16.0, 13.0, 6.0, 4.0, 9.0, 9.0, 2.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.039642333984375, -0.03841400146484375, -0.0371856689453125, -0.03595733642578125, -0.03472900390625, -0.03350067138671875, -0.0322723388671875, -0.03104400634765625, -0.029815673828125, -0.02858734130859375, -0.0273590087890625, -0.02613067626953125, -0.02490234375, -0.02367401123046875, -0.0224456787109375, -0.02121734619140625, -0.019989013671875, -0.01876068115234375, -0.0175323486328125, -0.01630401611328125, -0.01507568359375, -0.01384735107421875, -0.0126190185546875, -0.01139068603515625, -0.010162353515625, -0.00893402099609375, -0.0077056884765625, -0.00647735595703125, -0.0052490234375, -0.00402069091796875, -0.0027923583984375, -0.00156402587890625, -0.000335693359375, 0.00089263916015625, 0.0021209716796875, 0.00334930419921875, 0.00457763671875, 0.00580596923828125, 0.0070343017578125, 0.00826263427734375, 0.009490966796875, 0.01071929931640625, 0.0119476318359375, 0.01317596435546875, 0.014404296875, 0.01563262939453125, 0.0168609619140625, 0.01808929443359375, 0.019317626953125, 0.02054595947265625, 0.0217742919921875, 0.02300262451171875, 0.02423095703125, 0.02545928955078125, 0.0266876220703125, 0.02791595458984375, 0.029144287109375, 0.03037261962890625, 0.0316009521484375, 0.03282928466796875, 0.0340576171875, 0.03528594970703125, 0.0365142822265625, 0.03774261474609375, 0.038970947265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 4.0, 14.0, 24.0, 22.0, 34.0, 56.0, 72.0, 104.0, 170.0, 277.0, 419.0, 765.0, 1574.0, 3891.0, 12977.0, 57765.0, 265084.0, 500270.0, 157681.0, 33618.0, 8211.0, 2725.0, 1133.0, 576.0, 370.0, 228.0, 180.0, 108.0, 57.0, 49.0, 22.0, 17.0, 14.0, 9.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21794700622558594, -0.21140670776367188, -0.2048664093017578, -0.19832611083984375, -0.1917858123779297, -0.18524551391601562, -0.17870521545410156, -0.1721649169921875, -0.16562461853027344, -0.15908432006835938, -0.1525440216064453, -0.14600372314453125, -0.1394634246826172, -0.13292312622070312, -0.12638282775878906, -0.119842529296875, -0.11330223083496094, -0.10676193237304688, -0.10022163391113281, -0.09368133544921875, -0.08714103698730469, -0.08060073852539062, -0.07406044006347656, -0.0675201416015625, -0.06097984313964844, -0.054439544677734375, -0.04789924621582031, -0.04135894775390625, -0.03481864929199219, -0.028278350830078125, -0.021738052368164062, -0.01519775390625, -0.008657455444335938, -0.002117156982421875, 0.0044231414794921875, 0.01096343994140625, 0.017503738403320312, 0.024044036865234375, 0.030584335327148438, 0.0371246337890625, 0.04366493225097656, 0.050205230712890625, 0.05674552917480469, 0.06328582763671875, 0.06982612609863281, 0.07636642456054688, 0.08290672302246094, 0.089447021484375, 0.09598731994628906, 0.10252761840820312, 0.10906791687011719, 0.11560821533203125, 0.12214851379394531, 0.12868881225585938, 0.13522911071777344, 0.1417694091796875, 0.14830970764160156, 0.15485000610351562, 0.1613903045654297, 0.16793060302734375, 0.1744709014892578, 0.18101119995117188, 0.18755149841308594, 0.194091796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 7.0, 14.0, 12.0, 13.0, 17.0, 14.0, 26.0, 20.0, 24.0, 35.0, 46.0, 45.0, 48.0, 53.0, 51.0, 49.0, 48.0, 46.0, 47.0, 45.0, 48.0, 30.0, 36.0, 37.0, 31.0, 26.0, 22.0, 17.0, 18.0, 13.0, 12.0, 3.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.205810546875, -0.2001323699951172, -0.19445419311523438, -0.18877601623535156, -0.18309783935546875, -0.17741966247558594, -0.17174148559570312, -0.1660633087158203, -0.1603851318359375, -0.1547069549560547, -0.14902877807617188, -0.14335060119628906, -0.13767242431640625, -0.13199424743652344, -0.12631607055664062, -0.12063789367675781, -0.114959716796875, -0.10928153991699219, -0.10360336303710938, -0.09792518615722656, -0.09224700927734375, -0.08656883239746094, -0.08089065551757812, -0.07521247863769531, -0.0695343017578125, -0.06385612487792969, -0.058177947998046875, -0.05249977111816406, -0.04682159423828125, -0.04114341735839844, -0.035465240478515625, -0.029787063598632812, -0.02410888671875, -0.018430709838867188, -0.012752532958984375, -0.0070743560791015625, -0.00139617919921875, 0.0042819976806640625, 0.009960174560546875, 0.015638351440429688, 0.0213165283203125, 0.026994705200195312, 0.032672882080078125, 0.03835105895996094, 0.04402923583984375, 0.04970741271972656, 0.055385589599609375, 0.06106376647949219, 0.066741943359375, 0.07242012023925781, 0.07809829711914062, 0.08377647399902344, 0.08945465087890625, 0.09513282775878906, 0.10081100463867188, 0.10648918151855469, 0.1121673583984375, 0.11784553527832031, 0.12352371215820312, 0.12920188903808594, 0.13488006591796875, 0.14055824279785156, 0.14623641967773438, 0.1519145965576172, 0.1575927734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 13.0, 22.0, 40.0, 66.0, 170.0, 392.0, 1154.0, 4639.0, 25900.0, 235833.0, 677263.0, 87075.0, 12116.0, 2616.0, 759.0, 253.0, 103.0, 62.0, 30.0, 10.0, 13.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.17293548583984375, -0.1678924560546875, -0.16284942626953125, -0.157806396484375, -0.15276336669921875, -0.1477203369140625, -0.14267730712890625, -0.13763427734375, -0.13259124755859375, -0.1275482177734375, -0.12250518798828125, -0.117462158203125, -0.11241912841796875, -0.1073760986328125, -0.10233306884765625, -0.0972900390625, -0.09224700927734375, -0.0872039794921875, -0.08216094970703125, -0.077117919921875, -0.07207489013671875, -0.0670318603515625, -0.06198883056640625, -0.05694580078125, -0.05190277099609375, -0.0468597412109375, -0.04181671142578125, -0.036773681640625, -0.03173065185546875, -0.0266876220703125, -0.02164459228515625, -0.0166015625, -0.01155853271484375, -0.0065155029296875, -0.00147247314453125, 0.003570556640625, 0.00861358642578125, 0.0136566162109375, 0.01869964599609375, 0.02374267578125, 0.02878570556640625, 0.0338287353515625, 0.03887176513671875, 0.043914794921875, 0.04895782470703125, 0.0540008544921875, 0.05904388427734375, 0.0640869140625, 0.06912994384765625, 0.0741729736328125, 0.07921600341796875, 0.084259033203125, 0.08930206298828125, 0.0943450927734375, 0.09938812255859375, 0.10443115234375, 0.10947418212890625, 0.1145172119140625, 0.11956024169921875, 0.124603271484375, 0.12964630126953125, 0.1346893310546875, 0.13973236083984375, 0.144775390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 5.0, 13.0, 10.0, 24.0, 26.0, 42.0, 50.0, 58.0, 79.0, 112.0, 116.0, 100.0, 74.0, 67.0, 49.0, 37.0, 29.0, 21.0, 21.0, 13.0, 13.0, 9.0, 7.0, 3.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010138750076293945, -9.847059845924377e-05, -9.55536961555481e-05, -9.263679385185242e-05, -8.971989154815674e-05, -8.680298924446106e-05, -8.388608694076538e-05, -8.09691846370697e-05, -7.805228233337402e-05, -7.513538002967834e-05, -7.221847772598267e-05, -6.930157542228699e-05, -6.638467311859131e-05, -6.346777081489563e-05, -6.055086851119995e-05, -5.763396620750427e-05, -5.4717063903808594e-05, -5.1800161600112915e-05, -4.8883259296417236e-05, -4.596635699272156e-05, -4.304945468902588e-05, -4.01325523853302e-05, -3.721565008163452e-05, -3.429874777793884e-05, -3.1381845474243164e-05, -2.8464943170547485e-05, -2.5548040866851807e-05, -2.2631138563156128e-05, -1.971423625946045e-05, -1.679733395576477e-05, -1.3880431652069092e-05, -1.0963529348373413e-05, -8.046627044677734e-06, -5.129724740982056e-06, -2.212822437286377e-06, 7.040798664093018e-07, 3.6209821701049805e-06, 6.537884473800659e-06, 9.454786777496338e-06, 1.2371689081192017e-05, 1.5288591384887695e-05, 1.8205493688583374e-05, 2.1122395992279053e-05, 2.403929829597473e-05, 2.695620059967041e-05, 2.987310290336609e-05, 3.279000520706177e-05, 3.5706907510757446e-05, 3.8623809814453125e-05, 4.1540712118148804e-05, 4.445761442184448e-05, 4.737451672554016e-05, 5.029141902923584e-05, 5.320832133293152e-05, 5.61252236366272e-05, 5.9042125940322876e-05, 6.195902824401855e-05, 6.487593054771423e-05, 6.779283285140991e-05, 7.070973515510559e-05, 7.362663745880127e-05, 7.654353976249695e-05, 7.946044206619263e-05, 8.23773443698883e-05, 8.529424667358398e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 14.0, 17.0, 28.0, 47.0, 86.0, 135.0, 253.0, 534.0, 1172.0, 3112.0, 11662.0, 77383.0, 665004.0, 253441.0, 26704.0, 5609.0, 1817.0, 734.0, 351.0, 171.0, 99.0, 72.0, 27.0, 16.0, 10.0, 14.0, 11.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.1642284393310547, -0.15963363647460938, -0.15503883361816406, -0.15044403076171875, -0.14584922790527344, -0.14125442504882812, -0.1366596221923828, -0.1320648193359375, -0.1274700164794922, -0.12287521362304688, -0.11828041076660156, -0.11368560791015625, -0.10909080505371094, -0.10449600219726562, -0.09990119934082031, -0.095306396484375, -0.09071159362792969, -0.08611679077148438, -0.08152198791503906, -0.07692718505859375, -0.07233238220214844, -0.06773757934570312, -0.06314277648925781, -0.0585479736328125, -0.05395317077636719, -0.049358367919921875, -0.04476356506347656, -0.04016876220703125, -0.03557395935058594, -0.030979156494140625, -0.026384353637695312, -0.02178955078125, -0.017194747924804688, -0.012599945068359375, -0.008005142211914062, -0.00341033935546875, 0.0011844635009765625, 0.005779266357421875, 0.010374069213867188, 0.0149688720703125, 0.019563674926757812, 0.024158477783203125, 0.028753280639648438, 0.03334808349609375, 0.03794288635253906, 0.042537689208984375, 0.04713249206542969, 0.051727294921875, 0.05632209777832031, 0.060916900634765625, 0.06551170349121094, 0.07010650634765625, 0.07470130920410156, 0.07929611206054688, 0.08389091491699219, 0.0884857177734375, 0.09308052062988281, 0.09767532348632812, 0.10227012634277344, 0.10686492919921875, 0.11145973205566406, 0.11605453491210938, 0.12064933776855469, 0.125244140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 14.0, 22.0, 29.0, 39.0, 55.0, 78.0, 104.0, 116.0, 135.0, 105.0, 89.0, 71.0, 33.0, 34.0, 14.0, 12.0, 13.0, 6.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07080078125, -0.0678701400756836, -0.06493949890136719, -0.06200885772705078, -0.059078216552734375, -0.05614757537841797, -0.05321693420410156, -0.050286293029785156, -0.04735565185546875, -0.044425010681152344, -0.04149436950683594, -0.03856372833251953, -0.035633087158203125, -0.03270244598388672, -0.029771804809570312, -0.026841163635253906, -0.0239105224609375, -0.020979881286621094, -0.018049240112304688, -0.015118598937988281, -0.012187957763671875, -0.009257316589355469, -0.0063266754150390625, -0.0033960342407226562, -0.00046539306640625, 0.0024652481079101562, 0.0053958892822265625, 0.008326530456542969, 0.011257171630859375, 0.014187812805175781, 0.017118453979492188, 0.020049095153808594, 0.022979736328125, 0.025910377502441406, 0.028841018676757812, 0.03177165985107422, 0.034702301025390625, 0.03763294219970703, 0.04056358337402344, 0.043494224548339844, 0.04642486572265625, 0.049355506896972656, 0.05228614807128906, 0.05521678924560547, 0.058147430419921875, 0.06107807159423828, 0.06400871276855469, 0.0669393539428711, 0.0698699951171875, 0.0728006362915039, 0.07573127746582031, 0.07866191864013672, 0.08159255981445312, 0.08452320098876953, 0.08745384216308594, 0.09038448333740234, 0.09331512451171875, 0.09624576568603516, 0.09917640686035156, 0.10210704803466797, 0.10503768920898438, 0.10796833038330078, 0.11089897155761719, 0.1138296127319336, 0.11676025390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 18.0, 61.0, 169.0, 280.0, 248.0, 149.0, 56.0, 21.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5243494510650635, -1.4398808479309082, -1.3554123640060425, -1.2709437608718872, -1.1864752769470215, -1.1020066738128662, -1.017538070678711, -0.9330695271492004, -0.8486009836196899, -0.7641324400901794, -0.679663896560669, -0.5951952934265137, -0.5107267498970032, -0.4262582063674927, -0.3417896032333374, -0.2573210597038269, -0.1728525161743164, -0.08838395774364471, -0.0039153993129730225, 0.08055317401885986, 0.16502171754837036, 0.24949026107788086, 0.33395886421203613, 0.41842740774154663, 0.5028959512710571, 0.5873644948005676, 0.6718330383300781, 0.7563016414642334, 0.8407701849937439, 0.9252387285232544, 1.0097073316574097, 1.0941758155822754, 1.1786446571350098, 1.263113260269165, 1.3475817441940308, 1.432050347328186, 1.5165188312530518, 1.600987434387207, 1.6854560375213623, 1.7699246406555176, 1.8543931245803833, 1.9388617277145386, 2.0233302116394043, 2.1077988147735596, 2.192267417907715, 2.276735782623291, 2.3612046241760254, 2.4456729888916016, 2.530141592025757, 2.614610195159912, 2.6990787982940674, 2.7835474014282227, 2.868015766143799, 2.952484369277954, 3.0369529724121094, 3.1214215755462646, 3.20589017868042, 3.290358781814575, 3.3748273849487305, 3.4592957496643066, 3.543764352798462, 3.628232955932617, 3.7127015590667725, 3.7971701622009277, 3.881638526916504]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 15.0, 12.0, 11.0, 18.0, 22.0, 40.0, 24.0, 43.0, 50.0, 44.0, 47.0, 59.0, 61.0, 57.0, 55.0, 55.0, 48.0, 77.0, 41.0, 45.0, 37.0, 26.0, 20.0, 17.0, 18.0, 13.0, 10.0, 4.0, 10.0, 5.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9450921416282654, -0.9084863066673279, -0.8718804717063904, -0.8352746367454529, -0.7986688017845154, -0.7620629668235779, -0.7254571318626404, -0.6888512969017029, -0.6522454619407654, -0.6156396269798279, -0.5790337920188904, -0.5424279570579529, -0.5058221220970154, -0.4692162871360779, -0.4326104521751404, -0.3960046172142029, -0.3593987822532654, -0.3227929472923279, -0.2861871123313904, -0.24958127737045288, -0.21297544240951538, -0.17636960744857788, -0.13976377248764038, -0.10315793752670288, -0.06655210256576538, -0.02994626760482788, 0.006659567356109619, 0.04326540231704712, 0.07987123727798462, 0.11647707223892212, 0.15308290719985962, 0.18968874216079712, 0.22629451751708984, 0.26290035247802734, 0.29950618743896484, 0.33611202239990234, 0.37271785736083984, 0.40932369232177734, 0.44592952728271484, 0.48253536224365234, 0.5191411972045898, 0.5557470321655273, 0.5923528671264648, 0.6289587020874023, 0.6655645370483398, 0.7021703720092773, 0.7387762069702148, 0.7753820419311523, 0.8119878768920898, 0.8485937118530273, 0.8851995468139648, 0.9218053817749023, 0.9584112167358398, 0.9950170516967773, 1.0316228866577148, 1.0682287216186523, 1.1048345565795898, 1.1414403915405273, 1.1780462265014648, 1.2146520614624023, 1.2512578964233398, 1.2878637313842773, 1.3244695663452148, 1.3610754013061523, 1.3976812362670898]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 9.0, 9.0, 12.0, 13.0, 26.0, 29.0, 46.0, 78.0, 116.0, 209.0, 358.0, 630.0, 1102.0, 2377.0, 5396.0, 13851.0, 44381.0, 215730.0, 3271553.0, 525277.0, 77076.0, 21591.0, 7751.0, 3204.0, 1499.0, 807.0, 473.0, 225.0, 156.0, 106.0, 63.0, 39.0, 25.0, 19.0, 20.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17623138427734375, -0.1700897216796875, -0.16394805908203125, -0.157806396484375, -0.15166473388671875, -0.1455230712890625, -0.13938140869140625, -0.13323974609375, -0.12709808349609375, -0.1209564208984375, -0.11481475830078125, -0.108673095703125, -0.10253143310546875, -0.0963897705078125, -0.09024810791015625, -0.0841064453125, -0.07796478271484375, -0.0718231201171875, -0.06568145751953125, -0.059539794921875, -0.05339813232421875, -0.0472564697265625, -0.04111480712890625, -0.03497314453125, -0.02883148193359375, -0.0226898193359375, -0.01654815673828125, -0.010406494140625, -0.00426483154296875, 0.0018768310546875, 0.00801849365234375, 0.01416015625, 0.02030181884765625, 0.0264434814453125, 0.03258514404296875, 0.038726806640625, 0.04486846923828125, 0.0510101318359375, 0.05715179443359375, 0.06329345703125, 0.06943511962890625, 0.0755767822265625, 0.08171844482421875, 0.087860107421875, 0.09400177001953125, 0.1001434326171875, 0.10628509521484375, 0.1124267578125, 0.11856842041015625, 0.1247100830078125, 0.13085174560546875, 0.136993408203125, 0.14313507080078125, 0.1492767333984375, 0.15541839599609375, 0.16156005859375, 0.16770172119140625, 0.1738433837890625, 0.17998504638671875, 0.186126708984375, 0.19226837158203125, 0.1984100341796875, 0.20455169677734375, 0.210693359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 11.0, 16.0, 15.0, 20.0, 26.0, 35.0, 35.0, 38.0, 56.0, 53.0, 64.0, 51.0, 68.0, 61.0, 54.0, 51.0, 63.0, 48.0, 41.0, 33.0, 26.0, 18.0, 22.0, 18.0, 11.0, 11.0, 7.0, 11.0, 3.0, 3.0, 7.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04840087890625, -0.046933650970458984, -0.04546642303466797, -0.04399919509887695, -0.04253196716308594, -0.04106473922729492, -0.039597511291503906, -0.03813028335571289, -0.036663055419921875, -0.03519582748413086, -0.033728599548339844, -0.03226137161254883, -0.030794143676757812, -0.029326915740966797, -0.02785968780517578, -0.026392459869384766, -0.02492523193359375, -0.023458003997802734, -0.02199077606201172, -0.020523548126220703, -0.019056320190429688, -0.017589092254638672, -0.016121864318847656, -0.01465463638305664, -0.013187408447265625, -0.01172018051147461, -0.010252952575683594, -0.008785724639892578, -0.0073184967041015625, -0.005851268768310547, -0.004384040832519531, -0.0029168128967285156, -0.0014495849609375, 1.7642974853515625e-05, 0.0014848709106445312, 0.002952098846435547, 0.0044193267822265625, 0.005886554718017578, 0.007353782653808594, 0.00882101058959961, 0.010288238525390625, 0.01175546646118164, 0.013222694396972656, 0.014689922332763672, 0.016157150268554688, 0.017624378204345703, 0.01909160614013672, 0.020558834075927734, 0.02202606201171875, 0.023493289947509766, 0.02496051788330078, 0.026427745819091797, 0.027894973754882812, 0.029362201690673828, 0.030829429626464844, 0.03229665756225586, 0.033763885498046875, 0.03523111343383789, 0.036698341369628906, 0.03816556930541992, 0.03963279724121094, 0.04110002517700195, 0.04256725311279297, 0.044034481048583984, 0.045501708984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 8.0, 7.0, 8.0, 11.0, 10.0, 19.0, 34.0, 38.0, 81.0, 104.0, 165.0, 281.0, 465.0, 896.0, 1812.0, 4070.0, 10089.0, 28945.0, 103492.0, 592138.0, 2941353.0, 394411.0, 78149.0, 22788.0, 8160.0, 3394.0, 1519.0, 779.0, 391.0, 256.0, 159.0, 79.0, 55.0, 39.0, 21.0, 22.0, 12.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.176513671875, -0.17152786254882812, -0.16654205322265625, -0.16155624389648438, -0.1565704345703125, -0.15158462524414062, -0.14659881591796875, -0.14161300659179688, -0.136627197265625, -0.13164138793945312, -0.12665557861328125, -0.12166976928710938, -0.1166839599609375, -0.11169815063476562, -0.10671234130859375, -0.10172653198242188, -0.09674072265625, -0.09175491333007812, -0.08676910400390625, -0.08178329467773438, -0.0767974853515625, -0.07181167602539062, -0.06682586669921875, -0.061840057373046875, -0.056854248046875, -0.051868438720703125, -0.04688262939453125, -0.041896820068359375, -0.0369110107421875, -0.031925201416015625, -0.02693939208984375, -0.021953582763671875, -0.0169677734375, -0.011981964111328125, -0.00699615478515625, -0.002010345458984375, 0.0029754638671875, 0.007961273193359375, 0.01294708251953125, 0.017932891845703125, 0.022918701171875, 0.027904510498046875, 0.03289031982421875, 0.037876129150390625, 0.0428619384765625, 0.047847747802734375, 0.05283355712890625, 0.057819366455078125, 0.06280517578125, 0.06779098510742188, 0.07277679443359375, 0.07776260375976562, 0.0827484130859375, 0.08773422241210938, 0.09272003173828125, 0.09770584106445312, 0.102691650390625, 0.10767745971679688, 0.11266326904296875, 0.11764907836914062, 0.1226348876953125, 0.12762069702148438, 0.13260650634765625, 0.13759231567382812, 0.142578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 12.0, 8.0, 6.0, 13.0, 19.0, 23.0, 27.0, 48.0, 62.0, 79.0, 164.0, 188.0, 350.0, 582.0, 994.0, 567.0, 282.0, 207.0, 117.0, 81.0, 69.0, 36.0, 38.0, 24.0, 14.0, 12.0, 4.0, 7.0, 5.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0775146484375, -0.07538890838623047, -0.07326316833496094, -0.0711374282836914, -0.06901168823242188, -0.06688594818115234, -0.06476020812988281, -0.06263446807861328, -0.06050872802734375, -0.05838298797607422, -0.05625724792480469, -0.054131507873535156, -0.052005767822265625, -0.049880027770996094, -0.04775428771972656, -0.04562854766845703, -0.0435028076171875, -0.04137706756591797, -0.03925132751464844, -0.037125587463378906, -0.034999847412109375, -0.032874107360839844, -0.030748367309570312, -0.02862262725830078, -0.02649688720703125, -0.02437114715576172, -0.022245407104492188, -0.020119667053222656, -0.017993927001953125, -0.015868186950683594, -0.013742446899414062, -0.011616706848144531, -0.009490966796875, -0.007365226745605469, -0.0052394866943359375, -0.0031137466430664062, -0.000988006591796875, 0.0011377334594726562, 0.0032634735107421875, 0.005389213562011719, 0.00751495361328125, 0.009640693664550781, 0.011766433715820312, 0.013892173767089844, 0.016017913818359375, 0.018143653869628906, 0.020269393920898438, 0.02239513397216797, 0.0245208740234375, 0.02664661407470703, 0.028772354125976562, 0.030898094177246094, 0.033023834228515625, 0.035149574279785156, 0.03727531433105469, 0.03940105438232422, 0.04152679443359375, 0.04365253448486328, 0.04577827453613281, 0.047904014587402344, 0.050029754638671875, 0.052155494689941406, 0.05428123474121094, 0.05640697479248047, 0.05853271484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 10.0, 25.0, 48.0, 114.0, 170.0, 232.0, 213.0, 102.0, 40.0, 24.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2824467420578003, -1.2523645162582397, -1.2222822904586792, -1.192199945449829, -1.1621177196502686, -1.132035493850708, -1.1019532680511475, -1.071871042251587, -1.0417888164520264, -1.0117065906524658, -0.9816243052482605, -0.9515420794487, -0.9214598536491394, -0.8913775682449341, -0.8612953424453735, -0.831213116645813, -0.8011308312416077, -0.7710486054420471, -0.7409663200378418, -0.7108840942382812, -0.6808018684387207, -0.6507196426391602, -0.6206373572349548, -0.5905551314353943, -0.560472846031189, -0.5303906202316284, -0.5003083348274231, -0.47022610902786255, -0.440143883228302, -0.41006162762641907, -0.37997937202453613, -0.3498971462249756, -0.3198149800300598, -0.2897327244281769, -0.25965049862861633, -0.2295682430267334, -0.19948600232601166, -0.16940376162528992, -0.13932150602340698, -0.10923926532268524, -0.0791570246219635, -0.04907478019595146, -0.018992535769939423, 0.011089712381362915, 0.041171953082084656, 0.0712541937828064, 0.10133644938468933, 0.13141869008541107, 0.1615009307861328, 0.19158317148685455, 0.2216654121875763, 0.25174766778945923, 0.2818298935890198, 0.3119121491909027, 0.34199440479278564, 0.3720766305923462, 0.4021588861942291, 0.43224114179611206, 0.4623233675956726, 0.49240562319755554, 0.5224878787994385, 0.552570104598999, 0.5826523303985596, 0.6127346158027649, 0.6428168416023254]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 6.0, 14.0, 9.0, 15.0, 15.0, 26.0, 20.0, 28.0, 19.0, 22.0, 36.0, 27.0, 46.0, 64.0, 47.0, 48.0, 40.0, 38.0, 36.0, 48.0, 45.0, 36.0, 42.0, 34.0, 42.0, 25.0, 25.0, 27.0, 18.0, 11.0, 19.0, 15.0, 8.0, 9.0, 11.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0], "bins": [-0.3536110520362854, -0.3444724678993225, -0.335333913564682, -0.3261953294277191, -0.3170567750930786, -0.3079181909561157, -0.29877960681915283, -0.28964105248451233, -0.28050246834754944, -0.27136388421058655, -0.26222532987594604, -0.25308674573898315, -0.24394817650318146, -0.23480960726737976, -0.22567103803157806, -0.21653246879577637, -0.20739389955997467, -0.19825533032417297, -0.18911676108837128, -0.17997819185256958, -0.1708396077156067, -0.161701038479805, -0.1525624692440033, -0.1434238851070404, -0.1342853307723999, -0.1251467615365982, -0.11600818485021591, -0.10686961561441422, -0.09773103892803192, -0.08859246969223022, -0.07945390045642853, -0.07031532377004623, -0.06117674708366394, -0.052038174122571945, -0.04289960116147995, -0.03376103192567825, -0.024622458964586258, -0.015483886003494263, -0.006345316767692566, 0.002793259918689728, 0.011931829154491425, 0.02107040211558342, 0.030208973214030266, 0.03934754431247711, 0.04848611727356911, 0.0576246902346611, 0.0667632594704628, 0.07590183615684509, 0.08504040539264679, 0.09417897462844849, 0.10331755131483078, 0.11245612055063248, 0.12159469723701477, 0.13073326647281647, 0.13987183570861816, 0.14901041984558105, 0.15814897418022156, 0.16728754341602325, 0.17642611265182495, 0.18556469678878784, 0.19470326602458954, 0.20384183526039124, 0.21298040449619293, 0.22211897373199463, 0.23125755786895752]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 13.0, 11.0, 18.0, 30.0, 37.0, 50.0, 104.0, 162.0, 352.0, 843.0, 2166.0, 7028.0, 26534.0, 120935.0, 547813.0, 269499.0, 53723.0, 13046.0, 3758.0, 1353.0, 502.0, 245.0, 112.0, 68.0, 57.0, 26.0, 24.0, 18.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2823638916015625, -0.273468017578125, -0.2645721435546875, -0.25567626953125, -0.2467803955078125, -0.237884521484375, -0.2289886474609375, -0.2200927734375, -0.2111968994140625, -0.202301025390625, -0.1934051513671875, -0.18450927734375, -0.1756134033203125, -0.166717529296875, -0.1578216552734375, -0.14892578125, -0.1400299072265625, -0.131134033203125, -0.1222381591796875, -0.11334228515625, -0.1044464111328125, -0.095550537109375, -0.0866546630859375, -0.0777587890625, -0.0688629150390625, -0.059967041015625, -0.0510711669921875, -0.04217529296875, -0.0332794189453125, -0.024383544921875, -0.0154876708984375, -0.006591796875, 0.0023040771484375, 0.011199951171875, 0.0200958251953125, 0.02899169921875, 0.0378875732421875, 0.046783447265625, 0.0556793212890625, 0.0645751953125, 0.0734710693359375, 0.082366943359375, 0.0912628173828125, 0.10015869140625, 0.1090545654296875, 0.117950439453125, 0.1268463134765625, 0.1357421875, 0.1446380615234375, 0.153533935546875, 0.1624298095703125, 0.17132568359375, 0.1802215576171875, 0.189117431640625, 0.1980133056640625, 0.2069091796875, 0.2158050537109375, 0.224700927734375, 0.2335968017578125, 0.24249267578125, 0.2513885498046875, 0.260284423828125, 0.2691802978515625, 0.278076171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 9.0, 6.0, 5.0, 11.0, 15.0, 22.0, 14.0, 27.0, 38.0, 35.0, 47.0, 55.0, 55.0, 48.0, 62.0, 52.0, 55.0, 59.0, 59.0, 56.0, 52.0, 36.0, 30.0, 37.0, 21.0, 21.0, 14.0, 10.0, 10.0, 6.0, 7.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.050018310546875, -0.04862022399902344, -0.047222137451171875, -0.04582405090332031, -0.04442596435546875, -0.04302787780761719, -0.041629791259765625, -0.04023170471191406, -0.0388336181640625, -0.03743553161621094, -0.036037445068359375, -0.03463935852050781, -0.03324127197265625, -0.03184318542480469, -0.030445098876953125, -0.029047012329101562, -0.02764892578125, -0.026250839233398438, -0.024852752685546875, -0.023454666137695312, -0.02205657958984375, -0.020658493041992188, -0.019260406494140625, -0.017862319946289062, -0.0164642333984375, -0.015066146850585938, -0.013668060302734375, -0.012269973754882812, -0.01087188720703125, -0.009473800659179688, -0.008075714111328125, -0.0066776275634765625, -0.005279541015625, -0.0038814544677734375, -0.002483367919921875, -0.0010852813720703125, 0.00031280517578125, 0.0017108917236328125, 0.003108978271484375, 0.0045070648193359375, 0.0059051513671875, 0.0073032379150390625, 0.008701324462890625, 0.010099411010742188, 0.01149749755859375, 0.012895584106445312, 0.014293670654296875, 0.015691757202148438, 0.01708984375, 0.018487930297851562, 0.019886016845703125, 0.021284103393554688, 0.02268218994140625, 0.024080276489257812, 0.025478363037109375, 0.026876449584960938, 0.0282745361328125, 0.029672622680664062, 0.031070709228515625, 0.03246879577636719, 0.03386688232421875, 0.03526496887207031, 0.036663055419921875, 0.03806114196777344, 0.039459228515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 10.0, 19.0, 16.0, 32.0, 44.0, 54.0, 90.0, 110.0, 136.0, 205.0, 349.0, 502.0, 832.0, 1426.0, 2572.0, 5054.0, 10922.0, 26211.0, 68829.0, 178729.0, 367701.0, 232196.0, 90076.0, 34404.0, 14123.0, 6261.0, 3135.0, 1709.0, 1003.0, 616.0, 342.0, 261.0, 169.0, 133.0, 83.0, 45.0, 37.0, 34.0, 24.0, 14.0, 14.0, 16.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134521484375, -0.13027000427246094, -0.12601852416992188, -0.12176704406738281, -0.11751556396484375, -0.11326408386230469, -0.10901260375976562, -0.10476112365722656, -0.1005096435546875, -0.09625816345214844, -0.09200668334960938, -0.08775520324707031, -0.08350372314453125, -0.07925224304199219, -0.07500076293945312, -0.07074928283691406, -0.066497802734375, -0.06224632263183594, -0.057994842529296875, -0.05374336242675781, -0.04949188232421875, -0.04524040222167969, -0.040988922119140625, -0.03673744201660156, -0.0324859619140625, -0.028234481811523438, -0.023983001708984375, -0.019731521606445312, -0.01548004150390625, -0.011228561401367188, -0.006977081298828125, -0.0027256011962890625, 0.00152587890625, 0.0057773590087890625, 0.010028839111328125, 0.014280319213867188, 0.01853179931640625, 0.022783279418945312, 0.027034759521484375, 0.03128623962402344, 0.0355377197265625, 0.03978919982910156, 0.044040679931640625, 0.04829216003417969, 0.05254364013671875, 0.05679512023925781, 0.061046600341796875, 0.06529808044433594, 0.069549560546875, 0.07380104064941406, 0.07805252075195312, 0.08230400085449219, 0.08655548095703125, 0.09080696105957031, 0.09505844116210938, 0.09930992126464844, 0.1035614013671875, 0.10781288146972656, 0.11206436157226562, 0.11631584167480469, 0.12056732177734375, 0.12481880187988281, 0.12907028198242188, 0.13332176208496094, 0.1375732421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 11.0, 7.0, 8.0, 13.0, 16.0, 8.0, 13.0, 19.0, 22.0, 22.0, 28.0, 29.0, 29.0, 33.0, 31.0, 47.0, 42.0, 34.0, 52.0, 40.0, 41.0, 42.0, 49.0, 38.0, 36.0, 33.0, 24.0, 34.0, 25.0, 26.0, 20.0, 26.0, 20.0, 19.0, 11.0, 12.0, 8.0, 12.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16650390625, -0.161102294921875, -0.15570068359375, -0.150299072265625, -0.1448974609375, -0.139495849609375, -0.13409423828125, -0.128692626953125, -0.123291015625, -0.117889404296875, -0.11248779296875, -0.107086181640625, -0.1016845703125, -0.096282958984375, -0.09088134765625, -0.085479736328125, -0.080078125, -0.074676513671875, -0.06927490234375, -0.063873291015625, -0.0584716796875, -0.053070068359375, -0.04766845703125, -0.042266845703125, -0.036865234375, -0.031463623046875, -0.02606201171875, -0.020660400390625, -0.0152587890625, -0.009857177734375, -0.00445556640625, 0.000946044921875, 0.00634765625, 0.011749267578125, 0.01715087890625, 0.022552490234375, 0.0279541015625, 0.033355712890625, 0.03875732421875, 0.044158935546875, 0.049560546875, 0.054962158203125, 0.06036376953125, 0.065765380859375, 0.0711669921875, 0.076568603515625, 0.08197021484375, 0.087371826171875, 0.0927734375, 0.098175048828125, 0.10357666015625, 0.108978271484375, 0.1143798828125, 0.119781494140625, 0.12518310546875, 0.130584716796875, 0.135986328125, 0.141387939453125, 0.14678955078125, 0.152191162109375, 0.1575927734375, 0.162994384765625, 0.16839599609375, 0.173797607421875, 0.17919921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 8.0, 7.0, 14.0, 23.0, 41.0, 80.0, 127.0, 226.0, 443.0, 1071.0, 3181.0, 12749.0, 71930.0, 585644.0, 321192.0, 40240.0, 7942.0, 2052.0, 777.0, 362.0, 172.0, 104.0, 52.0, 41.0, 24.0, 12.0, 12.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.189453125, -0.1838550567626953, -0.17825698852539062, -0.17265892028808594, -0.16706085205078125, -0.16146278381347656, -0.15586471557617188, -0.1502666473388672, -0.1446685791015625, -0.1390705108642578, -0.13347244262695312, -0.12787437438964844, -0.12227630615234375, -0.11667823791503906, -0.11108016967773438, -0.10548210144042969, -0.099884033203125, -0.09428596496582031, -0.08868789672851562, -0.08308982849121094, -0.07749176025390625, -0.07189369201660156, -0.06629562377929688, -0.06069755554199219, -0.0550994873046875, -0.04950141906738281, -0.043903350830078125, -0.03830528259277344, -0.03270721435546875, -0.027109146118164062, -0.021511077880859375, -0.015913009643554688, -0.01031494140625, -0.0047168731689453125, 0.000881195068359375, 0.0064792633056640625, 0.01207733154296875, 0.017675399780273438, 0.023273468017578125, 0.028871536254882812, 0.0344696044921875, 0.04006767272949219, 0.045665740966796875, 0.05126380920410156, 0.05686187744140625, 0.06245994567871094, 0.06805801391601562, 0.07365608215332031, 0.079254150390625, 0.08485221862792969, 0.09045028686523438, 0.09604835510253906, 0.10164642333984375, 0.10724449157714844, 0.11284255981445312, 0.11844062805175781, 0.1240386962890625, 0.1296367645263672, 0.13523483276367188, 0.14083290100097656, 0.14643096923828125, 0.15202903747558594, 0.15762710571289062, 0.1632251739501953, 0.1688232421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 5.0, 6.0, 11.0, 11.0, 7.0, 15.0, 20.0, 31.0, 31.0, 38.0, 45.0, 47.0, 52.0, 68.0, 57.0, 72.0, 60.0, 55.0, 57.0, 59.0, 41.0, 37.0, 42.0, 15.0, 30.0, 14.0, 15.0, 17.0, 8.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.282329559326172e-05, -6.113201379776001e-05, -5.94407320022583e-05, -5.774945020675659e-05, -5.605816841125488e-05, -5.4366886615753174e-05, -5.2675604820251465e-05, -5.0984323024749756e-05, -4.929304122924805e-05, -4.760175943374634e-05, -4.591047763824463e-05, -4.421919584274292e-05, -4.252791404724121e-05, -4.08366322517395e-05, -3.914535045623779e-05, -3.7454068660736084e-05, -3.5762786865234375e-05, -3.4071505069732666e-05, -3.238022327423096e-05, -3.068894147872925e-05, -2.899765968322754e-05, -2.730637788772583e-05, -2.561509609222412e-05, -2.3923814296722412e-05, -2.2232532501220703e-05, -2.0541250705718994e-05, -1.8849968910217285e-05, -1.7158687114715576e-05, -1.5467405319213867e-05, -1.3776123523712158e-05, -1.208484172821045e-05, -1.039355993270874e-05, -8.702278137207031e-06, -7.010996341705322e-06, -5.319714546203613e-06, -3.6284327507019043e-06, -1.9371509552001953e-06, -2.4586915969848633e-07, 1.4454126358032227e-06, 3.1366944313049316e-06, 4.827976226806641e-06, 6.51925802230835e-06, 8.210539817810059e-06, 9.901821613311768e-06, 1.1593103408813477e-05, 1.3284385204315186e-05, 1.4975666999816895e-05, 1.6666948795318604e-05, 1.8358230590820312e-05, 2.004951238632202e-05, 2.174079418182373e-05, 2.343207597732544e-05, 2.512335777282715e-05, 2.6814639568328857e-05, 2.8505921363830566e-05, 3.0197203159332275e-05, 3.1888484954833984e-05, 3.357976675033569e-05, 3.52710485458374e-05, 3.696233034133911e-05, 3.865361213684082e-05, 4.034489393234253e-05, 4.203617572784424e-05, 4.372745752334595e-05, 4.5418739318847656e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 7.0, 10.0, 14.0, 24.0, 37.0, 44.0, 62.0, 110.0, 193.0, 342.0, 559.0, 1178.0, 2428.0, 5679.0, 15162.0, 48181.0, 206780.0, 542269.0, 163326.0, 39829.0, 12890.0, 4998.0, 2124.0, 1030.0, 512.0, 267.0, 157.0, 93.0, 78.0, 35.0, 34.0, 29.0, 13.0, 18.0, 8.0, 8.0, 6.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1109619140625, -0.10773849487304688, -0.10451507568359375, -0.10129165649414062, -0.0980682373046875, -0.09484481811523438, -0.09162139892578125, -0.08839797973632812, -0.085174560546875, -0.08195114135742188, -0.07872772216796875, -0.07550430297851562, -0.0722808837890625, -0.06905746459960938, -0.06583404541015625, -0.06261062622070312, -0.05938720703125, -0.056163787841796875, -0.05294036865234375, -0.049716949462890625, -0.0464935302734375, -0.043270111083984375, -0.04004669189453125, -0.036823272705078125, -0.033599853515625, -0.030376434326171875, -0.02715301513671875, -0.023929595947265625, -0.0207061767578125, -0.017482757568359375, -0.01425933837890625, -0.011035919189453125, -0.0078125, -0.004589080810546875, -0.00136566162109375, 0.001857757568359375, 0.0050811767578125, 0.008304595947265625, 0.01152801513671875, 0.014751434326171875, 0.017974853515625, 0.021198272705078125, 0.02442169189453125, 0.027645111083984375, 0.0308685302734375, 0.034091949462890625, 0.03731536865234375, 0.040538787841796875, 0.04376220703125, 0.046985626220703125, 0.05020904541015625, 0.053432464599609375, 0.0566558837890625, 0.059879302978515625, 0.06310272216796875, 0.06632614135742188, 0.069549560546875, 0.07277297973632812, 0.07599639892578125, 0.07921981811523438, 0.0824432373046875, 0.08566665649414062, 0.08889007568359375, 0.09211349487304688, 0.0953369140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 8.0, 4.0, 12.0, 13.0, 18.0, 16.0, 40.0, 45.0, 58.0, 75.0, 97.0, 84.0, 90.0, 76.0, 77.0, 65.0, 56.0, 44.0, 24.0, 29.0, 10.0, 13.0, 6.0, 8.0, 6.0, 5.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06866455078125, -0.06606769561767578, -0.06347084045410156, -0.060873985290527344, -0.058277130126953125, -0.055680274963378906, -0.05308341979980469, -0.05048656463623047, -0.04788970947265625, -0.04529285430908203, -0.04269599914550781, -0.040099143981933594, -0.037502288818359375, -0.034905433654785156, -0.03230857849121094, -0.02971172332763672, -0.0271148681640625, -0.02451801300048828, -0.021921157836914062, -0.019324302673339844, -0.016727447509765625, -0.014130592346191406, -0.011533737182617188, -0.008936882019042969, -0.00634002685546875, -0.0037431716918945312, -0.0011463165283203125, 0.0014505386352539062, 0.004047393798828125, 0.006644248962402344, 0.009241104125976562, 0.011837959289550781, 0.014434814453125, 0.01703166961669922, 0.019628524780273438, 0.022225379943847656, 0.024822235107421875, 0.027419090270996094, 0.030015945434570312, 0.03261280059814453, 0.03520965576171875, 0.03780651092529297, 0.04040336608886719, 0.043000221252441406, 0.045597076416015625, 0.048193931579589844, 0.05079078674316406, 0.05338764190673828, 0.0559844970703125, 0.05858135223388672, 0.06117820739746094, 0.06377506256103516, 0.06637191772460938, 0.0689687728881836, 0.07156562805175781, 0.07416248321533203, 0.07675933837890625, 0.07935619354248047, 0.08195304870605469, 0.0845499038696289, 0.08714675903320312, 0.08974361419677734, 0.09234046936035156, 0.09493732452392578, 0.0975341796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 14.0, 12.0, 35.0, 72.0, 108.0, 121.0, 159.0, 153.0, 122.0, 91.0, 53.0, 23.0, 18.0, 12.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7730293273925781, -1.722174048423767, -1.6713188886642456, -1.6204636096954346, -1.569608449935913, -1.518753170967102, -1.467897891998291, -1.4170427322387695, -1.366187572479248, -1.315332293510437, -1.2644771337509155, -1.2136218547821045, -1.162766695022583, -1.111911416053772, -1.061056137084961, -1.0102009773254395, -0.9593456983566284, -0.9084904789924622, -0.8576352596282959, -0.8067799806594849, -0.7559248208999634, -0.7050695419311523, -0.6542143225669861, -0.6033591032028198, -0.5525038838386536, -0.5016486644744873, -0.45079344511032104, -0.3999381959438324, -0.34908297657966614, -0.2982277572154999, -0.24737250804901123, -0.19651728868484497, -0.14566195011138916, -0.0948067232966423, -0.04395149648189545, 0.006903737783432007, 0.05775895714759827, 0.10861417651176453, 0.15946942567825317, 0.21032464504241943, 0.2611798644065857, 0.31203508377075195, 0.3628903031349182, 0.41374555230140686, 0.4646007716655731, 0.515455961227417, 0.566311240196228, 0.6171664595603943, 0.6680216789245605, 0.7188768982887268, 0.7697321176528931, 0.8205873966217041, 0.8714425563812256, 0.9222978353500366, 0.9731530547142029, 1.0240082740783691, 1.0748634338378906, 1.1257187128067017, 1.1765738725662231, 1.2274291515350342, 1.2782843112945557, 1.3291395902633667, 1.3799948692321777, 1.4308500289916992, 1.4817053079605103]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 15.0, 17.0, 27.0, 21.0, 29.0, 29.0, 37.0, 39.0, 54.0, 54.0, 67.0, 69.0, 52.0, 63.0, 59.0, 50.0, 43.0, 47.0, 32.0, 42.0, 30.0, 31.0, 20.0, 14.0, 16.0, 10.0, 4.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4824278354644775, -1.4419621229171753, -1.401496410369873, -1.3610308170318604, -1.320565104484558, -1.2800993919372559, -1.2396336793899536, -1.1991679668426514, -1.1587023735046387, -1.1182366609573364, -1.0777709484100342, -1.0373053550720215, -0.9968396425247192, -0.956373929977417, -0.9159082174301147, -0.8754425048828125, -0.8349767923355103, -0.794511079788208, -0.7540454268455505, -0.7135797142982483, -0.6731140613555908, -0.6326483488082886, -0.5921826362609863, -0.5517169237136841, -0.5112512707710266, -0.47078558802604675, -0.4303199052810669, -0.38985419273376465, -0.3493885099887848, -0.30892282724380493, -0.2684571146965027, -0.22799143195152283, -0.18752574920654297, -0.1470600664615631, -0.10659436881542206, -0.0661286786198616, -0.025662988424301147, 0.014802694320678711, 0.05526839196681976, 0.09573408961296082, 0.13619977235794067, 0.17666545510292053, 0.21713115274906158, 0.25759685039520264, 0.2980625331401825, 0.33852821588516235, 0.3789939284324646, 0.41945961117744446, 0.4599252939224243, 0.5003910064697266, 0.540856659412384, 0.5813223719596863, 0.6217880249023438, 0.662253737449646, 0.7027194499969482, 0.7431851625442505, 0.783650815486908, 0.8241165280342102, 0.8645821809768677, 0.9050478935241699, 0.9455136060714722, 0.9859792590141296, 1.026444911956787, 1.0669106245040894, 1.1073763370513916]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 2.0, 5.0, 6.0, 9.0, 16.0, 18.0, 24.0, 35.0, 34.0, 73.0, 103.0, 184.0, 237.0, 348.0, 567.0, 981.0, 1688.0, 3220.0, 6551.0, 15370.0, 44261.0, 208364.0, 3436588.0, 375649.0, 62900.0, 19890.0, 8089.0, 4010.0, 2082.0, 1159.0, 680.0, 407.0, 268.0, 160.0, 100.0, 67.0, 38.0, 39.0, 23.0, 9.0, 8.0, 9.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186767578125, -0.1810436248779297, -0.17531967163085938, -0.16959571838378906, -0.16387176513671875, -0.15814781188964844, -0.15242385864257812, -0.1466999053955078, -0.1409759521484375, -0.1352519989013672, -0.12952804565429688, -0.12380409240722656, -0.11808013916015625, -0.11235618591308594, -0.10663223266601562, -0.10090827941894531, -0.095184326171875, -0.08946037292480469, -0.08373641967773438, -0.07801246643066406, -0.07228851318359375, -0.06656455993652344, -0.060840606689453125, -0.05511665344238281, -0.0493927001953125, -0.04366874694824219, -0.037944793701171875, -0.03222084045410156, -0.02649688720703125, -0.020772933959960938, -0.015048980712890625, -0.009325027465820312, -0.00360107421875, 0.0021228790283203125, 0.007846832275390625, 0.013570785522460938, 0.01929473876953125, 0.025018692016601562, 0.030742645263671875, 0.03646659851074219, 0.0421905517578125, 0.04791450500488281, 0.053638458251953125, 0.05936241149902344, 0.06508636474609375, 0.07081031799316406, 0.07653427124023438, 0.08225822448730469, 0.087982177734375, 0.09370613098144531, 0.09943008422851562, 0.10515403747558594, 0.11087799072265625, 0.11660194396972656, 0.12232589721679688, 0.1280498504638672, 0.1337738037109375, 0.1394977569580078, 0.14522171020507812, 0.15094566345214844, 0.15666961669921875, 0.16239356994628906, 0.16811752319335938, 0.1738414764404297, 0.1795654296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 7.0, 16.0, 22.0, 26.0, 22.0, 37.0, 45.0, 31.0, 42.0, 49.0, 63.0, 49.0, 59.0, 66.0, 57.0, 58.0, 58.0, 50.0, 38.0, 37.0, 19.0, 31.0, 14.0, 22.0, 6.0, 12.0, 11.0, 3.0, 8.0, 6.0, 4.0, 6.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0498046875, -0.048293113708496094, -0.04678153991699219, -0.04526996612548828, -0.043758392333984375, -0.04224681854248047, -0.04073524475097656, -0.039223670959472656, -0.03771209716796875, -0.036200523376464844, -0.03468894958496094, -0.03317737579345703, -0.031665802001953125, -0.03015422821044922, -0.028642654418945312, -0.027131080627441406, -0.0256195068359375, -0.024107933044433594, -0.022596359252929688, -0.02108478546142578, -0.019573211669921875, -0.01806163787841797, -0.016550064086914062, -0.015038490295410156, -0.01352691650390625, -0.012015342712402344, -0.010503768920898438, -0.008992195129394531, -0.007480621337890625, -0.005969047546386719, -0.0044574737548828125, -0.0029458999633789062, -0.001434326171875, 7.724761962890625e-05, 0.0015888214111328125, 0.0031003952026367188, 0.004611968994140625, 0.006123542785644531, 0.0076351165771484375, 0.009146690368652344, 0.01065826416015625, 0.012169837951660156, 0.013681411743164062, 0.015192985534667969, 0.016704559326171875, 0.01821613311767578, 0.019727706909179688, 0.021239280700683594, 0.0227508544921875, 0.024262428283691406, 0.025774002075195312, 0.02728557586669922, 0.028797149658203125, 0.03030872344970703, 0.03182029724121094, 0.033331871032714844, 0.03484344482421875, 0.036355018615722656, 0.03786659240722656, 0.03937816619873047, 0.040889739990234375, 0.04240131378173828, 0.04391288757324219, 0.045424461364746094, 0.04693603515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 11.0, 15.0, 22.0, 27.0, 38.0, 71.0, 95.0, 115.0, 174.0, 248.0, 391.0, 621.0, 998.0, 1631.0, 2917.0, 5498.0, 11448.0, 25666.0, 68843.0, 241242.0, 2519673.0, 1058666.0, 163493.0, 51514.0, 20568.0, 9319.0, 4647.0, 2485.0, 1396.0, 851.0, 530.0, 334.0, 231.0, 155.0, 94.0, 73.0, 54.0, 23.0, 25.0, 15.0, 17.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.143798828125, -0.13942337036132812, -0.13504791259765625, -0.13067245483398438, -0.1262969970703125, -0.12192153930664062, -0.11754608154296875, -0.11317062377929688, -0.108795166015625, -0.10441970825195312, -0.10004425048828125, -0.09566879272460938, -0.0912933349609375, -0.08691787719726562, -0.08254241943359375, -0.07816696166992188, -0.07379150390625, -0.06941604614257812, -0.06504058837890625, -0.060665130615234375, -0.0562896728515625, -0.051914215087890625, -0.04753875732421875, -0.043163299560546875, -0.038787841796875, -0.034412384033203125, -0.03003692626953125, -0.025661468505859375, -0.0212860107421875, -0.016910552978515625, -0.01253509521484375, -0.008159637451171875, -0.0037841796875, 0.000591278076171875, 0.00496673583984375, 0.009342193603515625, 0.0137176513671875, 0.018093109130859375, 0.02246856689453125, 0.026844024658203125, 0.031219482421875, 0.035594940185546875, 0.03997039794921875, 0.044345855712890625, 0.0487213134765625, 0.053096771240234375, 0.05747222900390625, 0.061847686767578125, 0.06622314453125, 0.07059860229492188, 0.07497406005859375, 0.07934951782226562, 0.0837249755859375, 0.08810043334960938, 0.09247589111328125, 0.09685134887695312, 0.101226806640625, 0.10560226440429688, 0.10997772216796875, 0.11435317993164062, 0.1187286376953125, 0.12310409545898438, 0.12747955322265625, 0.13185501098632812, 0.13623046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 9.0, 14.0, 18.0, 23.0, 28.0, 27.0, 50.0, 61.0, 106.0, 175.0, 320.0, 798.0, 1307.0, 454.0, 245.0, 130.0, 96.0, 44.0, 32.0, 30.0, 18.0, 19.0, 8.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07843017578125, -0.076202392578125, -0.073974609375, -0.071746826171875, -0.06951904296875, -0.067291259765625, -0.0650634765625, -0.062835693359375, -0.06060791015625, -0.058380126953125, -0.05615234375, -0.053924560546875, -0.05169677734375, -0.049468994140625, -0.0472412109375, -0.045013427734375, -0.04278564453125, -0.040557861328125, -0.038330078125, -0.036102294921875, -0.03387451171875, -0.031646728515625, -0.0294189453125, -0.027191162109375, -0.02496337890625, -0.022735595703125, -0.0205078125, -0.018280029296875, -0.01605224609375, -0.013824462890625, -0.0115966796875, -0.009368896484375, -0.00714111328125, -0.004913330078125, -0.002685546875, -0.000457763671875, 0.00177001953125, 0.003997802734375, 0.0062255859375, 0.008453369140625, 0.01068115234375, 0.012908935546875, 0.01513671875, 0.017364501953125, 0.01959228515625, 0.021820068359375, 0.0240478515625, 0.026275634765625, 0.02850341796875, 0.030731201171875, 0.032958984375, 0.035186767578125, 0.03741455078125, 0.039642333984375, 0.0418701171875, 0.044097900390625, 0.04632568359375, 0.048553466796875, 0.05078125, 0.053009033203125, 0.05523681640625, 0.057464599609375, 0.0596923828125, 0.061920166015625, 0.06414794921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 16.0, 34.0, 48.0, 66.0, 79.0, 95.0, 92.0, 103.0, 101.0, 89.0, 87.0, 52.0, 37.0, 24.0, 20.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3733952045440674, -0.35986822843551636, -0.34634125232696533, -0.3328142762184143, -0.3192873001098633, -0.30576032400131226, -0.29223334789276123, -0.2787063717842102, -0.2651793956756592, -0.25165241956710815, -0.23812544345855713, -0.2245984673500061, -0.21107149124145508, -0.19754451513290405, -0.18401755392551422, -0.1704905778169632, -0.15696361660957336, -0.14343664050102234, -0.1299096643924713, -0.11638269573450089, -0.10285571962594986, -0.08932874351739883, -0.0758017748594284, -0.06227479875087738, -0.048747822642326355, -0.03522084653377533, -0.021693874150514603, -0.008166901767253876, 0.00536007434129715, 0.018887050449848175, 0.032414019107818604, 0.04594099521636963, 0.05946794152259827, 0.07299491763114929, 0.08652189373970032, 0.10004886239767075, 0.11357583850622177, 0.1271028220653534, 0.14062978327274323, 0.15415675938129425, 0.16768373548984528, 0.1812107115983963, 0.19473768770694733, 0.20826464891433716, 0.22179162502288818, 0.2353186011314392, 0.24884557723999023, 0.26237255334854126, 0.2758995294570923, 0.2894265055656433, 0.30295348167419434, 0.31648045778274536, 0.3300074338912964, 0.3435344099998474, 0.35706138610839844, 0.37058836221694946, 0.3841153383255005, 0.3976423144340515, 0.41116929054260254, 0.42469626665115356, 0.4382232427597046, 0.4517502188682556, 0.46527719497680664, 0.47880417108535767, 0.4923311173915863]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 2.0, 13.0, 6.0, 11.0, 10.0, 13.0, 15.0, 19.0, 34.0, 27.0, 22.0, 34.0, 33.0, 31.0, 36.0, 36.0, 45.0, 40.0, 42.0, 32.0, 34.0, 44.0, 36.0, 33.0, 46.0, 33.0, 28.0, 34.0, 27.0, 23.0, 23.0, 17.0, 18.0, 21.0, 10.0, 15.0, 10.0, 10.0, 5.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22394448518753052, -0.2160816788673401, -0.20821885764598846, -0.20035603642463684, -0.1924932301044464, -0.18463042378425598, -0.17676760256290436, -0.16890478134155273, -0.1610419750213623, -0.15317916870117188, -0.14531634747982025, -0.13745352625846863, -0.1295907199382782, -0.12172790616750717, -0.11386509239673615, -0.10600227862596512, -0.09813946485519409, -0.09027665108442307, -0.08241383731365204, -0.07455102354288101, -0.06668820977210999, -0.05882539600133896, -0.05096258223056793, -0.043099768459796906, -0.03523695468902588, -0.027374140918254852, -0.019511327147483826, -0.011648513376712799, -0.0037856996059417725, 0.004077114164829254, 0.01193992793560028, 0.019802741706371307, 0.027665555477142334, 0.03552836924791336, 0.04339118301868439, 0.051253996789455414, 0.05911681056022644, 0.06697962433099747, 0.0748424381017685, 0.08270525187253952, 0.09056806564331055, 0.09843087941408157, 0.1062936931848526, 0.11415650695562363, 0.12201932072639465, 0.12988212704658508, 0.1377449482679367, 0.14560776948928833, 0.15347057580947876, 0.1613333821296692, 0.1691962033510208, 0.17705902457237244, 0.18492183089256287, 0.1927846372127533, 0.20064745843410492, 0.20851027965545654, 0.21637308597564697, 0.2242358922958374, 0.23209871351718903, 0.23996153473854065, 0.24782434105873108, 0.2556871473789215, 0.2635499835014343, 0.27141278982162476, 0.2792755961418152]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 15.0, 18.0, 31.0, 35.0, 74.0, 129.0, 183.0, 310.0, 562.0, 965.0, 1841.0, 3500.0, 6742.0, 13667.0, 27426.0, 55606.0, 112224.0, 229189.0, 292245.0, 152645.0, 75911.0, 37570.0, 18262.0, 9180.0, 4743.0, 2375.0, 1338.0, 756.0, 377.0, 250.0, 142.0, 84.0, 57.0, 37.0, 23.0, 16.0, 7.0, 11.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1485595703125, -0.14434146881103516, -0.1401233673095703, -0.13590526580810547, -0.13168716430664062, -0.12746906280517578, -0.12325096130371094, -0.1190328598022461, -0.11481475830078125, -0.1105966567993164, -0.10637855529785156, -0.10216045379638672, -0.09794235229492188, -0.09372425079345703, -0.08950614929199219, -0.08528804779052734, -0.0810699462890625, -0.07685184478759766, -0.07263374328613281, -0.06841564178466797, -0.06419754028320312, -0.05997943878173828, -0.05576133728027344, -0.051543235778808594, -0.04732513427734375, -0.043107032775878906, -0.03888893127441406, -0.03467082977294922, -0.030452728271484375, -0.02623462677001953, -0.022016525268554688, -0.017798423767089844, -0.013580322265625, -0.009362220764160156, -0.0051441192626953125, -0.0009260177612304688, 0.003292083740234375, 0.007510185241699219, 0.011728286743164062, 0.015946388244628906, 0.02016448974609375, 0.024382591247558594, 0.028600692749023438, 0.03281879425048828, 0.037036895751953125, 0.04125499725341797, 0.04547309875488281, 0.049691200256347656, 0.0539093017578125, 0.058127403259277344, 0.06234550476074219, 0.06656360626220703, 0.07078170776367188, 0.07499980926513672, 0.07921791076660156, 0.0834360122680664, 0.08765411376953125, 0.0918722152709961, 0.09609031677246094, 0.10030841827392578, 0.10452651977539062, 0.10874462127685547, 0.11296272277832031, 0.11718082427978516, 0.12139892578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 11.0, 13.0, 19.0, 20.0, 24.0, 27.0, 20.0, 38.0, 48.0, 48.0, 49.0, 38.0, 44.0, 52.0, 51.0, 58.0, 54.0, 61.0, 46.0, 39.0, 34.0, 35.0, 23.0, 33.0, 17.0, 20.0, 12.0, 8.0, 11.0, 10.0, 3.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.047576904296875, -0.046154022216796875, -0.04473114013671875, -0.043308258056640625, -0.0418853759765625, -0.040462493896484375, -0.03903961181640625, -0.037616729736328125, -0.03619384765625, -0.034770965576171875, -0.03334808349609375, -0.031925201416015625, -0.0305023193359375, -0.029079437255859375, -0.02765655517578125, -0.026233673095703125, -0.024810791015625, -0.023387908935546875, -0.02196502685546875, -0.020542144775390625, -0.0191192626953125, -0.017696380615234375, -0.01627349853515625, -0.014850616455078125, -0.013427734375, -0.012004852294921875, -0.01058197021484375, -0.009159088134765625, -0.0077362060546875, -0.006313323974609375, -0.00489044189453125, -0.003467559814453125, -0.002044677734375, -0.000621795654296875, 0.00080108642578125, 0.002223968505859375, 0.0036468505859375, 0.005069732666015625, 0.00649261474609375, 0.007915496826171875, 0.00933837890625, 0.010761260986328125, 0.01218414306640625, 0.013607025146484375, 0.0150299072265625, 0.016452789306640625, 0.01787567138671875, 0.019298553466796875, 0.020721435546875, 0.022144317626953125, 0.02356719970703125, 0.024990081787109375, 0.0264129638671875, 0.027835845947265625, 0.02925872802734375, 0.030681610107421875, 0.0321044921875, 0.033527374267578125, 0.03495025634765625, 0.036373138427734375, 0.0377960205078125, 0.039218902587890625, 0.04064178466796875, 0.042064666748046875, 0.043487548828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 4.0, 8.0, 10.0, 14.0, 24.0, 29.0, 31.0, 39.0, 71.0, 58.0, 102.0, 144.0, 227.0, 350.0, 520.0, 943.0, 1866.0, 4623.0, 15741.0, 63439.0, 250382.0, 486325.0, 165009.0, 40917.0, 10623.0, 3362.0, 1442.0, 754.0, 499.0, 282.0, 195.0, 149.0, 120.0, 67.0, 47.0, 38.0, 30.0, 17.0, 12.0, 13.0, 9.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.219970703125, -0.21356582641601562, -0.20716094970703125, -0.20075607299804688, -0.1943511962890625, -0.18794631958007812, -0.18154144287109375, -0.17513656616210938, -0.168731689453125, -0.16232681274414062, -0.15592193603515625, -0.14951705932617188, -0.1431121826171875, -0.13670730590820312, -0.13030242919921875, -0.12389755249023438, -0.11749267578125, -0.11108779907226562, -0.10468292236328125, -0.09827804565429688, -0.0918731689453125, -0.08546829223632812, -0.07906341552734375, -0.07265853881835938, -0.066253662109375, -0.059848785400390625, -0.05344390869140625, -0.047039031982421875, -0.0406341552734375, -0.034229278564453125, -0.02782440185546875, -0.021419525146484375, -0.0150146484375, -0.008609771728515625, -0.00220489501953125, 0.004199981689453125, 0.0106048583984375, 0.017009735107421875, 0.02341461181640625, 0.029819488525390625, 0.036224365234375, 0.042629241943359375, 0.04903411865234375, 0.055438995361328125, 0.0618438720703125, 0.06824874877929688, 0.07465362548828125, 0.08105850219726562, 0.08746337890625, 0.09386825561523438, 0.10027313232421875, 0.10667800903320312, 0.1130828857421875, 0.11948776245117188, 0.12589263916015625, 0.13229751586914062, 0.138702392578125, 0.14510726928710938, 0.15151214599609375, 0.15791702270507812, 0.1643218994140625, 0.17072677612304688, 0.17713165283203125, 0.18353652954101562, 0.18994140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 15.0, 15.0, 19.0, 25.0, 33.0, 24.0, 30.0, 29.0, 34.0, 47.0, 35.0, 48.0, 55.0, 46.0, 45.0, 46.0, 50.0, 38.0, 30.0, 37.0, 38.0, 37.0, 34.0, 26.0, 31.0, 21.0, 13.0, 15.0, 13.0, 6.0, 5.0, 7.0, 4.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.1577930450439453, -0.15188980102539062, -0.14598655700683594, -0.14008331298828125, -0.13418006896972656, -0.12827682495117188, -0.12237358093261719, -0.1164703369140625, -0.11056709289550781, -0.10466384887695312, -0.09876060485839844, -0.09285736083984375, -0.08695411682128906, -0.08105087280273438, -0.07514762878417969, -0.069244384765625, -0.06334114074707031, -0.057437896728515625, -0.05153465270996094, -0.04563140869140625, -0.03972816467285156, -0.033824920654296875, -0.027921676635742188, -0.0220184326171875, -0.016115188598632812, -0.010211944580078125, -0.0043087005615234375, 0.00159454345703125, 0.0074977874755859375, 0.013401031494140625, 0.019304275512695312, 0.02520751953125, 0.031110763549804688, 0.037014007568359375, 0.04291725158691406, 0.04882049560546875, 0.05472373962402344, 0.060626983642578125, 0.06653022766113281, 0.0724334716796875, 0.07833671569824219, 0.08423995971679688, 0.09014320373535156, 0.09604644775390625, 0.10194969177246094, 0.10785293579101562, 0.11375617980957031, 0.119659423828125, 0.1255626678466797, 0.13146591186523438, 0.13736915588378906, 0.14327239990234375, 0.14917564392089844, 0.15507888793945312, 0.1609821319580078, 0.1668853759765625, 0.1727886199951172, 0.17869186401367188, 0.18459510803222656, 0.19049835205078125, 0.19640159606933594, 0.20230484008789062, 0.2082080841064453, 0.214111328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 17.0, 24.0, 17.0, 49.0, 54.0, 95.0, 169.0, 221.0, 378.0, 653.0, 1232.0, 2420.0, 5434.0, 13416.0, 41961.0, 186219.0, 558195.0, 175201.0, 39299.0, 12839.0, 5285.0, 2443.0, 1187.0, 660.0, 408.0, 221.0, 163.0, 81.0, 60.0, 42.0, 31.0, 28.0, 18.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11572265625, -0.11179733276367188, -0.10787200927734375, -0.10394668579101562, -0.1000213623046875, -0.09609603881835938, -0.09217071533203125, -0.08824539184570312, -0.084320068359375, -0.08039474487304688, -0.07646942138671875, -0.07254409790039062, -0.0686187744140625, -0.06469345092773438, -0.06076812744140625, -0.056842803955078125, -0.05291748046875, -0.048992156982421875, -0.04506683349609375, -0.041141510009765625, -0.0372161865234375, -0.033290863037109375, -0.02936553955078125, -0.025440216064453125, -0.021514892578125, -0.017589569091796875, -0.01366424560546875, -0.009738922119140625, -0.0058135986328125, -0.001888275146484375, 0.00203704833984375, 0.005962371826171875, 0.0098876953125, 0.013813018798828125, 0.01773834228515625, 0.021663665771484375, 0.0255889892578125, 0.029514312744140625, 0.03343963623046875, 0.037364959716796875, 0.041290283203125, 0.045215606689453125, 0.04914093017578125, 0.053066253662109375, 0.0569915771484375, 0.060916900634765625, 0.06484222412109375, 0.06876754760742188, 0.07269287109375, 0.07661819458007812, 0.08054351806640625, 0.08446884155273438, 0.0883941650390625, 0.09231948852539062, 0.09624481201171875, 0.10017013549804688, 0.104095458984375, 0.10802078247070312, 0.11194610595703125, 0.11587142944335938, 0.1197967529296875, 0.12372207641601562, 0.12764739990234375, 0.13157272338867188, 0.135498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 7.0, 4.0, 7.0, 8.0, 14.0, 28.0, 20.0, 25.0, 29.0, 49.0, 42.0, 52.0, 39.0, 73.0, 52.0, 57.0, 55.0, 74.0, 54.0, 58.0, 31.0, 43.0, 25.0, 29.0, 18.0, 19.0, 19.0, 8.0, 9.0, 6.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.7697296142578125e-05, -5.596969276666641e-05, -5.42420893907547e-05, -5.251448601484299e-05, -5.0786882638931274e-05, -4.905927926301956e-05, -4.733167588710785e-05, -4.5604072511196136e-05, -4.3876469135284424e-05, -4.214886575937271e-05, -4.0421262383461e-05, -3.8693659007549286e-05, -3.696605563163757e-05, -3.523845225572586e-05, -3.351084887981415e-05, -3.1783245503902435e-05, -3.0055642127990723e-05, -2.832803875207901e-05, -2.6600435376167297e-05, -2.4872832000255585e-05, -2.3145228624343872e-05, -2.141762524843216e-05, -1.9690021872520447e-05, -1.7962418496608734e-05, -1.623481512069702e-05, -1.4507211744785309e-05, -1.2779608368873596e-05, -1.1052004992961884e-05, -9.324401617050171e-06, -7.596798241138458e-06, -5.869194865226746e-06, -4.141591489315033e-06, -2.4139881134033203e-06, -6.863847374916077e-07, 1.041218638420105e-06, 2.7688220143318176e-06, 4.49642539024353e-06, 6.224028766155243e-06, 7.951632142066956e-06, 9.679235517978668e-06, 1.1406838893890381e-05, 1.3134442269802094e-05, 1.4862045645713806e-05, 1.658964902162552e-05, 1.831725239753723e-05, 2.0044855773448944e-05, 2.1772459149360657e-05, 2.350006252527237e-05, 2.5227665901184082e-05, 2.6955269277095795e-05, 2.8682872653007507e-05, 3.041047602891922e-05, 3.213807940483093e-05, 3.3865682780742645e-05, 3.559328615665436e-05, 3.732088953256607e-05, 3.904849290847778e-05, 4.0776096284389496e-05, 4.250369966030121e-05, 4.423130303621292e-05, 4.5958906412124634e-05, 4.7686509788036346e-05, 4.941411316394806e-05, 5.114171653985977e-05, 5.2869319915771484e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 15.0, 15.0, 21.0, 29.0, 42.0, 59.0, 80.0, 116.0, 202.0, 390.0, 769.0, 1668.0, 4286.0, 13076.0, 51713.0, 389074.0, 496643.0, 66137.0, 15336.0, 4981.0, 1953.0, 858.0, 383.0, 271.0, 130.0, 90.0, 58.0, 50.0, 24.0, 8.0, 13.0, 14.0, 7.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.1431884765625, -0.13872337341308594, -0.13425827026367188, -0.1297931671142578, -0.12532806396484375, -0.12086296081542969, -0.11639785766601562, -0.11193275451660156, -0.1074676513671875, -0.10300254821777344, -0.09853744506835938, -0.09407234191894531, -0.08960723876953125, -0.08514213562011719, -0.08067703247070312, -0.07621192932128906, -0.071746826171875, -0.06728172302246094, -0.06281661987304688, -0.05835151672363281, -0.05388641357421875, -0.04942131042480469, -0.044956207275390625, -0.04049110412597656, -0.0360260009765625, -0.03156089782714844, -0.027095794677734375, -0.022630691528320312, -0.01816558837890625, -0.013700485229492188, -0.009235382080078125, -0.0047702789306640625, -0.00030517578125, 0.0041599273681640625, 0.008625030517578125, 0.013090133666992188, 0.01755523681640625, 0.022020339965820312, 0.026485443115234375, 0.030950546264648438, 0.0354156494140625, 0.03988075256347656, 0.044345855712890625, 0.04881095886230469, 0.05327606201171875, 0.05774116516113281, 0.062206268310546875, 0.06667137145996094, 0.071136474609375, 0.07560157775878906, 0.08006668090820312, 0.08453178405761719, 0.08899688720703125, 0.09346199035644531, 0.09792709350585938, 0.10239219665527344, 0.1068572998046875, 0.11132240295410156, 0.11578750610351562, 0.12025260925292969, 0.12471771240234375, 0.1291828155517578, 0.13364791870117188, 0.13811302185058594, 0.142578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 4.0, 6.0, 5.0, 11.0, 16.0, 27.0, 54.0, 61.0, 113.0, 142.0, 170.0, 127.0, 85.0, 60.0, 36.0, 23.0, 14.0, 11.0, 13.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1988525390625, -0.19436073303222656, -0.18986892700195312, -0.1853771209716797, -0.18088531494140625, -0.1763935089111328, -0.17190170288085938, -0.16740989685058594, -0.1629180908203125, -0.15842628479003906, -0.15393447875976562, -0.1494426727294922, -0.14495086669921875, -0.1404590606689453, -0.13596725463867188, -0.13147544860839844, -0.126983642578125, -0.12249183654785156, -0.11800003051757812, -0.11350822448730469, -0.10901641845703125, -0.10452461242675781, -0.10003280639648438, -0.09554100036621094, -0.0910491943359375, -0.08655738830566406, -0.08206558227539062, -0.07757377624511719, -0.07308197021484375, -0.06859016418457031, -0.06409835815429688, -0.05960655212402344, -0.05511474609375, -0.05062294006347656, -0.046131134033203125, -0.04163932800292969, -0.03714752197265625, -0.03265571594238281, -0.028163909912109375, -0.023672103881835938, -0.0191802978515625, -0.014688491821289062, -0.010196685791015625, -0.0057048797607421875, -0.00121307373046875, 0.0032787322998046875, 0.007770538330078125, 0.012262344360351562, 0.016754150390625, 0.021245956420898438, 0.025737762451171875, 0.030229568481445312, 0.03472137451171875, 0.03921318054199219, 0.043704986572265625, 0.04819679260253906, 0.0526885986328125, 0.05718040466308594, 0.061672210693359375, 0.06616401672363281, 0.07065582275390625, 0.07514762878417969, 0.07963943481445312, 0.08413124084472656, 0.088623046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 24.0, 54.0, 84.0, 152.0, 189.0, 166.0, 131.0, 82.0, 59.0, 25.0, 12.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.302182197570801, -2.243377685546875, -2.18457293510437, -2.1257684230804443, -2.0669639110565186, -2.0081591606140137, -1.949354648590088, -1.890550136566162, -1.8317455053329468, -1.7729408740997314, -1.7141363620758057, -1.6553317308425903, -1.5965272188186646, -1.5377225875854492, -1.4789180755615234, -1.420113444328308, -1.3613088130950928, -1.3025041818618774, -1.2436996698379517, -1.1848950386047363, -1.1260905265808105, -1.0672858953475952, -1.0084812641143799, -0.9496767520904541, -0.8908722400665283, -0.8320676684379578, -0.7732630968093872, -0.7144584655761719, -0.6556538939476013, -0.5968493223190308, -0.5380447506904602, -0.47924014925956726, -0.4204355478286743, -0.36163097620010376, -0.3028263747692108, -0.24402180314064026, -0.1852172166109085, -0.12641263008117676, -0.0676080584526062, -0.008803457021713257, 0.0500011146068573, 0.10880570113658905, 0.1676102876663208, 0.22641485929489136, 0.2852194309234619, 0.34402403235435486, 0.4028286039829254, 0.46163320541381836, 0.5204377770423889, 0.5792423486709595, 0.63804692029953, 0.6968514919281006, 0.7556561231613159, 0.8144606947898865, 0.873265266418457, 0.9320698976516724, 0.9908744096755981, 1.0496790409088135, 1.1084835529327393, 1.1672881841659546, 1.2260926961898804, 1.2848973274230957, 1.3437018394470215, 1.4025064706802368, 1.4613111019134521]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 8.0, 6.0, 5.0, 5.0, 15.0, 14.0, 29.0, 14.0, 24.0, 26.0, 41.0, 34.0, 33.0, 41.0, 28.0, 32.0, 29.0, 41.0, 40.0, 37.0, 42.0, 37.0, 44.0, 36.0, 31.0, 26.0, 27.0, 24.0, 29.0, 31.0, 24.0, 15.0, 20.0, 11.0, 12.0, 11.0, 11.0, 9.0, 7.0, 3.0, 6.0, 9.0, 0.0, 9.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.9869225025177002, -0.9588083028793335, -0.9306941628456116, -0.9025799632072449, -0.8744657635688782, -0.8463516235351562, -0.8182374238967896, -0.7901232242584229, -0.7620090246200562, -0.7338948249816895, -0.7057806849479675, -0.6776664853096008, -0.6495522856712341, -0.6214381456375122, -0.5933239459991455, -0.5652097463607788, -0.5370956063270569, -0.5089814066886902, -0.4808672368526459, -0.45275306701660156, -0.42463886737823486, -0.39652469754219055, -0.36841052770614624, -0.34029632806777954, -0.31218215823173523, -0.2840679883956909, -0.2559537887573242, -0.2278396189212799, -0.1997254341840744, -0.1716112494468689, -0.14349707961082458, -0.11538289487361908, -0.08726876974105835, -0.05915458872914314, -0.031040407717227936, -0.0029262304306030273, 0.025187954306602478, 0.05330213904380798, 0.0814163088798523, 0.1095304936170578, 0.1376446783542633, 0.1657588630914688, 0.19387304782867432, 0.22198721766471863, 0.25010138750076294, 0.27821558713912964, 0.30632975697517395, 0.33444392681121826, 0.36255812644958496, 0.3906722962856293, 0.41878649592399597, 0.4469006657600403, 0.475014865398407, 0.5031290054321289, 0.5312432050704956, 0.5593574047088623, 0.587471604347229, 0.6155858039855957, 0.6436999440193176, 0.6718141436576843, 0.699928343296051, 0.728042483329773, 0.7561566829681396, 0.7842708826065063, 0.8123850226402283]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 4.0, 23.0, 23.0, 43.0, 60.0, 107.0, 125.0, 204.0, 376.0, 544.0, 1024.0, 1751.0, 3501.0, 7321.0, 17220.0, 47364.0, 172935.0, 2597360.0, 1141655.0, 133953.0, 39854.0, 15121.0, 6508.0, 3117.0, 1732.0, 915.0, 508.0, 301.0, 203.0, 131.0, 81.0, 58.0, 44.0, 26.0, 18.0, 14.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.148193359375, -0.14323997497558594, -0.13828659057617188, -0.1333332061767578, -0.12837982177734375, -0.12342643737792969, -0.11847305297851562, -0.11351966857910156, -0.1085662841796875, -0.10361289978027344, -0.09865951538085938, -0.09370613098144531, -0.08875274658203125, -0.08379936218261719, -0.07884597778320312, -0.07389259338378906, -0.068939208984375, -0.06398582458496094, -0.059032440185546875, -0.05407905578613281, -0.04912567138671875, -0.04417228698730469, -0.039218902587890625, -0.03426551818847656, -0.0293121337890625, -0.024358749389648438, -0.019405364990234375, -0.014451980590820312, -0.00949859619140625, -0.0045452117919921875, 0.000408172607421875, 0.0053615570068359375, 0.01031494140625, 0.015268325805664062, 0.020221710205078125, 0.025175094604492188, 0.03012847900390625, 0.03508186340332031, 0.040035247802734375, 0.04498863220214844, 0.0499420166015625, 0.05489540100097656, 0.059848785400390625, 0.06480216979980469, 0.06975555419921875, 0.07470893859863281, 0.07966232299804688, 0.08461570739746094, 0.089569091796875, 0.09452247619628906, 0.09947586059570312, 0.10442924499511719, 0.10938262939453125, 0.11433601379394531, 0.11928939819335938, 0.12424278259277344, 0.1291961669921875, 0.13414955139160156, 0.13910293579101562, 0.1440563201904297, 0.14900970458984375, 0.1539630889892578, 0.15891647338867188, 0.16386985778808594, 0.1688232421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 14.0, 12.0, 23.0, 19.0, 31.0, 24.0, 36.0, 44.0, 36.0, 56.0, 45.0, 44.0, 70.0, 60.0, 64.0, 63.0, 52.0, 46.0, 38.0, 40.0, 39.0, 23.0, 22.0, 17.0, 14.0, 9.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04901123046875, -0.04739570617675781, -0.045780181884765625, -0.04416465759277344, -0.04254913330078125, -0.04093360900878906, -0.039318084716796875, -0.03770256042480469, -0.0360870361328125, -0.03447151184082031, -0.032855987548828125, -0.031240463256835938, -0.02962493896484375, -0.028009414672851562, -0.026393890380859375, -0.024778366088867188, -0.023162841796875, -0.021547317504882812, -0.019931793212890625, -0.018316268920898438, -0.01670074462890625, -0.015085220336914062, -0.013469696044921875, -0.011854171752929688, -0.0102386474609375, -0.008623123168945312, -0.007007598876953125, -0.0053920745849609375, -0.00377655029296875, -0.0021610260009765625, -0.000545501708984375, 0.0010700225830078125, 0.002685546875, 0.0043010711669921875, 0.005916595458984375, 0.0075321197509765625, 0.00914764404296875, 0.010763168334960938, 0.012378692626953125, 0.013994216918945312, 0.0156097412109375, 0.017225265502929688, 0.018840789794921875, 0.020456314086914062, 0.02207183837890625, 0.023687362670898438, 0.025302886962890625, 0.026918411254882812, 0.028533935546875, 0.030149459838867188, 0.031764984130859375, 0.03338050842285156, 0.03499603271484375, 0.03661155700683594, 0.038227081298828125, 0.03984260559082031, 0.0414581298828125, 0.04307365417480469, 0.044689178466796875, 0.04630470275878906, 0.04792022705078125, 0.04953575134277344, 0.051151275634765625, 0.05276679992675781, 0.05438232421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 10.0, 13.0, 28.0, 25.0, 42.0, 71.0, 80.0, 171.0, 245.0, 413.0, 569.0, 1016.0, 1877.0, 3399.0, 7033.0, 15267.0, 36543.0, 102563.0, 386745.0, 2705067.0, 695706.0, 149714.0, 49771.0, 19435.0, 8859.0, 4178.0, 2242.0, 1195.0, 713.0, 471.0, 270.0, 184.0, 117.0, 79.0, 53.0, 31.0, 26.0, 13.0, 9.0, 11.0, 8.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1383056640625, -0.13407135009765625, -0.1298370361328125, -0.12560272216796875, -0.121368408203125, -0.11713409423828125, -0.1128997802734375, -0.10866546630859375, -0.10443115234375, -0.10019683837890625, -0.0959625244140625, -0.09172821044921875, -0.087493896484375, -0.08325958251953125, -0.0790252685546875, -0.07479095458984375, -0.070556640625, -0.06632232666015625, -0.0620880126953125, -0.05785369873046875, -0.053619384765625, -0.04938507080078125, -0.0451507568359375, -0.04091644287109375, -0.03668212890625, -0.03244781494140625, -0.0282135009765625, -0.02397918701171875, -0.019744873046875, -0.01551055908203125, -0.0112762451171875, -0.00704193115234375, -0.0028076171875, 0.00142669677734375, 0.0056610107421875, 0.00989532470703125, 0.014129638671875, 0.01836395263671875, 0.0225982666015625, 0.02683258056640625, 0.03106689453125, 0.03530120849609375, 0.0395355224609375, 0.04376983642578125, 0.048004150390625, 0.05223846435546875, 0.0564727783203125, 0.06070709228515625, 0.06494140625, 0.06917572021484375, 0.0734100341796875, 0.07764434814453125, 0.081878662109375, 0.08611297607421875, 0.0903472900390625, 0.09458160400390625, 0.09881591796875, 0.10305023193359375, 0.1072845458984375, 0.11151885986328125, 0.115753173828125, 0.11998748779296875, 0.1242218017578125, 0.12845611572265625, 0.1326904296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 9.0, 7.0, 9.0, 10.0, 19.0, 25.0, 25.0, 42.0, 63.0, 70.0, 101.0, 177.0, 261.0, 457.0, 1065.0, 766.0, 330.0, 195.0, 142.0, 87.0, 53.0, 45.0, 32.0, 21.0, 14.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0841064453125, -0.08154487609863281, -0.07898330688476562, -0.07642173767089844, -0.07386016845703125, -0.07129859924316406, -0.06873703002929688, -0.06617546081542969, -0.0636138916015625, -0.06105232238769531, -0.058490753173828125, -0.05592918395996094, -0.05336761474609375, -0.05080604553222656, -0.048244476318359375, -0.04568290710449219, -0.043121337890625, -0.04055976867675781, -0.037998199462890625, -0.03543663024902344, -0.03287506103515625, -0.030313491821289062, -0.027751922607421875, -0.025190353393554688, -0.0226287841796875, -0.020067214965820312, -0.017505645751953125, -0.014944076538085938, -0.01238250732421875, -0.009820938110351562, -0.007259368896484375, -0.0046977996826171875, -0.00213623046875, 0.0004253387451171875, 0.002986907958984375, 0.0055484771728515625, 0.00811004638671875, 0.010671615600585938, 0.013233184814453125, 0.015794754028320312, 0.0183563232421875, 0.020917892456054688, 0.023479461669921875, 0.026041030883789062, 0.02860260009765625, 0.031164169311523438, 0.033725738525390625, 0.03628730773925781, 0.038848876953125, 0.04141044616699219, 0.043972015380859375, 0.04653358459472656, 0.04909515380859375, 0.05165672302246094, 0.054218292236328125, 0.05677986145019531, 0.0593414306640625, 0.06190299987792969, 0.06446456909179688, 0.06702613830566406, 0.06958770751953125, 0.07214927673339844, 0.07471084594726562, 0.07727241516113281, 0.079833984375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 12.0, 28.0, 47.0, 68.0, 120.0, 137.0, 136.0, 116.0, 125.0, 88.0, 58.0, 29.0, 15.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1035006046295166, -1.0809924602508545, -1.058484435081482, -1.0359762907028198, -1.0134681463241577, -0.9909600615501404, -0.968451976776123, -0.9459438323974609, -0.9234357476234436, -0.9009276628494263, -0.8784195184707642, -0.8559114336967468, -0.8334033489227295, -0.8108952045440674, -0.78838711977005, -0.7658790349960327, -0.7433708906173706, -0.7208628058433533, -0.6983546614646912, -0.6758465766906738, -0.6533384323120117, -0.6308303475379944, -0.608322262763977, -0.5858141183853149, -0.5633060336112976, -0.5407979488372803, -0.5182898044586182, -0.49578171968460083, -0.4732736051082611, -0.4507654905319214, -0.42825740575790405, -0.40574929118156433, -0.3832412362098694, -0.36073312163352966, -0.33822500705718994, -0.3157169222831726, -0.2932088077068329, -0.27070069313049316, -0.24819259345531464, -0.2256844937801361, -0.2031763792037964, -0.18066826462745667, -0.15816016495227814, -0.1356520652770996, -0.11314395070075989, -0.09063584357500076, -0.06812773644924164, -0.04561963677406311, -0.02311152219772339, -0.0006034150719642639, 0.02190469205379486, 0.044412799179553986, 0.06692090630531311, 0.08942901343107224, 0.11193712055683136, 0.1344452202320099, 0.1569533348083496, 0.17946144938468933, 0.20196954905986786, 0.2244776487350464, 0.2469857633113861, 0.26949387788772583, 0.29200196266174316, 0.3145100772380829, 0.3370181918144226]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 2.0, 11.0, 7.0, 10.0, 20.0, 19.0, 18.0, 16.0, 25.0, 23.0, 31.0, 36.0, 43.0, 39.0, 45.0, 52.0, 46.0, 44.0, 45.0, 43.0, 45.0, 45.0, 44.0, 39.0, 26.0, 27.0, 35.0, 21.0, 23.0, 20.0, 21.0, 10.0, 10.0, 4.0, 4.0, 9.0, 14.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31915968656539917, -0.3087106943130493, -0.2982616722583771, -0.28781265020370483, -0.277363657951355, -0.2669146656990051, -0.2564656436443329, -0.24601663649082184, -0.2355676293373108, -0.22511862218379974, -0.2146696150302887, -0.20422060787677765, -0.1937716007232666, -0.18332259356975555, -0.1728735864162445, -0.16242457926273346, -0.1519755721092224, -0.14152656495571136, -0.13107755780220032, -0.12062855064868927, -0.11017954349517822, -0.09973053634166718, -0.08928152918815613, -0.07883252203464508, -0.06838351488113403, -0.057934507727622986, -0.04748550057411194, -0.03703649342060089, -0.026587486267089844, -0.016138479113578796, -0.005689471960067749, 0.004759535193443298, 0.015208542346954346, 0.025657549500465393, 0.03610655665397644, 0.04655556380748749, 0.057004570960998535, 0.06745357811450958, 0.07790258526802063, 0.08835159242153168, 0.09880059957504272, 0.10924960672855377, 0.11969861388206482, 0.13014762103557587, 0.14059662818908691, 0.15104563534259796, 0.161494642496109, 0.17194364964962006, 0.1823926568031311, 0.19284166395664215, 0.2032906711101532, 0.21373967826366425, 0.2241886854171753, 0.23463769257068634, 0.2450866997241974, 0.25553572177886963, 0.2659847140312195, 0.27643370628356934, 0.2868827283382416, 0.2973317503929138, 0.30778074264526367, 0.3182297348976135, 0.32867875695228577, 0.339127779006958, 0.34957677125930786]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 11.0, 12.0, 18.0, 33.0, 44.0, 58.0, 111.0, 173.0, 312.0, 523.0, 968.0, 1898.0, 3993.0, 8796.0, 21329.0, 58272.0, 212845.0, 551891.0, 120120.0, 39230.0, 15138.0, 6468.0, 2992.0, 1477.0, 808.0, 399.0, 253.0, 122.0, 85.0, 60.0, 31.0, 34.0, 21.0, 8.0, 4.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2281494140625, -0.22150039672851562, -0.21485137939453125, -0.20820236206054688, -0.2015533447265625, -0.19490432739257812, -0.18825531005859375, -0.18160629272460938, -0.174957275390625, -0.16830825805664062, -0.16165924072265625, -0.15501022338867188, -0.1483612060546875, -0.14171218872070312, -0.13506317138671875, -0.12841415405273438, -0.12176513671875, -0.11511611938476562, -0.10846710205078125, -0.10181808471679688, -0.0951690673828125, -0.08852005004882812, -0.08187103271484375, -0.07522201538085938, -0.068572998046875, -0.061923980712890625, -0.05527496337890625, -0.048625946044921875, -0.0419769287109375, -0.035327911376953125, -0.02867889404296875, -0.022029876708984375, -0.015380859375, -0.008731842041015625, -0.00208282470703125, 0.004566192626953125, 0.0112152099609375, 0.017864227294921875, 0.02451324462890625, 0.031162261962890625, 0.037811279296875, 0.044460296630859375, 0.05110931396484375, 0.057758331298828125, 0.0644073486328125, 0.07105636596679688, 0.07770538330078125, 0.08435440063476562, 0.09100341796875, 0.09765243530273438, 0.10430145263671875, 0.11095046997070312, 0.1175994873046875, 0.12424850463867188, 0.13089752197265625, 0.13754653930664062, 0.144195556640625, 0.15084457397460938, 0.15749359130859375, 0.16414260864257812, 0.1707916259765625, 0.17744064331054688, 0.18408966064453125, 0.19073867797851562, 0.1973876953125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 17.0, 8.0, 14.0, 21.0, 22.0, 24.0, 30.0, 38.0, 49.0, 32.0, 46.0, 59.0, 53.0, 62.0, 58.0, 66.0, 62.0, 57.0, 51.0, 41.0, 39.0, 27.0, 15.0, 18.0, 24.0, 14.0, 9.0, 9.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050811767578125, -0.049180030822753906, -0.04754829406738281, -0.04591655731201172, -0.044284820556640625, -0.04265308380126953, -0.04102134704589844, -0.039389610290527344, -0.03775787353515625, -0.036126136779785156, -0.03449440002441406, -0.03286266326904297, -0.031230926513671875, -0.02959918975830078, -0.027967453002929688, -0.026335716247558594, -0.0247039794921875, -0.023072242736816406, -0.021440505981445312, -0.01980876922607422, -0.018177032470703125, -0.01654529571533203, -0.014913558959960938, -0.013281822204589844, -0.01165008544921875, -0.010018348693847656, -0.008386611938476562, -0.006754875183105469, -0.005123138427734375, -0.0034914016723632812, -0.0018596649169921875, -0.00022792816162109375, 0.00140380859375, 0.0030355453491210938, 0.0046672821044921875, 0.006299018859863281, 0.007930755615234375, 0.009562492370605469, 0.011194229125976562, 0.012825965881347656, 0.01445770263671875, 0.016089439392089844, 0.017721176147460938, 0.01935291290283203, 0.020984649658203125, 0.02261638641357422, 0.024248123168945312, 0.025879859924316406, 0.0275115966796875, 0.029143333435058594, 0.030775070190429688, 0.03240680694580078, 0.034038543701171875, 0.03567028045654297, 0.03730201721191406, 0.038933753967285156, 0.04056549072265625, 0.042197227478027344, 0.04382896423339844, 0.04546070098876953, 0.047092437744140625, 0.04872417449951172, 0.05035591125488281, 0.051987648010253906, 0.053619384765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 6.0, 10.0, 15.0, 14.0, 19.0, 38.0, 31.0, 67.0, 66.0, 123.0, 161.0, 260.0, 377.0, 629.0, 1057.0, 2268.0, 6077.0, 20622.0, 95847.0, 631167.0, 231454.0, 40868.0, 10110.0, 3574.0, 1572.0, 744.0, 432.0, 281.0, 201.0, 128.0, 84.0, 63.0, 45.0, 44.0, 26.0, 24.0, 17.0, 9.0, 9.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2386474609375, -0.2308826446533203, -0.22311782836914062, -0.21535301208496094, -0.20758819580078125, -0.19982337951660156, -0.19205856323242188, -0.1842937469482422, -0.1765289306640625, -0.1687641143798828, -0.16099929809570312, -0.15323448181152344, -0.14546966552734375, -0.13770484924316406, -0.12994003295898438, -0.12217521667480469, -0.114410400390625, -0.10664558410644531, -0.09888076782226562, -0.09111595153808594, -0.08335113525390625, -0.07558631896972656, -0.06782150268554688, -0.06005668640136719, -0.0522918701171875, -0.04452705383300781, -0.036762237548828125, -0.028997421264648438, -0.02123260498046875, -0.013467788696289062, -0.005702972412109375, 0.0020618438720703125, 0.00982666015625, 0.017591476440429688, 0.025356292724609375, 0.03312110900878906, 0.04088592529296875, 0.04865074157714844, 0.056415557861328125, 0.06418037414550781, 0.0719451904296875, 0.07971000671386719, 0.08747482299804688, 0.09523963928222656, 0.10300445556640625, 0.11076927185058594, 0.11853408813476562, 0.1262989044189453, 0.134063720703125, 0.1418285369873047, 0.14959335327148438, 0.15735816955566406, 0.16512298583984375, 0.17288780212402344, 0.18065261840820312, 0.1884174346923828, 0.1961822509765625, 0.2039470672607422, 0.21171188354492188, 0.21947669982910156, 0.22724151611328125, 0.23500633239746094, 0.24277114868164062, 0.2505359649658203, 0.25830078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 6.0, 11.0, 14.0, 13.0, 15.0, 17.0, 21.0, 38.0, 34.0, 46.0, 46.0, 34.0, 56.0, 68.0, 57.0, 70.0, 54.0, 39.0, 44.0, 47.0, 47.0, 32.0, 30.0, 39.0, 29.0, 16.0, 16.0, 19.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.19736862182617188, -0.19026947021484375, -0.18317031860351562, -0.1760711669921875, -0.16897201538085938, -0.16187286376953125, -0.15477371215820312, -0.147674560546875, -0.14057540893554688, -0.13347625732421875, -0.12637710571289062, -0.1192779541015625, -0.11217880249023438, -0.10507965087890625, -0.09798049926757812, -0.09088134765625, -0.08378219604492188, -0.07668304443359375, -0.06958389282226562, -0.0624847412109375, -0.055385589599609375, -0.04828643798828125, -0.041187286376953125, -0.034088134765625, -0.026988983154296875, -0.01988983154296875, -0.012790679931640625, -0.0056915283203125, 0.001407623291015625, 0.00850677490234375, 0.015605926513671875, 0.022705078125, 0.029804229736328125, 0.03690338134765625, 0.044002532958984375, 0.0511016845703125, 0.058200836181640625, 0.06529998779296875, 0.07239913940429688, 0.079498291015625, 0.08659744262695312, 0.09369659423828125, 0.10079574584960938, 0.1078948974609375, 0.11499404907226562, 0.12209320068359375, 0.12919235229492188, 0.13629150390625, 0.14339065551757812, 0.15048980712890625, 0.15758895874023438, 0.1646881103515625, 0.17178726196289062, 0.17888641357421875, 0.18598556518554688, 0.193084716796875, 0.20018386840820312, 0.20728302001953125, 0.21438217163085938, 0.2214813232421875, 0.22858047485351562, 0.23567962646484375, 0.24277877807617188, 0.2498779296875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 7.0, 9.0, 17.0, 24.0, 37.0, 39.0, 72.0, 90.0, 141.0, 250.0, 462.0, 891.0, 2057.0, 5000.0, 13755.0, 43751.0, 222556.0, 634906.0, 85686.0, 24515.0, 8199.0, 3171.0, 1343.0, 643.0, 344.0, 205.0, 119.0, 70.0, 41.0, 36.0, 21.0, 22.0, 18.0, 11.0, 10.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1353759765625, -0.1314239501953125, -0.127471923828125, -0.1235198974609375, -0.11956787109375, -0.1156158447265625, -0.111663818359375, -0.1077117919921875, -0.103759765625, -0.0998077392578125, -0.095855712890625, -0.0919036865234375, -0.08795166015625, -0.0839996337890625, -0.080047607421875, -0.0760955810546875, -0.0721435546875, -0.0681915283203125, -0.064239501953125, -0.0602874755859375, -0.05633544921875, -0.0523834228515625, -0.048431396484375, -0.0444793701171875, -0.04052734375, -0.0365753173828125, -0.032623291015625, -0.0286712646484375, -0.02471923828125, -0.0207672119140625, -0.016815185546875, -0.0128631591796875, -0.0089111328125, -0.0049591064453125, -0.001007080078125, 0.0029449462890625, 0.00689697265625, 0.0108489990234375, 0.014801025390625, 0.0187530517578125, 0.022705078125, 0.0266571044921875, 0.030609130859375, 0.0345611572265625, 0.03851318359375, 0.0424652099609375, 0.046417236328125, 0.0503692626953125, 0.0543212890625, 0.0582733154296875, 0.062225341796875, 0.0661773681640625, 0.07012939453125, 0.0740814208984375, 0.078033447265625, 0.0819854736328125, 0.0859375, 0.0898895263671875, 0.093841552734375, 0.0977935791015625, 0.10174560546875, 0.1056976318359375, 0.109649658203125, 0.1136016845703125, 0.1175537109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 12.0, 5.0, 10.0, 19.0, 43.0, 64.0, 95.0, 130.0, 163.0, 118.0, 108.0, 72.0, 55.0, 30.0, 17.0, 13.0, 10.0, 9.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010323524475097656, -9.97716560959816e-05, -9.630806744098663e-05, -9.284447878599167e-05, -8.93808901309967e-05, -8.591730147600174e-05, -8.245371282100677e-05, -7.899012416601181e-05, -7.552653551101685e-05, -7.206294685602188e-05, -6.859935820102692e-05, -6.513576954603195e-05, -6.167218089103699e-05, -5.820859223604202e-05, -5.474500358104706e-05, -5.1281414926052094e-05, -4.781782627105713e-05, -4.4354237616062164e-05, -4.08906489610672e-05, -3.7427060306072235e-05, -3.396347165107727e-05, -3.0499882996082306e-05, -2.703629434108734e-05, -2.3572705686092377e-05, -2.0109117031097412e-05, -1.6645528376102448e-05, -1.3181939721107483e-05, -9.718351066112518e-06, -6.254762411117554e-06, -2.791173756122589e-06, 6.724148988723755e-07, 4.13600355386734e-06, 7.599592208862305e-06, 1.106318086385727e-05, 1.4526769518852234e-05, 1.79903581738472e-05, 2.1453946828842163e-05, 2.4917535483837128e-05, 2.8381124138832092e-05, 3.184471279382706e-05, 3.530830144882202e-05, 3.8771890103816986e-05, 4.223547875881195e-05, 4.5699067413806915e-05, 4.916265606880188e-05, 5.2626244723796844e-05, 5.608983337879181e-05, 5.9553422033786774e-05, 6.301701068878174e-05, 6.64805993437767e-05, 6.994418799877167e-05, 7.340777665376663e-05, 7.68713653087616e-05, 8.033495396375656e-05, 8.379854261875153e-05, 8.726213127374649e-05, 9.072571992874146e-05, 9.418930858373642e-05, 9.765289723873138e-05, 0.00010111648589372635, 0.00010458007454872131, 0.00010804366320371628, 0.00011150725185871124, 0.00011497084051370621, 0.00011843442916870117]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 12.0, 10.0, 14.0, 35.0, 59.0, 113.0, 183.0, 344.0, 836.0, 2126.0, 7674.0, 39488.0, 481664.0, 466170.0, 38558.0, 7550.0, 2049.0, 818.0, 349.0, 189.0, 112.0, 71.0, 39.0, 39.0, 16.0, 9.0, 4.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.16678428649902344, -0.16157150268554688, -0.1563587188720703, -0.15114593505859375, -0.1459331512451172, -0.14072036743164062, -0.13550758361816406, -0.1302947998046875, -0.12508201599121094, -0.11986923217773438, -0.11465644836425781, -0.10944366455078125, -0.10423088073730469, -0.09901809692382812, -0.09380531311035156, -0.088592529296875, -0.08337974548339844, -0.07816696166992188, -0.07295417785644531, -0.06774139404296875, -0.06252861022949219, -0.057315826416015625, -0.05210304260253906, -0.0468902587890625, -0.04167747497558594, -0.036464691162109375, -0.03125190734863281, -0.02603912353515625, -0.020826339721679688, -0.015613555908203125, -0.010400772094726562, -0.00518798828125, 2.47955322265625e-05, 0.005237579345703125, 0.010450363159179688, 0.01566314697265625, 0.020875930786132812, 0.026088714599609375, 0.03130149841308594, 0.0365142822265625, 0.04172706604003906, 0.046939849853515625, 0.05215263366699219, 0.05736541748046875, 0.06257820129394531, 0.06779098510742188, 0.07300376892089844, 0.078216552734375, 0.08342933654785156, 0.08864212036132812, 0.09385490417480469, 0.09906768798828125, 0.10428047180175781, 0.10949325561523438, 0.11470603942871094, 0.1199188232421875, 0.12513160705566406, 0.13034439086914062, 0.1355571746826172, 0.14076995849609375, 0.1459827423095703, 0.15119552612304688, 0.15640830993652344, 0.16162109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 7.0, 7.0, 10.0, 14.0, 9.0, 11.0, 11.0, 20.0, 22.0, 38.0, 50.0, 75.0, 136.0, 135.0, 125.0, 92.0, 64.0, 42.0, 35.0, 15.0, 18.0, 12.0, 14.0, 12.0, 5.0, 1.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.091064453125, -0.08809089660644531, -0.08511734008789062, -0.08214378356933594, -0.07917022705078125, -0.07619667053222656, -0.07322311401367188, -0.07024955749511719, -0.0672760009765625, -0.06430244445800781, -0.061328887939453125, -0.05835533142089844, -0.05538177490234375, -0.05240821838378906, -0.049434661865234375, -0.04646110534667969, -0.043487548828125, -0.04051399230957031, -0.037540435791015625, -0.03456687927246094, -0.03159332275390625, -0.028619766235351562, -0.025646209716796875, -0.022672653198242188, -0.0196990966796875, -0.016725540161132812, -0.013751983642578125, -0.010778427124023438, -0.00780487060546875, -0.0048313140869140625, -0.001857757568359375, 0.0011157989501953125, 0.00408935546875, 0.0070629119873046875, 0.010036468505859375, 0.013010025024414062, 0.01598358154296875, 0.018957138061523438, 0.021930694580078125, 0.024904251098632812, 0.0278778076171875, 0.030851364135742188, 0.033824920654296875, 0.03679847717285156, 0.03977203369140625, 0.04274559020996094, 0.045719146728515625, 0.04869270324707031, 0.051666259765625, 0.05463981628417969, 0.057613372802734375, 0.06058692932128906, 0.06356048583984375, 0.06653404235839844, 0.06950759887695312, 0.07248115539550781, 0.0754547119140625, 0.07842826843261719, 0.08140182495117188, 0.08437538146972656, 0.08734893798828125, 0.09032249450683594, 0.09329605102539062, 0.09626960754394531, 0.0992431640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 13.0, 21.0, 43.0, 69.0, 112.0, 137.0, 176.0, 148.0, 108.0, 76.0, 44.0, 26.0, 12.0, 12.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.679431676864624, -1.6258400678634644, -1.5722485780715942, -1.5186569690704346, -1.465065360069275, -1.4114737510681152, -1.3578822612762451, -1.3042906522750854, -1.2506990432739258, -1.1971074342727661, -1.143515944480896, -1.0899243354797363, -1.0363327264785767, -0.9827411770820618, -0.9291496276855469, -0.8755580186843872, -0.8219665288925171, -0.7683749794960022, -0.7147833704948425, -0.6611918210983276, -0.607600212097168, -0.5540086627006531, -0.5004171133041382, -0.4468255341053009, -0.3932339549064636, -0.33964237570762634, -0.28605079650878906, -0.23245924711227417, -0.1788676679134369, -0.1252760887145996, -0.07168453931808472, -0.018092960119247437, 0.035498738288879395, 0.08909031003713608, 0.14268188178539276, 0.19627344608306885, 0.24986502528190613, 0.3034566044807434, 0.3570481538772583, 0.4106397330760956, 0.46423131227493286, 0.5178228616714478, 0.5714144706726074, 0.6250060200691223, 0.6785975694656372, 0.7321891784667969, 0.7857807278633118, 0.8393722772598267, 0.8929638862609863, 0.9465554356575012, 1.0001469850540161, 1.0537385940551758, 1.1073302030563354, 1.1609218120574951, 1.2145133018493652, 1.268104910850525, 1.3216965198516846, 1.3752881288528442, 1.4288796186447144, 1.482471227645874, 1.5360628366470337, 1.5896544456481934, 1.6432459354400635, 1.6968375444412231, 1.7504290342330933]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 7.0, 5.0, 12.0, 10.0, 7.0, 15.0, 30.0, 23.0, 41.0, 29.0, 20.0, 39.0, 40.0, 38.0, 29.0, 42.0, 39.0, 38.0, 48.0, 64.0, 48.0, 38.0, 39.0, 34.0, 29.0, 32.0, 31.0, 21.0, 31.0, 19.0, 11.0, 21.0, 14.0, 10.0, 10.0, 10.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0763580799102783, -1.04521906375885, -1.0140800476074219, -0.9829409718513489, -0.9518018960952759, -0.9206628799438477, -0.8895238041877747, -0.8583847880363464, -0.8272457122802734, -0.7961066961288452, -0.7649676203727722, -0.733828604221344, -0.702689528465271, -0.6715505123138428, -0.6404114365577698, -0.6092724204063416, -0.5781333446502686, -0.5469943284988403, -0.5158552527427673, -0.4847162067890167, -0.4535771608352661, -0.4224381446838379, -0.3912990689277649, -0.36016005277633667, -0.32902103662490845, -0.29788199067115784, -0.2667429447174072, -0.23560389876365662, -0.204464852809906, -0.1733258217573166, -0.14218677580356598, -0.11104772984981537, -0.07990866899490356, -0.048769623041152954, -0.017630580812692642, 0.01350846141576767, 0.04464750736951828, 0.0757865458726883, 0.1069255918264389, 0.13806463778018951, 0.16920368373394012, 0.20034272968769073, 0.23148177564144135, 0.26262080669403076, 0.29375985264778137, 0.324898898601532, 0.3560379445552826, 0.3871769905090332, 0.4183160364627838, 0.4494550824165344, 0.48059412837028503, 0.5117331743240356, 0.5428721904754639, 0.5740112662315369, 0.6051502823829651, 0.6362893581390381, 0.6674283742904663, 0.6985673904418945, 0.7297064661979675, 0.7608454823493958, 0.7919845581054688, 0.823123574256897, 0.85426265001297, 0.8854016661643982, 0.9165407419204712]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 9.0, 7.0, 10.0, 4.0, 10.0, 16.0, 37.0, 45.0, 80.0, 118.0, 188.0, 256.0, 391.0, 670.0, 1011.0, 1825.0, 3231.0, 5862.0, 11367.0, 23507.0, 57239.0, 183316.0, 2663310.0, 1009977.0, 141477.0, 47735.0, 20495.0, 9952.0, 5104.0, 2908.0, 1581.0, 964.0, 556.0, 348.0, 229.0, 149.0, 106.0, 64.0, 41.0, 30.0, 17.0, 13.0, 7.0, 10.0, 3.0, 4.0, 9.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1431884765625, -0.13896560668945312, -0.13474273681640625, -0.13051986694335938, -0.1262969970703125, -0.12207412719726562, -0.11785125732421875, -0.11362838745117188, -0.109405517578125, -0.10518264770507812, -0.10095977783203125, -0.09673690795898438, -0.0925140380859375, -0.08829116821289062, -0.08406829833984375, -0.07984542846679688, -0.07562255859375, -0.07139968872070312, -0.06717681884765625, -0.06295394897460938, -0.0587310791015625, -0.054508209228515625, -0.05028533935546875, -0.046062469482421875, -0.041839599609375, -0.037616729736328125, -0.03339385986328125, -0.029170989990234375, -0.0249481201171875, -0.020725250244140625, -0.01650238037109375, -0.012279510498046875, -0.008056640625, -0.003833770751953125, 0.00038909912109375, 0.004611968994140625, 0.0088348388671875, 0.013057708740234375, 0.01728057861328125, 0.021503448486328125, 0.025726318359375, 0.029949188232421875, 0.03417205810546875, 0.038394927978515625, 0.0426177978515625, 0.046840667724609375, 0.05106353759765625, 0.055286407470703125, 0.05950927734375, 0.06373214721679688, 0.06795501708984375, 0.07217788696289062, 0.0764007568359375, 0.08062362670898438, 0.08484649658203125, 0.08906936645507812, 0.093292236328125, 0.09751510620117188, 0.10173797607421875, 0.10596084594726562, 0.1101837158203125, 0.11440658569335938, 0.11862945556640625, 0.12285232543945312, 0.1270751953125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 8.0, 7.0, 10.0, 15.0, 16.0, 22.0, 26.0, 27.0, 37.0, 30.0, 32.0, 45.0, 40.0, 47.0, 50.0, 47.0, 45.0, 43.0, 56.0, 52.0, 51.0, 49.0, 37.0, 35.0, 44.0, 28.0, 12.0, 18.0, 13.0, 6.0, 12.0, 6.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052215576171875, -0.050655364990234375, -0.04909515380859375, -0.047534942626953125, -0.0459747314453125, -0.044414520263671875, -0.04285430908203125, -0.041294097900390625, -0.03973388671875, -0.038173675537109375, -0.03661346435546875, -0.035053253173828125, -0.0334930419921875, -0.031932830810546875, -0.03037261962890625, -0.028812408447265625, -0.027252197265625, -0.025691986083984375, -0.02413177490234375, -0.022571563720703125, -0.0210113525390625, -0.019451141357421875, -0.01789093017578125, -0.016330718994140625, -0.0147705078125, -0.013210296630859375, -0.01165008544921875, -0.010089874267578125, -0.0085296630859375, -0.006969451904296875, -0.00540924072265625, -0.003849029541015625, -0.002288818359375, -0.000728607177734375, 0.00083160400390625, 0.002391815185546875, 0.0039520263671875, 0.005512237548828125, 0.00707244873046875, 0.008632659912109375, 0.01019287109375, 0.011753082275390625, 0.01331329345703125, 0.014873504638671875, 0.0164337158203125, 0.017993927001953125, 0.01955413818359375, 0.021114349365234375, 0.022674560546875, 0.024234771728515625, 0.02579498291015625, 0.027355194091796875, 0.0289154052734375, 0.030475616455078125, 0.03203582763671875, 0.033596038818359375, 0.03515625, 0.036716461181640625, 0.03827667236328125, 0.039836883544921875, 0.0413970947265625, 0.042957305908203125, 0.04451751708984375, 0.046077728271484375, 0.047637939453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 14.0, 17.0, 24.0, 53.0, 44.0, 80.0, 118.0, 183.0, 222.0, 392.0, 555.0, 871.0, 1347.0, 2425.0, 4150.0, 8156.0, 16919.0, 40728.0, 119891.0, 614775.0, 2944332.0, 303307.0, 78312.0, 29183.0, 12983.0, 6263.0, 3564.0, 1927.0, 1199.0, 710.0, 424.0, 350.0, 243.0, 151.0, 109.0, 81.0, 60.0, 30.0, 34.0, 13.0, 14.0, 6.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.1624755859375, -0.15774154663085938, -0.15300750732421875, -0.14827346801757812, -0.1435394287109375, -0.13880538940429688, -0.13407135009765625, -0.12933731079101562, -0.124603271484375, -0.11986923217773438, -0.11513519287109375, -0.11040115356445312, -0.1056671142578125, -0.10093307495117188, -0.09619903564453125, -0.09146499633789062, -0.08673095703125, -0.08199691772460938, -0.07726287841796875, -0.07252883911132812, -0.0677947998046875, -0.06306076049804688, -0.05832672119140625, -0.053592681884765625, -0.048858642578125, -0.044124603271484375, -0.03939056396484375, -0.034656524658203125, -0.0299224853515625, -0.025188446044921875, -0.02045440673828125, -0.015720367431640625, -0.010986328125, -0.006252288818359375, -0.00151824951171875, 0.003215789794921875, 0.0079498291015625, 0.012683868408203125, 0.01741790771484375, 0.022151947021484375, 0.026885986328125, 0.031620025634765625, 0.03635406494140625, 0.041088104248046875, 0.0458221435546875, 0.050556182861328125, 0.05529022216796875, 0.060024261474609375, 0.06475830078125, 0.06949234008789062, 0.07422637939453125, 0.07896041870117188, 0.0836944580078125, 0.08842849731445312, 0.09316253662109375, 0.09789657592773438, 0.102630615234375, 0.10736465454101562, 0.11209869384765625, 0.11683273315429688, 0.1215667724609375, 0.12630081176757812, 0.13103485107421875, 0.13576889038085938, 0.1405029296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 17.0, 30.0, 36.0, 61.0, 84.0, 158.0, 344.0, 1219.0, 1300.0, 365.0, 166.0, 103.0, 58.0, 27.0, 18.0, 19.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12310791015625, -0.11959266662597656, -0.11607742309570312, -0.11256217956542969, -0.10904693603515625, -0.10553169250488281, -0.10201644897460938, -0.09850120544433594, -0.0949859619140625, -0.09147071838378906, -0.08795547485351562, -0.08444023132324219, -0.08092498779296875, -0.07740974426269531, -0.07389450073242188, -0.07037925720214844, -0.066864013671875, -0.06334877014160156, -0.059833526611328125, -0.05631828308105469, -0.05280303955078125, -0.04928779602050781, -0.045772552490234375, -0.04225730895996094, -0.0387420654296875, -0.03522682189941406, -0.031711578369140625, -0.028196334838867188, -0.02468109130859375, -0.021165847778320312, -0.017650604248046875, -0.014135360717773438, -0.0106201171875, -0.0071048736572265625, -0.003589630126953125, -7.43865966796875e-05, 0.00344085693359375, 0.0069561004638671875, 0.010471343994140625, 0.013986587524414062, 0.0175018310546875, 0.021017074584960938, 0.024532318115234375, 0.028047561645507812, 0.03156280517578125, 0.03507804870605469, 0.038593292236328125, 0.04210853576660156, 0.045623779296875, 0.04913902282714844, 0.052654266357421875, 0.05616950988769531, 0.05968475341796875, 0.06319999694824219, 0.06671524047851562, 0.07023048400878906, 0.0737457275390625, 0.07726097106933594, 0.08077621459960938, 0.08429145812988281, 0.08780670166015625, 0.09132194519042969, 0.09483718872070312, 0.09835243225097656, 0.10186767578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 9.0, 21.0, 28.0, 52.0, 68.0, 96.0, 112.0, 121.0, 129.0, 111.0, 69.0, 51.0, 40.0, 30.0, 11.0, 13.0, 6.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5777998566627502, -0.5606703758239746, -0.543540894985199, -0.5264114141464233, -0.5092819333076477, -0.49215245246887207, -0.47502294182777405, -0.4578934609889984, -0.4407639801502228, -0.42363449931144714, -0.4065050184726715, -0.3893755376338959, -0.37224602699279785, -0.3551165461540222, -0.3379870653152466, -0.32085758447647095, -0.3037281036376953, -0.2865986227989197, -0.26946914196014404, -0.2523396611213684, -0.23521016538143158, -0.21808068454265594, -0.20095118880271912, -0.18382170796394348, -0.16669222712516785, -0.1495627462863922, -0.13243326544761658, -0.11530376970767975, -0.09817428886890411, -0.08104480803012848, -0.06391531974077225, -0.046785831451416016, -0.02965635061264038, -0.012526866048574448, 0.004602618515491486, 0.02173210307955742, 0.03886158764362335, 0.05599106848239899, 0.07312055677175522, 0.09025004506111145, 0.10737952589988708, 0.12450900673866272, 0.14163848757743835, 0.15876798331737518, 0.17589746415615082, 0.19302694499492645, 0.21015644073486328, 0.22728592157363892, 0.24441540241241455, 0.2615448832511902, 0.2786743640899658, 0.29580384492874146, 0.3129333257675171, 0.3300628066062927, 0.34719231724739075, 0.3643217980861664, 0.381451278924942, 0.39858075976371765, 0.4157102406024933, 0.4328397214412689, 0.44996923208236694, 0.4670987129211426, 0.4842281937599182, 0.5013576745986938, 0.5184871554374695]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 16.0, 18.0, 12.0, 12.0, 22.0, 13.0, 22.0, 22.0, 30.0, 23.0, 32.0, 42.0, 44.0, 45.0, 31.0, 55.0, 51.0, 50.0, 38.0, 51.0, 33.0, 41.0, 26.0, 39.0, 28.0, 23.0, 35.0, 12.0, 15.0, 27.0, 16.0, 8.0, 11.0, 10.0, 11.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.32235443592071533, -0.3130477964878082, -0.3037411570549011, -0.294434517621994, -0.2851278781890869, -0.2758212685585022, -0.2665145993232727, -0.257207989692688, -0.24790135025978088, -0.23859471082687378, -0.22928807139396667, -0.21998143196105957, -0.21067480742931366, -0.20136816799640656, -0.19206152856349945, -0.18275490403175354, -0.17344824969768524, -0.16414161026477814, -0.15483497083187103, -0.14552834630012512, -0.13622170686721802, -0.1269150674343109, -0.11760842800140381, -0.1083017960190773, -0.0989951565861702, -0.08968851715326309, -0.08038188517093658, -0.07107524573802948, -0.061768610030412674, -0.05246197432279587, -0.04315533488988876, -0.033848702907562256, -0.02454206347465515, -0.01523542683571577, -0.00592879019677639, 0.003377847373485565, 0.012684483081102371, 0.021991118788719177, 0.03129775822162628, 0.04060439020395279, 0.049911029636859894, 0.0592176653444767, 0.0685243010520935, 0.07783094048500061, 0.08713757991790771, 0.09644421190023422, 0.10575085133314133, 0.11505748331546783, 0.12436412274837494, 0.13367076218128204, 0.14297740161418915, 0.15228402614593506, 0.16159066557884216, 0.17089730501174927, 0.18020394444465637, 0.18951058387756348, 0.19881722331047058, 0.20812386274337769, 0.2174305021762848, 0.2267371416091919, 0.2360437661409378, 0.2453504055738449, 0.2546570301055908, 0.2639636695384979, 0.27327030897140503]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 15.0, 17.0, 15.0, 36.0, 39.0, 66.0, 98.0, 173.0, 270.0, 648.0, 1452.0, 3746.0, 10120.0, 27465.0, 83558.0, 437707.0, 369806.0, 73505.0, 24616.0, 9085.0, 3494.0, 1311.0, 583.0, 276.0, 157.0, 95.0, 72.0, 31.0, 25.0, 18.0, 11.0, 11.0, 3.0, 1.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197265625, -0.19127845764160156, -0.18529129028320312, -0.1793041229248047, -0.17331695556640625, -0.1673297882080078, -0.16134262084960938, -0.15535545349121094, -0.1493682861328125, -0.14338111877441406, -0.13739395141601562, -0.1314067840576172, -0.12541961669921875, -0.11943244934082031, -0.11344528198242188, -0.10745811462402344, -0.101470947265625, -0.09548377990722656, -0.08949661254882812, -0.08350944519042969, -0.07752227783203125, -0.07153511047363281, -0.06554794311523438, -0.05956077575683594, -0.0535736083984375, -0.04758644104003906, -0.041599273681640625, -0.03561210632324219, -0.02962493896484375, -0.023637771606445312, -0.017650604248046875, -0.011663436889648438, -0.00567626953125, 0.0003108978271484375, 0.006298065185546875, 0.012285232543945312, 0.01827239990234375, 0.024259567260742188, 0.030246734619140625, 0.03623390197753906, 0.0422210693359375, 0.04820823669433594, 0.054195404052734375, 0.06018257141113281, 0.06616973876953125, 0.07215690612792969, 0.07814407348632812, 0.08413124084472656, 0.090118408203125, 0.09610557556152344, 0.10209274291992188, 0.10807991027832031, 0.11406707763671875, 0.12005424499511719, 0.12604141235351562, 0.13202857971191406, 0.1380157470703125, 0.14400291442871094, 0.14999008178710938, 0.1559772491455078, 0.16196441650390625, 0.1679515838623047, 0.17393875122070312, 0.17992591857910156, 0.1859130859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 5.0, 6.0, 18.0, 17.0, 18.0, 19.0, 15.0, 27.0, 36.0, 31.0, 36.0, 50.0, 40.0, 39.0, 58.0, 54.0, 58.0, 40.0, 49.0, 47.0, 50.0, 36.0, 36.0, 40.0, 40.0, 18.0, 18.0, 15.0, 16.0, 14.0, 11.0, 13.0, 4.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.052520751953125, -0.05094099044799805, -0.049361228942871094, -0.04778146743774414, -0.04620170593261719, -0.044621944427490234, -0.04304218292236328, -0.04146242141723633, -0.039882659912109375, -0.03830289840698242, -0.03672313690185547, -0.035143375396728516, -0.03356361389160156, -0.03198385238647461, -0.030404090881347656, -0.028824329376220703, -0.02724456787109375, -0.025664806365966797, -0.024085044860839844, -0.02250528335571289, -0.020925521850585938, -0.019345760345458984, -0.01776599884033203, -0.016186237335205078, -0.014606475830078125, -0.013026714324951172, -0.011446952819824219, -0.009867191314697266, -0.008287429809570312, -0.006707668304443359, -0.005127906799316406, -0.003548145294189453, -0.0019683837890625, -0.0003886222839355469, 0.0011911392211914062, 0.0027709007263183594, 0.0043506622314453125, 0.005930423736572266, 0.007510185241699219, 0.009089946746826172, 0.010669708251953125, 0.012249469757080078, 0.013829231262207031, 0.015408992767333984, 0.016988754272460938, 0.01856851577758789, 0.020148277282714844, 0.021728038787841797, 0.02330780029296875, 0.024887561798095703, 0.026467323303222656, 0.02804708480834961, 0.029626846313476562, 0.031206607818603516, 0.03278636932373047, 0.03436613082885742, 0.035945892333984375, 0.03752565383911133, 0.03910541534423828, 0.040685176849365234, 0.04226493835449219, 0.04384469985961914, 0.045424461364746094, 0.04700422286987305, 0.048583984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 4.0, 11.0, 11.0, 14.0, 21.0, 20.0, 34.0, 35.0, 67.0, 84.0, 129.0, 228.0, 355.0, 637.0, 1275.0, 2537.0, 5699.0, 12946.0, 30417.0, 87118.0, 525656.0, 283734.0, 56825.0, 22615.0, 9479.0, 4267.0, 1974.0, 982.0, 468.0, 284.0, 189.0, 132.0, 76.0, 53.0, 34.0, 37.0, 23.0, 20.0, 16.0, 8.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1845703125, -0.17894744873046875, -0.1733245849609375, -0.16770172119140625, -0.162078857421875, -0.15645599365234375, -0.1508331298828125, -0.14521026611328125, -0.13958740234375, -0.13396453857421875, -0.1283416748046875, -0.12271881103515625, -0.117095947265625, -0.11147308349609375, -0.1058502197265625, -0.10022735595703125, -0.0946044921875, -0.08898162841796875, -0.0833587646484375, -0.07773590087890625, -0.072113037109375, -0.06649017333984375, -0.0608673095703125, -0.05524444580078125, -0.04962158203125, -0.04399871826171875, -0.0383758544921875, -0.03275299072265625, -0.027130126953125, -0.02150726318359375, -0.0158843994140625, -0.01026153564453125, -0.004638671875, 0.00098419189453125, 0.0066070556640625, 0.01222991943359375, 0.017852783203125, 0.02347564697265625, 0.0290985107421875, 0.03472137451171875, 0.04034423828125, 0.04596710205078125, 0.0515899658203125, 0.05721282958984375, 0.062835693359375, 0.06845855712890625, 0.0740814208984375, 0.07970428466796875, 0.0853271484375, 0.09095001220703125, 0.0965728759765625, 0.10219573974609375, 0.107818603515625, 0.11344146728515625, 0.1190643310546875, 0.12468719482421875, 0.13031005859375, 0.13593292236328125, 0.1415557861328125, 0.14717864990234375, 0.152801513671875, 0.15842437744140625, 0.1640472412109375, 0.16967010498046875, 0.17529296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 1.0, 9.0, 7.0, 6.0, 9.0, 13.0, 11.0, 17.0, 16.0, 23.0, 29.0, 27.0, 31.0, 44.0, 38.0, 40.0, 37.0, 45.0, 50.0, 46.0, 37.0, 49.0, 44.0, 48.0, 33.0, 38.0, 33.0, 35.0, 21.0, 28.0, 25.0, 21.0, 19.0, 15.0, 10.0, 6.0, 11.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.220947265625, -0.21445846557617188, -0.20796966552734375, -0.20148086547851562, -0.1949920654296875, -0.18850326538085938, -0.18201446533203125, -0.17552566528320312, -0.169036865234375, -0.16254806518554688, -0.15605926513671875, -0.14957046508789062, -0.1430816650390625, -0.13659286499023438, -0.13010406494140625, -0.12361526489257812, -0.11712646484375, -0.11063766479492188, -0.10414886474609375, -0.09766006469726562, -0.0911712646484375, -0.08468246459960938, -0.07819366455078125, -0.07170486450195312, -0.065216064453125, -0.058727264404296875, -0.05223846435546875, -0.045749664306640625, -0.0392608642578125, -0.032772064208984375, -0.02628326416015625, -0.019794464111328125, -0.0133056640625, -0.006816864013671875, -0.00032806396484375, 0.006160736083984375, 0.0126495361328125, 0.019138336181640625, 0.02562713623046875, 0.032115936279296875, 0.038604736328125, 0.045093536376953125, 0.05158233642578125, 0.058071136474609375, 0.0645599365234375, 0.07104873657226562, 0.07753753662109375, 0.08402633666992188, 0.09051513671875, 0.09700393676757812, 0.10349273681640625, 0.10998153686523438, 0.1164703369140625, 0.12295913696289062, 0.12944793701171875, 0.13593673706054688, 0.142425537109375, 0.14891433715820312, 0.15540313720703125, 0.16189193725585938, 0.1683807373046875, 0.17486953735351562, 0.18135833740234375, 0.18784713745117188, 0.1943359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 12.0, 6.0, 14.0, 23.0, 25.0, 33.0, 65.0, 103.0, 163.0, 282.0, 530.0, 931.0, 1892.0, 4160.0, 9224.0, 21380.0, 51593.0, 272314.0, 559298.0, 74862.0, 28782.0, 12379.0, 5380.0, 2447.0, 1134.0, 661.0, 362.0, 175.0, 106.0, 94.0, 45.0, 30.0, 17.0, 12.0, 14.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0955810546875, -0.09278392791748047, -0.08998680114746094, -0.0871896743774414, -0.08439254760742188, -0.08159542083740234, -0.07879829406738281, -0.07600116729736328, -0.07320404052734375, -0.07040691375732422, -0.06760978698730469, -0.06481266021728516, -0.062015533447265625, -0.059218406677246094, -0.05642127990722656, -0.05362415313720703, -0.0508270263671875, -0.04802989959716797, -0.04523277282714844, -0.042435646057128906, -0.039638519287109375, -0.036841392517089844, -0.03404426574707031, -0.03124713897705078, -0.02845001220703125, -0.02565288543701172, -0.022855758666992188, -0.020058631896972656, -0.017261505126953125, -0.014464378356933594, -0.011667251586914062, -0.008870124816894531, -0.006072998046875, -0.0032758712768554688, -0.0004787445068359375, 0.0023183822631835938, 0.005115509033203125, 0.007912635803222656, 0.010709762573242188, 0.013506889343261719, 0.01630401611328125, 0.01910114288330078, 0.021898269653320312, 0.024695396423339844, 0.027492523193359375, 0.030289649963378906, 0.03308677673339844, 0.03588390350341797, 0.0386810302734375, 0.04147815704345703, 0.04427528381347656, 0.047072410583496094, 0.049869537353515625, 0.052666664123535156, 0.05546379089355469, 0.05826091766357422, 0.06105804443359375, 0.06385517120361328, 0.06665229797363281, 0.06944942474365234, 0.07224655151367188, 0.0750436782836914, 0.07784080505371094, 0.08063793182373047, 0.08343505859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 18.0, 23.0, 32.0, 38.0, 57.0, 87.0, 114.0, 106.0, 92.0, 85.0, 82.0, 60.0, 39.0, 37.0, 31.0, 22.0, 10.0, 13.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.00010013580322265625, -9.7629614174366e-05, -9.512342512607574e-05, -9.261723607778549e-05, -9.011104702949524e-05, -8.760485798120499e-05, -8.509866893291473e-05, -8.259247988462448e-05, -8.008629083633423e-05, -7.758010178804398e-05, -7.507391273975372e-05, -7.256772369146347e-05, -7.006153464317322e-05, -6.755534559488297e-05, -6.504915654659271e-05, -6.254296749830246e-05, -6.003677845001221e-05, -5.7530589401721954e-05, -5.50244003534317e-05, -5.251821130514145e-05, -5.0012022256851196e-05, -4.7505833208560944e-05, -4.499964416027069e-05, -4.249345511198044e-05, -3.9987266063690186e-05, -3.748107701539993e-05, -3.497488796710968e-05, -3.246869891881943e-05, -2.9962509870529175e-05, -2.7456320822238922e-05, -2.495013177394867e-05, -2.2443942725658417e-05, -1.9937753677368164e-05, -1.743156462907791e-05, -1.4925375580787659e-05, -1.2419186532497406e-05, -9.912997484207153e-06, -7.406808435916901e-06, -4.900619387626648e-06, -2.3944303393363953e-06, 1.1175870895385742e-07, 2.61794775724411e-06, 5.124136805534363e-06, 7.630325853824615e-06, 1.0136514902114868e-05, 1.2642703950405121e-05, 1.5148892998695374e-05, 1.7655082046985626e-05, 2.016127109527588e-05, 2.266746014356613e-05, 2.5173649191856384e-05, 2.7679838240146637e-05, 3.018602728843689e-05, 3.269221633672714e-05, 3.5198405385017395e-05, 3.770459443330765e-05, 4.02107834815979e-05, 4.271697252988815e-05, 4.5223161578178406e-05, 4.772935062646866e-05, 5.023553967475891e-05, 5.2741728723049164e-05, 5.5247917771339417e-05, 5.775410681962967e-05, 6.026029586791992e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 11.0, 13.0, 14.0, 28.0, 64.0, 61.0, 116.0, 177.0, 301.0, 592.0, 1162.0, 2901.0, 8085.0, 24248.0, 87975.0, 727625.0, 145267.0, 32746.0, 10431.0, 3632.0, 1517.0, 703.0, 339.0, 201.0, 124.0, 78.0, 40.0, 32.0, 14.0, 22.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.08953285217285156, -0.08617019653320312, -0.08280754089355469, -0.07944488525390625, -0.07608222961425781, -0.07271957397460938, -0.06935691833496094, -0.0659942626953125, -0.06263160705566406, -0.059268951416015625, -0.05590629577636719, -0.05254364013671875, -0.04918098449707031, -0.045818328857421875, -0.04245567321777344, -0.039093017578125, -0.03573036193847656, -0.032367706298828125, -0.029005050659179688, -0.02564239501953125, -0.022279739379882812, -0.018917083740234375, -0.015554428100585938, -0.0121917724609375, -0.008829116821289062, -0.005466461181640625, -0.0021038055419921875, 0.00125885009765625, 0.0046215057373046875, 0.007984161376953125, 0.011346817016601562, 0.01470947265625, 0.018072128295898438, 0.021434783935546875, 0.024797439575195312, 0.02816009521484375, 0.03152275085449219, 0.034885406494140625, 0.03824806213378906, 0.0416107177734375, 0.04497337341308594, 0.048336029052734375, 0.05169868469238281, 0.05506134033203125, 0.05842399597167969, 0.061786651611328125, 0.06514930725097656, 0.068511962890625, 0.07187461853027344, 0.07523727416992188, 0.07859992980957031, 0.08196258544921875, 0.08532524108886719, 0.08868789672851562, 0.09205055236816406, 0.0954132080078125, 0.09877586364746094, 0.10213851928710938, 0.10550117492675781, 0.10886383056640625, 0.11222648620605469, 0.11558914184570312, 0.11895179748535156, 0.122314453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 9.0, 8.0, 13.0, 12.0, 12.0, 21.0, 45.0, 63.0, 130.0, 180.0, 180.0, 126.0, 59.0, 38.0, 22.0, 15.0, 10.0, 10.0, 5.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1019287109375, -0.09862804412841797, -0.09532737731933594, -0.0920267105102539, -0.08872604370117188, -0.08542537689208984, -0.08212471008300781, -0.07882404327392578, -0.07552337646484375, -0.07222270965576172, -0.06892204284667969, -0.06562137603759766, -0.062320709228515625, -0.059020042419433594, -0.05571937561035156, -0.05241870880126953, -0.0491180419921875, -0.04581737518310547, -0.04251670837402344, -0.039216041564941406, -0.035915374755859375, -0.032614707946777344, -0.029314041137695312, -0.02601337432861328, -0.02271270751953125, -0.01941204071044922, -0.016111373901367188, -0.012810707092285156, -0.009510040283203125, -0.006209373474121094, -0.0029087066650390625, 0.00039196014404296875, 0.003692626953125, 0.006993293762207031, 0.010293960571289062, 0.013594627380371094, 0.016895294189453125, 0.020195960998535156, 0.023496627807617188, 0.02679729461669922, 0.03009796142578125, 0.03339862823486328, 0.03669929504394531, 0.039999961853027344, 0.043300628662109375, 0.046601295471191406, 0.04990196228027344, 0.05320262908935547, 0.0565032958984375, 0.05980396270751953, 0.06310462951660156, 0.0664052963256836, 0.06970596313476562, 0.07300662994384766, 0.07630729675292969, 0.07960796356201172, 0.08290863037109375, 0.08620929718017578, 0.08950996398925781, 0.09281063079833984, 0.09611129760742188, 0.0994119644165039, 0.10271263122558594, 0.10601329803466797, 0.10931396484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 13.0, 40.0, 62.0, 95.0, 133.0, 162.0, 170.0, 130.0, 92.0, 50.0, 22.0, 11.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.187971591949463, -2.1345534324645996, -2.0811355113983154, -2.027717351913452, -1.9742993116378784, -1.9208812713623047, -1.8674631118774414, -1.8140450716018677, -1.760627031326294, -1.7072089910507202, -1.653790831565857, -1.6003727912902832, -1.5469547510147095, -1.4935367107391357, -1.4401185512542725, -1.3867005109786987, -1.333282470703125, -1.2798644304275513, -1.226446270942688, -1.1730282306671143, -1.1196101903915405, -1.0661921501159668, -1.0127739906311035, -0.9593559503555298, -0.9059377908706665, -0.852519690990448, -0.7991016507148743, -0.7456835508346558, -0.692265510559082, -0.6388474106788635, -0.585429310798645, -0.5320112705230713, -0.47859323024749756, -0.42517516016960144, -0.3717570900917053, -0.3183389902114868, -0.2649209499359131, -0.21150285005569458, -0.15808477997779846, -0.10466670989990234, -0.051248639822006226, 0.002169433981180191, 0.05558750778436661, 0.10900558531284332, 0.16242365539073944, 0.21584174036979675, 0.26925981044769287, 0.322677880525589, 0.3760959506034851, 0.4295140206813812, 0.48293209075927734, 0.5363501906394958, 0.5897682309150696, 0.6431863307952881, 0.6966043710708618, 0.7500224709510803, 0.8034405708312988, 0.8568586707115173, 0.9102767109870911, 0.9636948108673096, 1.0171128511428833, 1.070530891418457, 1.1239490509033203, 1.177367091178894, 1.2307851314544678]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 3.0, 9.0, 12.0, 15.0, 15.0, 16.0, 23.0, 28.0, 27.0, 33.0, 37.0, 44.0, 46.0, 40.0, 38.0, 44.0, 47.0, 34.0, 46.0, 39.0, 30.0, 44.0, 35.0, 39.0, 37.0, 30.0, 25.0, 23.0, 23.0, 17.0, 24.0, 8.0, 13.0, 11.0, 10.0, 7.0, 0.0, 4.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.9527403116226196, -0.9240773916244507, -0.8954145312309265, -0.8667516112327576, -0.8380887508392334, -0.8094258308410645, -0.7807629108428955, -0.7520999908447266, -0.7234371304512024, -0.6947742104530334, -0.6661113500595093, -0.6374484300613403, -0.6087855100631714, -0.5801226496696472, -0.5514597296714783, -0.5227968692779541, -0.49413394927978516, -0.4654710590839386, -0.43680816888809204, -0.4081452488899231, -0.37948235869407654, -0.35081946849823, -0.32215654850006104, -0.2934936583042145, -0.2648307681083679, -0.23616787791252136, -0.2075049728155136, -0.17884206771850586, -0.1501791775226593, -0.12151628732681274, -0.09285338222980499, -0.06419047713279724, -0.03552752733230591, -0.006864629685878754, 0.0217982679605484, 0.050461165606975555, 0.07912406325340271, 0.10778695344924927, 0.13644985854625702, 0.16511276364326477, 0.19377565383911133, 0.22243854403495789, 0.25110143423080444, 0.2797643542289734, 0.30842724442481995, 0.3370901346206665, 0.36575305461883545, 0.394415944814682, 0.42307883501052856, 0.4517417252063751, 0.4804046154022217, 0.5090675354003906, 0.5377304553985596, 0.5663933157920837, 0.5950562357902527, 0.6237190961837769, 0.6523820161819458, 0.6810449361801147, 0.7097077965736389, 0.7383707165718079, 0.767033576965332, 0.795696496963501, 0.8243594169616699, 0.8530223369598389, 0.881685197353363]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 4.0, 6.0, 13.0, 18.0, 20.0, 24.0, 38.0, 55.0, 106.0, 139.0, 184.0, 347.0, 508.0, 813.0, 1365.0, 2384.0, 4421.0, 8805.0, 17998.0, 43305.0, 131267.0, 986459.0, 2741983.0, 161614.0, 50654.0, 20711.0, 9770.0, 4918.0, 2565.0, 1448.0, 845.0, 529.0, 340.0, 220.0, 115.0, 84.0, 57.0, 39.0, 23.0, 21.0, 17.0, 16.0, 10.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.181640625, -0.1759777069091797, -0.17031478881835938, -0.16465187072753906, -0.15898895263671875, -0.15332603454589844, -0.14766311645507812, -0.1420001983642578, -0.1363372802734375, -0.1306743621826172, -0.12501144409179688, -0.11934852600097656, -0.11368560791015625, -0.10802268981933594, -0.10235977172851562, -0.09669685363769531, -0.091033935546875, -0.08537101745605469, -0.07970809936523438, -0.07404518127441406, -0.06838226318359375, -0.06271934509277344, -0.057056427001953125, -0.05139350891113281, -0.0457305908203125, -0.04006767272949219, -0.034404754638671875, -0.028741836547851562, -0.02307891845703125, -0.017416000366210938, -0.011753082275390625, -0.0060901641845703125, -0.00042724609375, 0.0052356719970703125, 0.010898590087890625, 0.016561508178710938, 0.02222442626953125, 0.027887344360351562, 0.033550262451171875, 0.03921318054199219, 0.0448760986328125, 0.05053901672363281, 0.056201934814453125, 0.06186485290527344, 0.06752777099609375, 0.07319068908691406, 0.07885360717773438, 0.08451652526855469, 0.090179443359375, 0.09584236145019531, 0.10150527954101562, 0.10716819763183594, 0.11283111572265625, 0.11849403381347656, 0.12415695190429688, 0.1298198699951172, 0.1354827880859375, 0.1411457061767578, 0.14680862426757812, 0.15247154235839844, 0.15813446044921875, 0.16379737854003906, 0.16946029663085938, 0.1751232147216797, 0.1807861328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 13.0, 14.0, 18.0, 18.0, 19.0, 20.0, 21.0, 27.0, 19.0, 41.0, 46.0, 50.0, 38.0, 49.0, 54.0, 56.0, 52.0, 45.0, 52.0, 48.0, 58.0, 33.0, 34.0, 28.0, 19.0, 28.0, 17.0, 14.0, 15.0, 7.0, 8.0, 7.0, 8.0, 4.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0518798828125, -0.05023765563964844, -0.048595428466796875, -0.04695320129394531, -0.04531097412109375, -0.04366874694824219, -0.042026519775390625, -0.04038429260253906, -0.0387420654296875, -0.03709983825683594, -0.035457611083984375, -0.03381538391113281, -0.03217315673828125, -0.030530929565429688, -0.028888702392578125, -0.027246475219726562, -0.025604248046875, -0.023962020874023438, -0.022319793701171875, -0.020677566528320312, -0.01903533935546875, -0.017393112182617188, -0.015750885009765625, -0.014108657836914062, -0.0124664306640625, -0.010824203491210938, -0.009181976318359375, -0.0075397491455078125, -0.00589752197265625, -0.0042552947998046875, -0.002613067626953125, -0.0009708404541015625, 0.00067138671875, 0.0023136138916015625, 0.003955841064453125, 0.0055980682373046875, 0.00724029541015625, 0.008882522583007812, 0.010524749755859375, 0.012166976928710938, 0.0138092041015625, 0.015451431274414062, 0.017093658447265625, 0.018735885620117188, 0.02037811279296875, 0.022020339965820312, 0.023662567138671875, 0.025304794311523438, 0.026947021484375, 0.028589248657226562, 0.030231475830078125, 0.03187370300292969, 0.03351593017578125, 0.03515815734863281, 0.036800384521484375, 0.03844261169433594, 0.0400848388671875, 0.04172706604003906, 0.043369293212890625, 0.04501152038574219, 0.04665374755859375, 0.04829597473144531, 0.049938201904296875, 0.05158042907714844, 0.05322265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 9.0, 12.0, 11.0, 22.0, 19.0, 38.0, 36.0, 53.0, 62.0, 89.0, 120.0, 170.0, 322.0, 613.0, 1239.0, 2790.0, 7135.0, 21469.0, 91021.0, 1172408.0, 2745620.0, 111592.0, 25245.0, 8125.0, 3013.0, 1342.0, 648.0, 367.0, 177.0, 132.0, 94.0, 54.0, 45.0, 37.0, 31.0, 22.0, 18.0, 18.0, 13.0, 13.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.339599609375, -0.3293266296386719, -0.31905364990234375, -0.3087806701660156, -0.2985076904296875, -0.2882347106933594, -0.27796173095703125, -0.2676887512207031, -0.257415771484375, -0.24714279174804688, -0.23686981201171875, -0.22659683227539062, -0.2163238525390625, -0.20605087280273438, -0.19577789306640625, -0.18550491333007812, -0.17523193359375, -0.16495895385742188, -0.15468597412109375, -0.14441299438476562, -0.1341400146484375, -0.12386703491210938, -0.11359405517578125, -0.10332107543945312, -0.093048095703125, -0.08277511596679688, -0.07250213623046875, -0.062229156494140625, -0.0519561767578125, -0.041683197021484375, -0.03141021728515625, -0.021137237548828125, -0.0108642578125, -0.000591278076171875, 0.00968170166015625, 0.019954681396484375, 0.0302276611328125, 0.040500640869140625, 0.05077362060546875, 0.061046600341796875, 0.071319580078125, 0.08159255981445312, 0.09186553955078125, 0.10213851928710938, 0.1124114990234375, 0.12268447875976562, 0.13295745849609375, 0.14323043823242188, 0.15350341796875, 0.16377639770507812, 0.17404937744140625, 0.18432235717773438, 0.1945953369140625, 0.20486831665039062, 0.21514129638671875, 0.22541427612304688, 0.235687255859375, 0.24596023559570312, 0.25623321533203125, 0.2665061950683594, 0.2767791748046875, 0.2870521545410156, 0.29732513427734375, 0.3075981140136719, 0.31787109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 9.0, 6.0, 16.0, 17.0, 42.0, 63.0, 136.0, 249.0, 992.0, 1847.0, 327.0, 149.0, 80.0, 47.0, 19.0, 25.0, 14.0, 16.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.206298828125, -0.20088577270507812, -0.19547271728515625, -0.19005966186523438, -0.1846466064453125, -0.17923355102539062, -0.17382049560546875, -0.16840744018554688, -0.162994384765625, -0.15758132934570312, -0.15216827392578125, -0.14675521850585938, -0.1413421630859375, -0.13592910766601562, -0.13051605224609375, -0.12510299682617188, -0.11968994140625, -0.11427688598632812, -0.10886383056640625, -0.10345077514648438, -0.0980377197265625, -0.09262466430664062, -0.08721160888671875, -0.08179855346679688, -0.076385498046875, -0.07097244262695312, -0.06555938720703125, -0.060146331787109375, -0.0547332763671875, -0.049320220947265625, -0.04390716552734375, -0.038494110107421875, -0.0330810546875, -0.027667999267578125, -0.02225494384765625, -0.016841888427734375, -0.0114288330078125, -0.006015777587890625, -0.00060272216796875, 0.004810333251953125, 0.010223388671875, 0.015636444091796875, 0.02104949951171875, 0.026462554931640625, 0.0318756103515625, 0.037288665771484375, 0.04270172119140625, 0.048114776611328125, 0.05352783203125, 0.058940887451171875, 0.06435394287109375, 0.06976699829101562, 0.0751800537109375, 0.08059310913085938, 0.08600616455078125, 0.09141921997070312, 0.096832275390625, 0.10224533081054688, 0.10765838623046875, 0.11307144165039062, 0.1184844970703125, 0.12389755249023438, 0.12931060791015625, 0.13472366333007812, 0.14013671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 7.0, 16.0, 20.0, 34.0, 36.0, 64.0, 79.0, 108.0, 116.0, 119.0, 103.0, 77.0, 69.0, 45.0, 22.0, 20.0, 12.0, 10.0, 11.0, 4.0, 3.0, 9.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44253700971603394, -0.4220002591609955, -0.40146347880363464, -0.3809267282485962, -0.36038994789123535, -0.3398531973361969, -0.31931644678115845, -0.2987796664237976, -0.27824291586875916, -0.2577061653137207, -0.23716938495635986, -0.2166326344013214, -0.19609586894512177, -0.17555910348892212, -0.15502235293388367, -0.13448558747768402, -0.11394882202148438, -0.09341205656528473, -0.07287529855966568, -0.05233853682875633, -0.031801775097846985, -0.011265009641647339, 0.00927174836397171, 0.02980850636959076, 0.050345271825790405, 0.07088203728199005, 0.0914187952876091, 0.11195555329322815, 0.1324923187494278, 0.15302908420562744, 0.1735658347606659, 0.19410260021686554, 0.2146393060684204, 0.23517607152462006, 0.2557128369808197, 0.27624958753585815, 0.296786367893219, 0.31732311844825745, 0.3378598690032959, 0.35839664936065674, 0.3789333999156952, 0.39947015047073364, 0.4200069308280945, 0.44054368138313293, 0.4610804319381714, 0.4816172122955322, 0.5021539926528931, 0.5226907134056091, 0.54322749376297, 0.5637642741203308, 0.5843009948730469, 0.6048377752304077, 0.6253745555877686, 0.6459113359451294, 0.6664480566978455, 0.6869848370552063, 0.7075215578079224, 0.7280583381652832, 0.7485950589179993, 0.7691318392753601, 0.789668619632721, 0.810205340385437, 0.8307421207427979, 0.8512789011001587, 0.8718156814575195]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 5.0, 5.0, 5.0, 11.0, 6.0, 10.0, 15.0, 12.0, 15.0, 18.0, 25.0, 14.0, 22.0, 29.0, 24.0, 24.0, 29.0, 42.0, 42.0, 47.0, 42.0, 44.0, 33.0, 37.0, 51.0, 48.0, 37.0, 39.0, 35.0, 29.0, 37.0, 27.0, 31.0, 20.0, 15.0, 14.0, 16.0, 13.0, 8.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348694384098053, -0.3364925682544708, -0.32429075241088867, -0.31208890676498413, -0.299887090921402, -0.2876852750778198, -0.27548345923423767, -0.2632816433906555, -0.251079797744751, -0.23887798190116882, -0.22667615115642548, -0.21447433531284332, -0.20227250456809998, -0.19007068872451782, -0.17786887288093567, -0.16566704213619232, -0.15346522629261017, -0.14126341044902802, -0.12906157970428467, -0.11685976386070251, -0.10465793311595917, -0.09245611727237701, -0.08025429397821426, -0.06805247068405151, -0.05585064738988876, -0.04364882409572601, -0.03144700080156326, -0.01924518123269081, -0.007043357938528061, 0.005158465355634689, 0.01736028492450714, 0.02956210821866989, 0.04176393151283264, 0.05396575480699539, 0.06616757810115814, 0.0783693939447403, 0.09057122468948364, 0.1027730405330658, 0.11497486382722855, 0.1271766871213913, 0.13937851786613464, 0.1515803337097168, 0.16378216445446014, 0.1759839802980423, 0.18818581104278564, 0.2003876268863678, 0.21258944272994995, 0.2247912734746933, 0.23699308931827545, 0.2491949051618576, 0.26139673590660095, 0.2735985517501831, 0.28580036759376526, 0.2980022132396698, 0.31020402908325195, 0.3224058449268341, 0.33460766077041626, 0.3468094766139984, 0.35901129245758057, 0.3712131381034851, 0.38341495394706726, 0.3956167697906494, 0.40781858563423157, 0.4200204014778137, 0.43222224712371826]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 5.0, 12.0, 15.0, 10.0, 31.0, 47.0, 66.0, 89.0, 136.0, 206.0, 332.0, 568.0, 863.0, 1404.0, 2450.0, 4215.0, 7644.0, 13814.0, 25203.0, 45690.0, 81530.0, 149181.0, 267475.0, 203805.0, 107782.0, 59706.0, 33626.0, 18618.0, 10418.0, 5736.0, 3152.0, 1835.0, 1126.0, 647.0, 397.0, 268.0, 153.0, 103.0, 72.0, 47.0, 24.0, 16.0, 10.0, 9.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11859130859375, -0.11485481262207031, -0.11111831665039062, -0.10738182067871094, -0.10364532470703125, -0.09990882873535156, -0.09617233276367188, -0.09243583679199219, -0.0886993408203125, -0.08496284484863281, -0.08122634887695312, -0.07748985290527344, -0.07375335693359375, -0.07001686096191406, -0.06628036499023438, -0.06254386901855469, -0.058807373046875, -0.05507087707519531, -0.051334381103515625, -0.04759788513183594, -0.04386138916015625, -0.04012489318847656, -0.036388397216796875, -0.03265190124511719, -0.0289154052734375, -0.025178909301757812, -0.021442413330078125, -0.017705917358398438, -0.01396942138671875, -0.010232925415039062, -0.006496429443359375, -0.0027599334716796875, 0.0009765625, 0.0047130584716796875, 0.008449554443359375, 0.012186050415039062, 0.01592254638671875, 0.019659042358398438, 0.023395538330078125, 0.027132034301757812, 0.0308685302734375, 0.03460502624511719, 0.038341522216796875, 0.04207801818847656, 0.04581451416015625, 0.04955101013183594, 0.053287506103515625, 0.05702400207519531, 0.060760498046875, 0.06449699401855469, 0.06823348999023438, 0.07196998596191406, 0.07570648193359375, 0.07944297790527344, 0.08317947387695312, 0.08691596984863281, 0.0906524658203125, 0.09438896179199219, 0.09812545776367188, 0.10186195373535156, 0.10559844970703125, 0.10933494567871094, 0.11307144165039062, 0.11680793762207031, 0.12054443359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 13.0, 11.0, 16.0, 21.0, 27.0, 31.0, 28.0, 33.0, 32.0, 35.0, 29.0, 41.0, 50.0, 51.0, 55.0, 46.0, 53.0, 49.0, 45.0, 27.0, 37.0, 43.0, 34.0, 35.0, 24.0, 17.0, 18.0, 16.0, 8.0, 11.0, 9.0, 6.0, 11.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0548095703125, -0.053148746490478516, -0.05148792266845703, -0.04982709884643555, -0.04816627502441406, -0.04650545120239258, -0.044844627380371094, -0.04318380355834961, -0.041522979736328125, -0.03986215591430664, -0.038201332092285156, -0.03654050827026367, -0.03487968444824219, -0.0332188606262207, -0.03155803680419922, -0.029897212982177734, -0.02823638916015625, -0.026575565338134766, -0.02491474151611328, -0.023253917694091797, -0.021593093872070312, -0.019932270050048828, -0.018271446228027344, -0.01661062240600586, -0.014949798583984375, -0.01328897476196289, -0.011628150939941406, -0.009967327117919922, -0.008306503295898438, -0.006645679473876953, -0.004984855651855469, -0.0033240318298339844, -0.0016632080078125, -2.384185791015625e-06, 0.0016584396362304688, 0.003319263458251953, 0.0049800872802734375, 0.006640911102294922, 0.008301734924316406, 0.00996255874633789, 0.011623382568359375, 0.01328420639038086, 0.014945030212402344, 0.016605854034423828, 0.018266677856445312, 0.019927501678466797, 0.02158832550048828, 0.023249149322509766, 0.02490997314453125, 0.026570796966552734, 0.02823162078857422, 0.029892444610595703, 0.03155326843261719, 0.03321409225463867, 0.034874916076660156, 0.03653573989868164, 0.038196563720703125, 0.03985738754272461, 0.041518211364746094, 0.04317903518676758, 0.04483985900878906, 0.04650068283081055, 0.04816150665283203, 0.049822330474853516, 0.051483154296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 16.0, 19.0, 29.0, 40.0, 48.0, 71.0, 118.0, 121.0, 200.0, 292.0, 451.0, 712.0, 1167.0, 2622.0, 7088.0, 26073.0, 111909.0, 524565.0, 285357.0, 63190.0, 15364.0, 4529.0, 1846.0, 952.0, 579.0, 376.0, 230.0, 137.0, 113.0, 82.0, 56.0, 38.0, 33.0, 23.0, 18.0, 11.0, 18.0, 14.0, 2.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.263671875, -0.2551116943359375, -0.246551513671875, -0.2379913330078125, -0.22943115234375, -0.2208709716796875, -0.212310791015625, -0.2037506103515625, -0.1951904296875, -0.1866302490234375, -0.178070068359375, -0.1695098876953125, -0.16094970703125, -0.1523895263671875, -0.143829345703125, -0.1352691650390625, -0.126708984375, -0.1181488037109375, -0.109588623046875, -0.1010284423828125, -0.09246826171875, -0.0839080810546875, -0.075347900390625, -0.0667877197265625, -0.0582275390625, -0.0496673583984375, -0.041107177734375, -0.0325469970703125, -0.02398681640625, -0.0154266357421875, -0.006866455078125, 0.0016937255859375, 0.01025390625, 0.0188140869140625, 0.027374267578125, 0.0359344482421875, 0.04449462890625, 0.0530548095703125, 0.061614990234375, 0.0701751708984375, 0.0787353515625, 0.0872955322265625, 0.095855712890625, 0.1044158935546875, 0.11297607421875, 0.1215362548828125, 0.130096435546875, 0.1386566162109375, 0.147216796875, 0.1557769775390625, 0.164337158203125, 0.1728973388671875, 0.18145751953125, 0.1900177001953125, 0.198577880859375, 0.2071380615234375, 0.2156982421875, 0.2242584228515625, 0.232818603515625, 0.2413787841796875, 0.24993896484375, 0.2584991455078125, 0.267059326171875, 0.2756195068359375, 0.2841796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 7.0, 3.0, 7.0, 9.0, 15.0, 17.0, 21.0, 23.0, 23.0, 28.0, 40.0, 47.0, 31.0, 45.0, 38.0, 46.0, 52.0, 53.0, 59.0, 67.0, 46.0, 47.0, 47.0, 29.0, 36.0, 21.0, 23.0, 20.0, 21.0, 10.0, 13.0, 19.0, 11.0, 8.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298583984375, -0.29010009765625, -0.2816162109375, -0.27313232421875, -0.2646484375, -0.25616455078125, -0.2476806640625, -0.23919677734375, -0.230712890625, -0.22222900390625, -0.2137451171875, -0.20526123046875, -0.19677734375, -0.18829345703125, -0.1798095703125, -0.17132568359375, -0.162841796875, -0.15435791015625, -0.1458740234375, -0.13739013671875, -0.12890625, -0.12042236328125, -0.1119384765625, -0.10345458984375, -0.094970703125, -0.08648681640625, -0.0780029296875, -0.06951904296875, -0.06103515625, -0.05255126953125, -0.0440673828125, -0.03558349609375, -0.027099609375, -0.01861572265625, -0.0101318359375, -0.00164794921875, 0.0068359375, 0.01531982421875, 0.0238037109375, 0.03228759765625, 0.040771484375, 0.04925537109375, 0.0577392578125, 0.06622314453125, 0.07470703125, 0.08319091796875, 0.0916748046875, 0.10015869140625, 0.108642578125, 0.11712646484375, 0.1256103515625, 0.13409423828125, 0.142578125, 0.15106201171875, 0.1595458984375, 0.16802978515625, 0.176513671875, 0.18499755859375, 0.1934814453125, 0.20196533203125, 0.21044921875, 0.21893310546875, 0.2274169921875, 0.23590087890625, 0.244384765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 0.0, 3.0, 8.0, 11.0, 22.0, 28.0, 48.0, 84.0, 172.0, 381.0, 937.0, 2669.0, 10322.0, 80894.0, 711119.0, 212262.0, 22752.0, 4402.0, 1406.0, 533.0, 229.0, 128.0, 58.0, 44.0, 24.0, 5.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2254638671875, -0.218353271484375, -0.21124267578125, -0.204132080078125, -0.197021484375, -0.189910888671875, -0.18280029296875, -0.175689697265625, -0.1685791015625, -0.161468505859375, -0.15435791015625, -0.147247314453125, -0.14013671875, -0.133026123046875, -0.12591552734375, -0.118804931640625, -0.1116943359375, -0.104583740234375, -0.09747314453125, -0.090362548828125, -0.083251953125, -0.076141357421875, -0.06903076171875, -0.061920166015625, -0.0548095703125, -0.047698974609375, -0.04058837890625, -0.033477783203125, -0.0263671875, -0.019256591796875, -0.01214599609375, -0.005035400390625, 0.0020751953125, 0.009185791015625, 0.01629638671875, 0.023406982421875, 0.030517578125, 0.037628173828125, 0.04473876953125, 0.051849365234375, 0.0589599609375, 0.066070556640625, 0.07318115234375, 0.080291748046875, 0.08740234375, 0.094512939453125, 0.10162353515625, 0.108734130859375, 0.1158447265625, 0.122955322265625, 0.13006591796875, 0.137176513671875, 0.144287109375, 0.151397705078125, 0.15850830078125, 0.165618896484375, 0.1727294921875, 0.179840087890625, 0.18695068359375, 0.194061279296875, 0.201171875, 0.208282470703125, 0.21539306640625, 0.222503662109375, 0.2296142578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 13.0, 16.0, 10.0, 35.0, 27.0, 35.0, 59.0, 74.0, 82.0, 98.0, 74.0, 86.0, 66.0, 74.0, 52.0, 47.0, 26.0, 35.0, 22.0, 28.0, 9.0, 10.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6862831115722656e-05, -5.464628338813782e-05, -5.242973566055298e-05, -5.021318793296814e-05, -4.79966402053833e-05, -4.578009247779846e-05, -4.356354475021362e-05, -4.1346997022628784e-05, -3.9130449295043945e-05, -3.6913901567459106e-05, -3.469735383987427e-05, -3.248080611228943e-05, -3.026425838470459e-05, -2.804771065711975e-05, -2.5831162929534912e-05, -2.3614615201950073e-05, -2.1398067474365234e-05, -1.9181519746780396e-05, -1.6964972019195557e-05, -1.4748424291610718e-05, -1.2531876564025879e-05, -1.031532883644104e-05, -8.098781108856201e-06, -5.882233381271362e-06, -3.6656856536865234e-06, -1.4491379261016846e-06, 7.674098014831543e-07, 2.983957529067993e-06, 5.200505256652832e-06, 7.417052984237671e-06, 9.63360071182251e-06, 1.1850148439407349e-05, 1.4066696166992188e-05, 1.6283243894577026e-05, 1.8499791622161865e-05, 2.0716339349746704e-05, 2.2932887077331543e-05, 2.5149434804916382e-05, 2.736598253250122e-05, 2.958253026008606e-05, 3.17990779876709e-05, 3.401562571525574e-05, 3.6232173442840576e-05, 3.8448721170425415e-05, 4.0665268898010254e-05, 4.288181662559509e-05, 4.509836435317993e-05, 4.731491208076477e-05, 4.953145980834961e-05, 5.174800753593445e-05, 5.396455526351929e-05, 5.6181102991104126e-05, 5.8397650718688965e-05, 6.0614198446273804e-05, 6.283074617385864e-05, 6.504729390144348e-05, 6.726384162902832e-05, 6.948038935661316e-05, 7.1696937084198e-05, 7.391348481178284e-05, 7.613003253936768e-05, 7.834658026695251e-05, 8.056312799453735e-05, 8.277967572212219e-05, 8.499622344970703e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 7.0, 11.0, 25.0, 22.0, 25.0, 38.0, 58.0, 100.0, 137.0, 242.0, 340.0, 749.0, 1654.0, 4003.0, 12820.0, 59535.0, 361456.0, 497028.0, 84222.0, 17208.0, 4943.0, 1887.0, 860.0, 470.0, 260.0, 143.0, 91.0, 69.0, 45.0, 25.0, 30.0, 17.0, 10.0, 6.0, 2.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.172119140625, -0.16721534729003906, -0.16231155395507812, -0.1574077606201172, -0.15250396728515625, -0.1476001739501953, -0.14269638061523438, -0.13779258728027344, -0.1328887939453125, -0.12798500061035156, -0.12308120727539062, -0.11817741394042969, -0.11327362060546875, -0.10836982727050781, -0.10346603393554688, -0.09856224060058594, -0.093658447265625, -0.08875465393066406, -0.08385086059570312, -0.07894706726074219, -0.07404327392578125, -0.06913948059082031, -0.06423568725585938, -0.05933189392089844, -0.0544281005859375, -0.04952430725097656, -0.044620513916015625, -0.03971672058105469, -0.03481292724609375, -0.029909133911132812, -0.025005340576171875, -0.020101547241210938, -0.01519775390625, -0.010293960571289062, -0.005390167236328125, -0.0004863739013671875, 0.00441741943359375, 0.009321212768554688, 0.014225006103515625, 0.019128799438476562, 0.0240325927734375, 0.028936386108398438, 0.033840179443359375, 0.03874397277832031, 0.04364776611328125, 0.04855155944824219, 0.053455352783203125, 0.05835914611816406, 0.063262939453125, 0.06816673278808594, 0.07307052612304688, 0.07797431945800781, 0.08287811279296875, 0.08778190612792969, 0.09268569946289062, 0.09758949279785156, 0.1024932861328125, 0.10739707946777344, 0.11230087280273438, 0.11720466613769531, 0.12210845947265625, 0.1270122528076172, 0.13191604614257812, 0.13681983947753906, 0.1417236328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 5.0, 8.0, 14.0, 15.0, 18.0, 23.0, 28.0, 34.0, 37.0, 46.0, 68.0, 74.0, 99.0, 77.0, 84.0, 63.0, 56.0, 42.0, 42.0, 36.0, 15.0, 18.0, 10.0, 18.0, 7.0, 7.0, 11.0, 9.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10479736328125, -0.10106563568115234, -0.09733390808105469, -0.09360218048095703, -0.08987045288085938, -0.08613872528076172, -0.08240699768066406, -0.0786752700805664, -0.07494354248046875, -0.0712118148803711, -0.06748008728027344, -0.06374835968017578, -0.060016632080078125, -0.05628490447998047, -0.05255317687988281, -0.048821449279785156, -0.0450897216796875, -0.041357994079589844, -0.03762626647949219, -0.03389453887939453, -0.030162811279296875, -0.02643108367919922, -0.022699356079101562, -0.018967628479003906, -0.01523590087890625, -0.011504173278808594, -0.0077724456787109375, -0.004040718078613281, -0.000308990478515625, 0.0034227371215820312, 0.0071544647216796875, 0.010886192321777344, 0.014617919921875, 0.018349647521972656, 0.022081375122070312, 0.02581310272216797, 0.029544830322265625, 0.03327655792236328, 0.03700828552246094, 0.040740013122558594, 0.04447174072265625, 0.048203468322753906, 0.05193519592285156, 0.05566692352294922, 0.059398651123046875, 0.06313037872314453, 0.06686210632324219, 0.07059383392333984, 0.0743255615234375, 0.07805728912353516, 0.08178901672363281, 0.08552074432373047, 0.08925247192382812, 0.09298419952392578, 0.09671592712402344, 0.1004476547241211, 0.10417938232421875, 0.1079111099243164, 0.11164283752441406, 0.11537456512451172, 0.11910629272460938, 0.12283802032470703, 0.1265697479248047, 0.13030147552490234, 0.134033203125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 21.0, 41.0, 68.0, 112.0, 138.0, 149.0, 140.0, 131.0, 71.0, 47.0, 32.0, 26.0, 9.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6079115867614746, -2.5323643684387207, -2.456817150115967, -2.381269931793213, -2.305722713470459, -2.230175733566284, -2.1546285152435303, -2.0790812969207764, -2.0035340785980225, -1.9279868602752686, -1.8524396419525146, -1.7768925428390503, -1.7013453245162964, -1.6257981061935425, -1.5502510070800781, -1.4747037887573242, -1.3991565704345703, -1.3236093521118164, -1.2480621337890625, -1.1725150346755981, -1.0969678163528442, -1.0214205980300903, -0.9458734393119812, -0.8703262805938721, -0.7947790622711182, -0.7192318439483643, -0.6436846852302551, -0.568137526512146, -0.4925903081893921, -0.41704311966896057, -0.34149593114852905, -0.2659487724304199, -0.19040131568908691, -0.1148541271686554, -0.03930693864822388, 0.03624024987220764, 0.11178743839263916, 0.18733462691307068, 0.2628818154335022, 0.33842897415161133, 0.41397619247436523, 0.48952338099479675, 0.5650705695152283, 0.6406177282333374, 0.7161649465560913, 0.7917121648788452, 0.8672593235969543, 0.9428064823150635, 1.0183537006378174, 1.0939009189605713, 1.1694481372833252, 1.2449952363967896, 1.3205424547195435, 1.3960896730422974, 1.4716367721557617, 1.5471839904785156, 1.6227312088012695, 1.6982784271240234, 1.7738256454467773, 1.8493727445602417, 1.9249199628829956, 2.00046706199646, 2.076014280319214, 2.1515614986419678, 2.2271087169647217]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 4.0, 9.0, 14.0, 10.0, 16.0, 15.0, 20.0, 15.0, 22.0, 30.0, 27.0, 35.0, 36.0, 36.0, 47.0, 41.0, 37.0, 54.0, 37.0, 49.0, 42.0, 41.0, 32.0, 44.0, 40.0, 29.0, 29.0, 24.0, 32.0, 20.0, 18.0, 16.0, 18.0, 6.0, 7.0, 7.0, 7.0, 5.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-1.4591898918151855, -1.4181658029556274, -1.3771418333053589, -1.3361177444458008, -1.2950937747955322, -1.2540696859359741, -1.213045597076416, -1.1720216274261475, -1.1309975385665894, -1.0899734497070312, -1.0489494800567627, -1.0079253911972046, -0.9669013619422913, -0.9258773326873779, -0.8848533034324646, -0.8438292741775513, -0.8028052449226379, -0.7617812156677246, -0.7207571864128113, -0.679733157157898, -0.6387090682983398, -0.5976850390434265, -0.5566610097885132, -0.5156369209289551, -0.47461292147636414, -0.4335888922214508, -0.3925648331642151, -0.35154080390930176, -0.3105167746543884, -0.2694927155971527, -0.22846868634223938, -0.18744462728500366, -0.14642059803009033, -0.10539655387401581, -0.06437251716852188, -0.023348480463027954, 0.01767556369304657, 0.058699607849121094, 0.09972363710403442, 0.14074769616127014, 0.18177172541618347, 0.222795769572258, 0.2638198137283325, 0.30484384298324585, 0.3458678722381592, 0.3868919312953949, 0.4279159605503082, 0.46894001960754395, 0.5099640488624573, 0.5509880781173706, 0.5920121073722839, 0.6330361366271973, 0.6740602254867554, 0.7150842547416687, 0.756108283996582, 0.7971323728561401, 0.8381563425064087, 0.879180371761322, 0.9202044010162354, 0.9612284898757935, 1.002252459526062, 1.0432765483856201, 1.0843005180358887, 1.1253246068954468, 1.1663486957550049]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 7.0, 13.0, 23.0, 16.0, 33.0, 38.0, 60.0, 72.0, 128.0, 190.0, 309.0, 493.0, 735.0, 1283.0, 2280.0, 4286.0, 8756.0, 19914.0, 53330.0, 195645.0, 2829591.0, 877274.0, 128091.0, 40027.0, 15906.0, 7166.0, 3631.0, 1973.0, 1113.0, 653.0, 390.0, 279.0, 177.0, 103.0, 76.0, 63.0, 39.0, 24.0, 19.0, 16.0, 13.0, 8.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.190185546875, -0.18421554565429688, -0.17824554443359375, -0.17227554321289062, -0.1663055419921875, -0.16033554077148438, -0.15436553955078125, -0.14839553833007812, -0.142425537109375, -0.13645553588867188, -0.13048553466796875, -0.12451553344726562, -0.1185455322265625, -0.11257553100585938, -0.10660552978515625, -0.10063552856445312, -0.09466552734375, -0.08869552612304688, -0.08272552490234375, -0.07675552368164062, -0.0707855224609375, -0.06481552124023438, -0.05884552001953125, -0.052875518798828125, -0.046905517578125, -0.040935516357421875, -0.03496551513671875, -0.028995513916015625, -0.0230255126953125, -0.017055511474609375, -0.01108551025390625, -0.005115509033203125, 0.0008544921875, 0.006824493408203125, 0.01279449462890625, 0.018764495849609375, 0.0247344970703125, 0.030704498291015625, 0.03667449951171875, 0.042644500732421875, 0.048614501953125, 0.054584503173828125, 0.06055450439453125, 0.06652450561523438, 0.0724945068359375, 0.07846450805664062, 0.08443450927734375, 0.09040451049804688, 0.09637451171875, 0.10234451293945312, 0.10831451416015625, 0.11428451538085938, 0.1202545166015625, 0.12622451782226562, 0.13219451904296875, 0.13816452026367188, 0.144134521484375, 0.15010452270507812, 0.15607452392578125, 0.16204452514648438, 0.1680145263671875, 0.17398452758789062, 0.17995452880859375, 0.18592453002929688, 0.19189453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 6.0, 0.0, 5.0, 1.0, 3.0, 6.0, 6.0, 11.0, 15.0, 18.0, 15.0, 12.0, 19.0, 16.0, 29.0, 31.0, 33.0, 51.0, 32.0, 38.0, 33.0, 52.0, 47.0, 52.0, 40.0, 50.0, 40.0, 30.0, 33.0, 45.0, 38.0, 26.0, 28.0, 20.0, 21.0, 16.0, 15.0, 19.0, 9.0, 13.0, 7.0, 11.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.052093505859375, -0.05044746398925781, -0.048801422119140625, -0.04715538024902344, -0.04550933837890625, -0.04386329650878906, -0.042217254638671875, -0.04057121276855469, -0.0389251708984375, -0.03727912902832031, -0.035633087158203125, -0.03398704528808594, -0.03234100341796875, -0.030694961547851562, -0.029048919677734375, -0.027402877807617188, -0.0257568359375, -0.024110794067382812, -0.022464752197265625, -0.020818710327148438, -0.01917266845703125, -0.017526626586914062, -0.015880584716796875, -0.014234542846679688, -0.0125885009765625, -0.010942459106445312, -0.009296417236328125, -0.0076503753662109375, -0.00600433349609375, -0.0043582916259765625, -0.002712249755859375, -0.0010662078857421875, 0.000579833984375, 0.0022258758544921875, 0.003871917724609375, 0.0055179595947265625, 0.00716400146484375, 0.008810043334960938, 0.010456085205078125, 0.012102127075195312, 0.0137481689453125, 0.015394210815429688, 0.017040252685546875, 0.018686294555664062, 0.02033233642578125, 0.021978378295898438, 0.023624420166015625, 0.025270462036132812, 0.02691650390625, 0.028562545776367188, 0.030208587646484375, 0.03185462951660156, 0.03350067138671875, 0.03514671325683594, 0.036792755126953125, 0.03843879699707031, 0.0400848388671875, 0.04173088073730469, 0.043376922607421875, 0.04502296447753906, 0.04666900634765625, 0.04831504821777344, 0.049961090087890625, 0.05160713195800781, 0.053253173828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 14.0, 12.0, 19.0, 29.0, 32.0, 75.0, 91.0, 140.0, 217.0, 371.0, 542.0, 839.0, 1578.0, 2834.0, 6090.0, 15226.0, 46514.0, 202239.0, 2797936.0, 945123.0, 120697.0, 31672.0, 11226.0, 4980.0, 2373.0, 1333.0, 777.0, 445.0, 286.0, 192.0, 111.0, 85.0, 56.0, 37.0, 31.0, 17.0, 17.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.2715034484863281, -0.26297760009765625, -0.2544517517089844, -0.2459259033203125, -0.23740005493164062, -0.22887420654296875, -0.22034835815429688, -0.211822509765625, -0.20329666137695312, -0.19477081298828125, -0.18624496459960938, -0.1777191162109375, -0.16919326782226562, -0.16066741943359375, -0.15214157104492188, -0.14361572265625, -0.13508987426757812, -0.12656402587890625, -0.11803817749023438, -0.1095123291015625, -0.10098648071289062, -0.09246063232421875, -0.08393478393554688, -0.075408935546875, -0.06688308715820312, -0.05835723876953125, -0.049831390380859375, -0.0413055419921875, -0.032779693603515625, -0.02425384521484375, -0.015727996826171875, -0.0072021484375, 0.001323699951171875, 0.00984954833984375, 0.018375396728515625, 0.0269012451171875, 0.035427093505859375, 0.04395294189453125, 0.052478790283203125, 0.061004638671875, 0.06953048706054688, 0.07805633544921875, 0.08658218383789062, 0.0951080322265625, 0.10363388061523438, 0.11215972900390625, 0.12068557739257812, 0.12921142578125, 0.13773727416992188, 0.14626312255859375, 0.15478897094726562, 0.1633148193359375, 0.17184066772460938, 0.18036651611328125, 0.18889236450195312, 0.197418212890625, 0.20594406127929688, 0.21446990966796875, 0.22299575805664062, 0.2315216064453125, 0.24004745483398438, 0.24857330322265625, 0.2570991516113281, 0.265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 6.0, 7.0, 13.0, 18.0, 17.0, 34.0, 73.0, 105.0, 202.0, 443.0, 1716.0, 766.0, 318.0, 131.0, 84.0, 50.0, 34.0, 11.0, 9.0, 11.0, 10.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.19438552856445312, -0.18784332275390625, -0.18130111694335938, -0.1747589111328125, -0.16821670532226562, -0.16167449951171875, -0.15513229370117188, -0.148590087890625, -0.14204788208007812, -0.13550567626953125, -0.12896347045898438, -0.1224212646484375, -0.11587905883789062, -0.10933685302734375, -0.10279464721679688, -0.09625244140625, -0.08971023559570312, -0.08316802978515625, -0.07662582397460938, -0.0700836181640625, -0.06354141235351562, -0.05699920654296875, -0.050457000732421875, -0.043914794921875, -0.037372589111328125, -0.03083038330078125, -0.024288177490234375, -0.0177459716796875, -0.011203765869140625, -0.00466156005859375, 0.001880645751953125, 0.0084228515625, 0.014965057373046875, 0.02150726318359375, 0.028049468994140625, 0.0345916748046875, 0.041133880615234375, 0.04767608642578125, 0.054218292236328125, 0.060760498046875, 0.06730270385742188, 0.07384490966796875, 0.08038711547851562, 0.0869293212890625, 0.09347152709960938, 0.10001373291015625, 0.10655593872070312, 0.11309814453125, 0.11964035034179688, 0.12618255615234375, 0.13272476196289062, 0.1392669677734375, 0.14580917358398438, 0.15235137939453125, 0.15889358520507812, 0.165435791015625, 0.17197799682617188, 0.17852020263671875, 0.18506240844726562, 0.1916046142578125, 0.19814682006835938, 0.20468902587890625, 0.21123123168945312, 0.2177734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 11.0, 30.0, 38.0, 62.0, 93.0, 106.0, 129.0, 150.0, 119.0, 88.0, 74.0, 41.0, 22.0, 20.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5917373895645142, -0.5554035902023315, -0.5190697908401489, -0.4827359914779663, -0.4464021921157837, -0.4100683927536011, -0.37373459339141846, -0.33740079402923584, -0.3010669946670532, -0.2647331953048706, -0.228399395942688, -0.19206559658050537, -0.15573179721832275, -0.11939799785614014, -0.08306419849395752, -0.0467303991317749, -0.010396599769592285, 0.025937199592590332, 0.06227099895477295, 0.09860479831695557, 0.13493859767913818, 0.1712723970413208, 0.20760619640350342, 0.24393999576568604, 0.28027379512786865, 0.31660759449005127, 0.3529413938522339, 0.3892751932144165, 0.4256089925765991, 0.46194279193878174, 0.49827659130096436, 0.534610390663147, 0.5709443092346191, 0.6072781085968018, 0.6436119079589844, 0.679945707321167, 0.7162795066833496, 0.7526133060455322, 0.7889471054077148, 0.8252809047698975, 0.8616147041320801, 0.8979485034942627, 0.9342823028564453, 0.9706161022186279, 1.0069499015808105, 1.0432837009429932, 1.0796175003051758, 1.1159512996673584, 1.152285099029541, 1.1886188983917236, 1.2249526977539062, 1.2612864971160889, 1.2976202964782715, 1.333954095840454, 1.3702878952026367, 1.4066216945648193, 1.442955493927002, 1.4792892932891846, 1.5156230926513672, 1.5519568920135498, 1.5882906913757324, 1.624624490737915, 1.6609582901000977, 1.6972920894622803, 1.733625888824463]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 5.0, 8.0, 8.0, 13.0, 10.0, 14.0, 18.0, 15.0, 15.0, 25.0, 29.0, 28.0, 48.0, 36.0, 36.0, 41.0, 44.0, 43.0, 57.0, 50.0, 46.0, 45.0, 28.0, 30.0, 39.0, 31.0, 38.0, 29.0, 25.0, 18.0, 30.0, 19.0, 20.0, 10.0, 7.0, 8.0, 9.0, 7.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4947463870048523, -0.476949006319046, -0.45915162563323975, -0.44135424494743347, -0.4235568642616272, -0.4057595133781433, -0.38796213269233704, -0.37016475200653076, -0.3523673713207245, -0.3345699906349182, -0.31677260994911194, -0.29897522926330566, -0.2811778783798218, -0.2633804678916931, -0.24558311700820923, -0.22778573632240295, -0.20998835563659668, -0.1921909749507904, -0.17439359426498413, -0.15659622848033905, -0.13879884779453278, -0.1210014671087265, -0.10320409387350082, -0.08540672063827515, -0.06760933995246887, -0.049811962991952896, -0.03201458603143692, -0.014217209070920944, 0.0035801678895950317, 0.021377548575401306, 0.039174921810626984, 0.05697229504585266, 0.07476961612701416, 0.09256699681282043, 0.11036437004804611, 0.1281617432832718, 0.14595912396907806, 0.16375650465488434, 0.18155387043952942, 0.1993512511253357, 0.21714863181114197, 0.23494601249694824, 0.2527433931827545, 0.2705407738685608, 0.2883381247520447, 0.30613553524017334, 0.3239328861236572, 0.3417302668094635, 0.3595276474952698, 0.37732502818107605, 0.3951224088668823, 0.4129197895526886, 0.4307171702384949, 0.44851452112197876, 0.46631190180778503, 0.4841092824935913, 0.5019066333770752, 0.5197039842605591, 0.5375013947486877, 0.5552987456321716, 0.5730961561203003, 0.5908935070037842, 0.6086909174919128, 0.6264882683753967, 0.6442856788635254]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 19.0, 21.0, 41.0, 49.0, 64.0, 97.0, 165.0, 219.0, 338.0, 546.0, 867.0, 1444.0, 2486.0, 4168.0, 7517.0, 14060.0, 26987.0, 51927.0, 96208.0, 168435.0, 227097.0, 192823.0, 116802.0, 63609.0, 32887.0, 17654.0, 9446.0, 5127.0, 2878.0, 1708.0, 989.0, 615.0, 434.0, 237.0, 162.0, 116.0, 101.0, 57.0, 42.0, 28.0, 19.0, 16.0, 10.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1314697265625, -0.1271820068359375, -0.122894287109375, -0.1186065673828125, -0.11431884765625, -0.1100311279296875, -0.105743408203125, -0.1014556884765625, -0.09716796875, -0.0928802490234375, -0.088592529296875, -0.0843048095703125, -0.08001708984375, -0.0757293701171875, -0.071441650390625, -0.0671539306640625, -0.0628662109375, -0.0585784912109375, -0.054290771484375, -0.0500030517578125, -0.04571533203125, -0.0414276123046875, -0.037139892578125, -0.0328521728515625, -0.028564453125, -0.0242767333984375, -0.019989013671875, -0.0157012939453125, -0.01141357421875, -0.0071258544921875, -0.002838134765625, 0.0014495849609375, 0.0057373046875, 0.0100250244140625, 0.014312744140625, 0.0186004638671875, 0.02288818359375, 0.0271759033203125, 0.031463623046875, 0.0357513427734375, 0.0400390625, 0.0443267822265625, 0.048614501953125, 0.0529022216796875, 0.05718994140625, 0.0614776611328125, 0.065765380859375, 0.0700531005859375, 0.0743408203125, 0.0786285400390625, 0.082916259765625, 0.0872039794921875, 0.09149169921875, 0.0957794189453125, 0.100067138671875, 0.1043548583984375, 0.108642578125, 0.1129302978515625, 0.117218017578125, 0.1215057373046875, 0.12579345703125, 0.1300811767578125, 0.134368896484375, 0.1386566162109375, 0.1429443359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 8.0, 10.0, 15.0, 5.0, 26.0, 12.0, 18.0, 22.0, 25.0, 23.0, 45.0, 34.0, 38.0, 45.0, 47.0, 43.0, 49.0, 45.0, 44.0, 53.0, 50.0, 40.0, 40.0, 37.0, 28.0, 36.0, 38.0, 13.0, 16.0, 14.0, 10.0, 21.0, 5.0, 15.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055511474609375, -0.0535426139831543, -0.051573753356933594, -0.04960489273071289, -0.04763603210449219, -0.045667171478271484, -0.04369831085205078, -0.04172945022583008, -0.039760589599609375, -0.03779172897338867, -0.03582286834716797, -0.033854007720947266, -0.03188514709472656, -0.02991628646850586, -0.027947425842285156, -0.025978565216064453, -0.02400970458984375, -0.022040843963623047, -0.020071983337402344, -0.01810312271118164, -0.016134262084960938, -0.014165401458740234, -0.012196540832519531, -0.010227680206298828, -0.008258819580078125, -0.006289958953857422, -0.004321098327636719, -0.0023522377014160156, -0.0003833770751953125, 0.0015854835510253906, 0.0035543441772460938, 0.005523204803466797, 0.0074920654296875, 0.009460926055908203, 0.011429786682128906, 0.01339864730834961, 0.015367507934570312, 0.017336368560791016, 0.01930522918701172, 0.021274089813232422, 0.023242950439453125, 0.025211811065673828, 0.02718067169189453, 0.029149532318115234, 0.031118392944335938, 0.03308725357055664, 0.035056114196777344, 0.03702497482299805, 0.03899383544921875, 0.04096269607543945, 0.042931556701660156, 0.04490041732788086, 0.04686927795410156, 0.048838138580322266, 0.05080699920654297, 0.05277585983276367, 0.054744720458984375, 0.05671358108520508, 0.05868244171142578, 0.060651302337646484, 0.06262016296386719, 0.06458902359008789, 0.0665578842163086, 0.0685267448425293, 0.07049560546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 13.0, 21.0, 25.0, 37.0, 38.0, 64.0, 80.0, 127.0, 185.0, 279.0, 481.0, 805.0, 1683.0, 4762.0, 19146.0, 110461.0, 522701.0, 317940.0, 53292.0, 10357.0, 2998.0, 1226.0, 642.0, 416.0, 279.0, 150.0, 110.0, 70.0, 38.0, 29.0, 28.0, 13.0, 12.0, 7.0, 10.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.31790924072265625, -0.3064727783203125, -0.29503631591796875, -0.283599853515625, -0.27216339111328125, -0.2607269287109375, -0.24929046630859375, -0.23785400390625, -0.22641754150390625, -0.2149810791015625, -0.20354461669921875, -0.192108154296875, -0.18067169189453125, -0.1692352294921875, -0.15779876708984375, -0.1463623046875, -0.13492584228515625, -0.1234893798828125, -0.11205291748046875, -0.100616455078125, -0.08917999267578125, -0.0777435302734375, -0.06630706787109375, -0.05487060546875, -0.04343414306640625, -0.0319976806640625, -0.02056121826171875, -0.009124755859375, 0.00231170654296875, 0.0137481689453125, 0.02518463134765625, 0.03662109375, 0.04805755615234375, 0.0594940185546875, 0.07093048095703125, 0.082366943359375, 0.09380340576171875, 0.1052398681640625, 0.11667633056640625, 0.12811279296875, 0.13954925537109375, 0.1509857177734375, 0.16242218017578125, 0.173858642578125, 0.18529510498046875, 0.1967315673828125, 0.20816802978515625, 0.2196044921875, 0.23104095458984375, 0.2424774169921875, 0.25391387939453125, 0.265350341796875, 0.27678680419921875, 0.2882232666015625, 0.29965972900390625, 0.31109619140625, 0.32253265380859375, 0.3339691162109375, 0.34540557861328125, 0.356842041015625, 0.36827850341796875, 0.3797149658203125, 0.39115142822265625, 0.402587890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 5.0, 8.0, 15.0, 3.0, 16.0, 10.0, 14.0, 20.0, 18.0, 15.0, 29.0, 24.0, 34.0, 30.0, 36.0, 43.0, 36.0, 48.0, 48.0, 53.0, 50.0, 34.0, 43.0, 50.0, 39.0, 29.0, 36.0, 28.0, 30.0, 24.0, 15.0, 14.0, 18.0, 23.0, 17.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.344482421875, -0.3341560363769531, -0.32382965087890625, -0.3135032653808594, -0.3031768798828125, -0.2928504943847656, -0.28252410888671875, -0.2721977233886719, -0.261871337890625, -0.2515449523925781, -0.24121856689453125, -0.23089218139648438, -0.2205657958984375, -0.21023941040039062, -0.19991302490234375, -0.18958663940429688, -0.17926025390625, -0.16893386840820312, -0.15860748291015625, -0.14828109741210938, -0.1379547119140625, -0.12762832641601562, -0.11730194091796875, -0.10697555541992188, -0.096649169921875, -0.08632278442382812, -0.07599639892578125, -0.06567001342773438, -0.0553436279296875, -0.045017242431640625, -0.03469085693359375, -0.024364471435546875, -0.0140380859375, -0.003711700439453125, 0.00661468505859375, 0.016941070556640625, 0.0272674560546875, 0.037593841552734375, 0.04792022705078125, 0.058246612548828125, 0.068572998046875, 0.07889938354492188, 0.08922576904296875, 0.09955215454101562, 0.1098785400390625, 0.12020492553710938, 0.13053131103515625, 0.14085769653320312, 0.15118408203125, 0.16151046752929688, 0.17183685302734375, 0.18216323852539062, 0.1924896240234375, 0.20281600952148438, 0.21314239501953125, 0.22346878051757812, 0.233795166015625, 0.24412155151367188, 0.25444793701171875, 0.2647743225097656, 0.2751007080078125, 0.2854270935058594, 0.29575347900390625, 0.3060798645019531, 0.31640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 12.0, 1.0, 12.0, 14.0, 10.0, 33.0, 42.0, 46.0, 100.0, 127.0, 205.0, 347.0, 626.0, 1289.0, 2791.0, 7116.0, 23598.0, 119434.0, 516269.0, 300482.0, 54477.0, 13049.0, 4461.0, 1869.0, 954.0, 475.0, 261.0, 175.0, 97.0, 62.0, 29.0, 33.0, 24.0, 8.0, 8.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18505859375, -0.17923355102539062, -0.17340850830078125, -0.16758346557617188, -0.1617584228515625, -0.15593338012695312, -0.15010833740234375, -0.14428329467773438, -0.138458251953125, -0.13263320922851562, -0.12680816650390625, -0.12098312377929688, -0.1151580810546875, -0.10933303833007812, -0.10350799560546875, -0.09768295288085938, -0.09185791015625, -0.08603286743164062, -0.08020782470703125, -0.07438278198242188, -0.0685577392578125, -0.06273269653320312, -0.05690765380859375, -0.051082611083984375, -0.045257568359375, -0.039432525634765625, -0.03360748291015625, -0.027782440185546875, -0.0219573974609375, -0.016132354736328125, -0.01030731201171875, -0.004482269287109375, 0.0013427734375, 0.007167816162109375, 0.01299285888671875, 0.018817901611328125, 0.0246429443359375, 0.030467987060546875, 0.03629302978515625, 0.042118072509765625, 0.047943115234375, 0.053768157958984375, 0.05959320068359375, 0.06541824340820312, 0.0712432861328125, 0.07706832885742188, 0.08289337158203125, 0.08871841430664062, 0.09454345703125, 0.10036849975585938, 0.10619354248046875, 0.11201858520507812, 0.1178436279296875, 0.12366867065429688, 0.12949371337890625, 0.13531875610351562, 0.141143798828125, 0.14696884155273438, 0.15279388427734375, 0.15861892700195312, 0.1644439697265625, 0.17026901245117188, 0.17609405517578125, 0.18191909790039062, 0.187744140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 6.0, 12.0, 12.0, 17.0, 24.0, 23.0, 26.0, 32.0, 43.0, 55.0, 55.0, 67.0, 76.0, 59.0, 62.0, 76.0, 60.0, 46.0, 47.0, 38.0, 42.0, 26.0, 18.0, 12.0, 13.0, 10.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.11679458618164e-05, -6.905663758516312e-05, -6.694532930850983e-05, -6.483402103185654e-05, -6.272271275520325e-05, -6.061140447854996e-05, -5.850009620189667e-05, -5.638878792524338e-05, -5.427747964859009e-05, -5.21661713719368e-05, -5.005486309528351e-05, -4.794355481863022e-05, -4.583224654197693e-05, -4.372093826532364e-05, -4.160962998867035e-05, -3.949832171201706e-05, -3.738701343536377e-05, -3.527570515871048e-05, -3.316439688205719e-05, -3.10530886054039e-05, -2.894178032875061e-05, -2.683047205209732e-05, -2.471916377544403e-05, -2.260785549879074e-05, -2.049654722213745e-05, -1.838523894548416e-05, -1.627393066883087e-05, -1.4162622392177582e-05, -1.2051314115524292e-05, -9.940005838871002e-06, -7.828697562217712e-06, -5.717389285564423e-06, -3.606081008911133e-06, -1.494772732257843e-06, 6.165355443954468e-07, 2.7278438210487366e-06, 4.839152097702026e-06, 6.950460374355316e-06, 9.061768651008606e-06, 1.1173076927661896e-05, 1.3284385204315186e-05, 1.5395693480968475e-05, 1.7507001757621765e-05, 1.9618310034275055e-05, 2.1729618310928345e-05, 2.3840926587581635e-05, 2.5952234864234924e-05, 2.8063543140888214e-05, 3.0174851417541504e-05, 3.2286159694194794e-05, 3.4397467970848083e-05, 3.650877624750137e-05, 3.862008452415466e-05, 4.073139280080795e-05, 4.284270107746124e-05, 4.495400935411453e-05, 4.706531763076782e-05, 4.917662590742111e-05, 5.12879341840744e-05, 5.339924246072769e-05, 5.551055073738098e-05, 5.762185901403427e-05, 5.973316729068756e-05, 6.184447556734085e-05, 6.395578384399414e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 6.0, 13.0, 12.0, 15.0, 29.0, 43.0, 58.0, 109.0, 195.0, 331.0, 707.0, 1652.0, 4507.0, 16301.0, 97994.0, 599505.0, 278869.0, 35457.0, 7953.0, 2649.0, 1023.0, 496.0, 245.0, 133.0, 88.0, 61.0, 31.0, 15.0, 16.0, 7.0, 5.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21728515625, -0.21043968200683594, -0.20359420776367188, -0.1967487335205078, -0.18990325927734375, -0.1830577850341797, -0.17621231079101562, -0.16936683654785156, -0.1625213623046875, -0.15567588806152344, -0.14883041381835938, -0.1419849395751953, -0.13513946533203125, -0.1282939910888672, -0.12144851684570312, -0.11460304260253906, -0.107757568359375, -0.10091209411621094, -0.09406661987304688, -0.08722114562988281, -0.08037567138671875, -0.07353019714355469, -0.06668472290039062, -0.05983924865722656, -0.0529937744140625, -0.04614830017089844, -0.039302825927734375, -0.03245735168457031, -0.02561187744140625, -0.018766403198242188, -0.011920928955078125, -0.0050754547119140625, 0.00177001953125, 0.008615493774414062, 0.015460968017578125, 0.022306442260742188, 0.02915191650390625, 0.03599739074707031, 0.042842864990234375, 0.04968833923339844, 0.0565338134765625, 0.06337928771972656, 0.07022476196289062, 0.07707023620605469, 0.08391571044921875, 0.09076118469238281, 0.09760665893554688, 0.10445213317871094, 0.111297607421875, 0.11814308166503906, 0.12498855590820312, 0.1318340301513672, 0.13867950439453125, 0.1455249786376953, 0.15237045288085938, 0.15921592712402344, 0.1660614013671875, 0.17290687561035156, 0.17975234985351562, 0.1865978240966797, 0.19344329833984375, 0.2002887725830078, 0.20713424682617188, 0.21397972106933594, 0.2208251953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 8.0, 6.0, 10.0, 22.0, 32.0, 34.0, 63.0, 80.0, 93.0, 108.0, 117.0, 103.0, 82.0, 58.0, 56.0, 34.0, 27.0, 19.0, 12.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155029296875, -0.148895263671875, -0.14276123046875, -0.136627197265625, -0.1304931640625, -0.124359130859375, -0.11822509765625, -0.112091064453125, -0.10595703125, -0.099822998046875, -0.09368896484375, -0.087554931640625, -0.0814208984375, -0.075286865234375, -0.06915283203125, -0.063018798828125, -0.056884765625, -0.050750732421875, -0.04461669921875, -0.038482666015625, -0.0323486328125, -0.026214599609375, -0.02008056640625, -0.013946533203125, -0.0078125, -0.001678466796875, 0.00445556640625, 0.010589599609375, 0.0167236328125, 0.022857666015625, 0.02899169921875, 0.035125732421875, 0.041259765625, 0.047393798828125, 0.05352783203125, 0.059661865234375, 0.0657958984375, 0.071929931640625, 0.07806396484375, 0.084197998046875, 0.09033203125, 0.096466064453125, 0.10260009765625, 0.108734130859375, 0.1148681640625, 0.121002197265625, 0.12713623046875, 0.133270263671875, 0.139404296875, 0.145538330078125, 0.15167236328125, 0.157806396484375, 0.1639404296875, 0.170074462890625, 0.17620849609375, 0.182342529296875, 0.1884765625, 0.194610595703125, 0.20074462890625, 0.206878662109375, 0.2130126953125, 0.219146728515625, 0.22528076171875, 0.231414794921875, 0.237548828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 23.0, 38.0, 61.0, 86.0, 83.0, 124.0, 105.0, 112.0, 104.0, 85.0, 41.0, 34.0, 29.0, 18.0, 6.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.481602907180786, -2.4121639728546143, -2.3427250385284424, -2.2732861042022705, -2.2038471698760986, -2.1344079971313477, -2.064969062805176, -1.9955302476882935, -1.926091194152832, -1.8566522598266602, -1.7872133255004883, -1.7177743911743164, -1.648335337638855, -1.578896403312683, -1.5094574689865112, -1.4400185346603394, -1.3705796003341675, -1.3011406660079956, -1.2317017316818237, -1.1622626781463623, -1.0928237438201904, -1.0233848094940186, -0.9539458751678467, -0.8845069408416748, -0.8150679469108582, -0.7456290125846863, -0.6761900186538696, -0.6067510843276978, -0.5373121500015259, -0.46787315607070923, -0.39843422174453735, -0.3289952576160431, -0.25955629348754883, -0.19011732935905457, -0.1206783801317215, -0.05123943090438843, 0.018199533224105835, 0.0876384973526001, 0.15707743167877197, 0.22651639580726624, 0.2959553599357605, 0.36539432406425476, 0.434833288192749, 0.5042722225189209, 0.5737111568450928, 0.6431501507759094, 0.7125890851020813, 0.782028079032898, 0.8514670133590698, 0.9209059476852417, 0.9903449416160583, 1.059783935546875, 1.1292228698730469, 1.1986618041992188, 1.2681007385253906, 1.3375396728515625, 1.4069786071777344, 1.4764175415039062, 1.5458564758300781, 1.61529541015625, 1.6847344636917114, 1.7541733980178833, 1.8236123323440552, 1.893051266670227, 1.9624903202056885]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 6.0, 14.0, 18.0, 17.0, 20.0, 29.0, 24.0, 32.0, 27.0, 31.0, 33.0, 48.0, 49.0, 35.0, 45.0, 49.0, 47.0, 43.0, 48.0, 35.0, 55.0, 34.0, 36.0, 31.0, 34.0, 25.0, 11.0, 21.0, 21.0, 11.0, 14.0, 9.0, 7.0, 9.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.795438528060913, -1.7371033430099487, -1.6787681579589844, -1.62043297290802, -1.5620977878570557, -1.5037624835968018, -1.445427417755127, -1.387092113494873, -1.3287569284439087, -1.2704217433929443, -1.21208655834198, -1.1537513732910156, -1.0954161882400513, -1.037081003189087, -0.9787457585334778, -0.9204105138778687, -0.8620753884315491, -0.8037402033805847, -0.7454050183296204, -0.6870697736740112, -0.6287345886230469, -0.5703994035720825, -0.5120642185211182, -0.4537290036678314, -0.39539381861686707, -0.3370586335659027, -0.27872341871261597, -0.2203882336616516, -0.16205303370952606, -0.10371783375740051, -0.04538264870643616, 0.012952566146850586, 0.07128775119781494, 0.1296229511499405, 0.18795815110206604, 0.2462933361530304, 0.30462855100631714, 0.3629637360572815, 0.42129892110824585, 0.4796341359615326, 0.5379693508148193, 0.5963045358657837, 0.654639720916748, 0.7129749059677124, 0.7713101506233215, 0.8296453356742859, 0.8879805207252502, 0.9463157653808594, 1.0046508312225342, 1.0629860162734985, 1.121321201324463, 1.1796563863754272, 1.2379915714263916, 1.2963268756866455, 1.3546619415283203, 1.4129972457885742, 1.4713324308395386, 1.529667615890503, 1.5880028009414673, 1.6463379859924316, 1.704673171043396, 1.7630083560943604, 1.8213436603546143, 1.8796788454055786, 1.938014030456543]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 13.0, 21.0, 15.0, 34.0, 24.0, 44.0, 59.0, 82.0, 104.0, 154.0, 216.0, 330.0, 494.0, 680.0, 974.0, 1467.0, 2337.0, 4004.0, 7228.0, 14993.0, 40464.0, 260288.0, 3743869.0, 71913.0, 21323.0, 9543.0, 4973.0, 2980.0, 1764.0, 1197.0, 775.0, 530.0, 407.0, 267.0, 189.0, 144.0, 91.0, 78.0, 50.0, 39.0, 28.0, 24.0, 18.0, 17.0, 9.0, 11.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0], "bins": [-0.2125244140625, -0.20592498779296875, -0.1993255615234375, -0.19272613525390625, -0.186126708984375, -0.17952728271484375, -0.1729278564453125, -0.16632843017578125, -0.15972900390625, -0.15312957763671875, -0.1465301513671875, -0.13993072509765625, -0.133331298828125, -0.12673187255859375, -0.1201324462890625, -0.11353302001953125, -0.10693359375, -0.10033416748046875, -0.0937347412109375, -0.08713531494140625, -0.080535888671875, -0.07393646240234375, -0.0673370361328125, -0.06073760986328125, -0.05413818359375, -0.04753875732421875, -0.0409393310546875, -0.03433990478515625, -0.027740478515625, -0.02114105224609375, -0.0145416259765625, -0.00794219970703125, -0.0013427734375, 0.00525665283203125, 0.0118560791015625, 0.01845550537109375, 0.025054931640625, 0.03165435791015625, 0.0382537841796875, 0.04485321044921875, 0.05145263671875, 0.05805206298828125, 0.0646514892578125, 0.07125091552734375, 0.077850341796875, 0.08444976806640625, 0.0910491943359375, 0.09764862060546875, 0.104248046875, 0.11084747314453125, 0.1174468994140625, 0.12404632568359375, 0.130645751953125, 0.13724517822265625, 0.1438446044921875, 0.15044403076171875, 0.15704345703125, 0.16364288330078125, 0.1702423095703125, 0.17684173583984375, 0.183441162109375, 0.19004058837890625, 0.1966400146484375, 0.20323944091796875, 0.2098388671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 12.0, 6.0, 5.0, 6.0, 9.0, 10.0, 11.0, 18.0, 9.0, 21.0, 20.0, 25.0, 19.0, 33.0, 27.0, 47.0, 32.0, 42.0, 40.0, 49.0, 53.0, 41.0, 46.0, 53.0, 29.0, 33.0, 35.0, 38.0, 36.0, 32.0, 25.0, 23.0, 26.0, 21.0, 12.0, 9.0, 15.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06488037109375, -0.06279945373535156, -0.060718536376953125, -0.05863761901855469, -0.05655670166015625, -0.05447578430175781, -0.052394866943359375, -0.05031394958496094, -0.0482330322265625, -0.04615211486816406, -0.044071197509765625, -0.04199028015136719, -0.03990936279296875, -0.03782844543457031, -0.035747528076171875, -0.03366661071777344, -0.031585693359375, -0.029504776000976562, -0.027423858642578125, -0.025342941284179688, -0.02326202392578125, -0.021181106567382812, -0.019100189208984375, -0.017019271850585938, -0.0149383544921875, -0.012857437133789062, -0.010776519775390625, -0.008695602416992188, -0.00661468505859375, -0.0045337677001953125, -0.002452850341796875, -0.0003719329833984375, 0.001708984375, 0.0037899017333984375, 0.005870819091796875, 0.007951736450195312, 0.01003265380859375, 0.012113571166992188, 0.014194488525390625, 0.016275405883789062, 0.0183563232421875, 0.020437240600585938, 0.022518157958984375, 0.024599075317382812, 0.02667999267578125, 0.028760910034179688, 0.030841827392578125, 0.03292274475097656, 0.035003662109375, 0.03708457946777344, 0.039165496826171875, 0.04124641418457031, 0.04332733154296875, 0.04540824890136719, 0.047489166259765625, 0.04957008361816406, 0.0516510009765625, 0.05373191833496094, 0.055812835693359375, 0.05789375305175781, 0.05997467041015625, 0.06205558776855469, 0.06413650512695312, 0.06621742248535156, 0.06829833984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 8.0, 8.0, 16.0, 16.0, 32.0, 22.0, 30.0, 50.0, 53.0, 73.0, 93.0, 136.0, 205.0, 273.0, 410.0, 658.0, 1113.0, 2492.0, 6826.0, 38394.0, 3937090.0, 183114.0, 14816.0, 3929.0, 1739.0, 956.0, 538.0, 356.0, 235.0, 173.0, 105.0, 69.0, 55.0, 44.0, 41.0, 30.0, 20.0, 16.0, 8.0, 3.0, 6.0, 6.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58251953125, -0.5635833740234375, -0.544647216796875, -0.5257110595703125, -0.50677490234375, -0.4878387451171875, -0.468902587890625, -0.4499664306640625, -0.4310302734375, -0.4120941162109375, -0.393157958984375, -0.3742218017578125, -0.35528564453125, -0.3363494873046875, -0.317413330078125, -0.2984771728515625, -0.279541015625, -0.2606048583984375, -0.241668701171875, -0.2227325439453125, -0.20379638671875, -0.1848602294921875, -0.165924072265625, -0.1469879150390625, -0.1280517578125, -0.1091156005859375, -0.090179443359375, -0.0712432861328125, -0.05230712890625, -0.0333709716796875, -0.014434814453125, 0.0045013427734375, 0.0234375, 0.0423736572265625, 0.061309814453125, 0.0802459716796875, 0.09918212890625, 0.1181182861328125, 0.137054443359375, 0.1559906005859375, 0.1749267578125, 0.1938629150390625, 0.212799072265625, 0.2317352294921875, 0.25067138671875, 0.2696075439453125, 0.288543701171875, 0.3074798583984375, 0.326416015625, 0.3453521728515625, 0.364288330078125, 0.3832244873046875, 0.40216064453125, 0.4210968017578125, 0.440032958984375, 0.4589691162109375, 0.4779052734375, 0.4968414306640625, 0.515777587890625, 0.5347137451171875, 0.55364990234375, 0.5725860595703125, 0.591522216796875, 0.6104583740234375, 0.62939453125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 4.0, 19.0, 46.0, 133.0, 3339.0, 385.0, 96.0, 20.0, 9.0, 11.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26171875, -0.2558755874633789, -0.2500324249267578, -0.24418926239013672, -0.23834609985351562, -0.23250293731689453, -0.22665977478027344, -0.22081661224365234, -0.21497344970703125, -0.20913028717041016, -0.20328712463378906, -0.19744396209716797, -0.19160079956054688, -0.18575763702392578, -0.1799144744873047, -0.1740713119506836, -0.1682281494140625, -0.1623849868774414, -0.1565418243408203, -0.15069866180419922, -0.14485549926757812, -0.13901233673095703, -0.13316917419433594, -0.12732601165771484, -0.12148284912109375, -0.11563968658447266, -0.10979652404785156, -0.10395336151123047, -0.09811019897460938, -0.09226703643798828, -0.08642387390136719, -0.0805807113647461, -0.074737548828125, -0.0688943862915039, -0.06305122375488281, -0.05720806121826172, -0.051364898681640625, -0.04552173614501953, -0.03967857360839844, -0.033835411071777344, -0.02799224853515625, -0.022149085998535156, -0.016305923461914062, -0.010462760925292969, -0.004619598388671875, 0.0012235641479492188, 0.0070667266845703125, 0.012909889221191406, 0.0187530517578125, 0.024596214294433594, 0.030439376831054688, 0.03628253936767578, 0.042125701904296875, 0.04796886444091797, 0.05381202697753906, 0.059655189514160156, 0.06549835205078125, 0.07134151458740234, 0.07718467712402344, 0.08302783966064453, 0.08887100219726562, 0.09471416473388672, 0.10055732727050781, 0.1064004898071289, 0.11224365234375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 5.0, 9.0, 12.0, 13.0, 23.0, 65.0, 59.0, 65.0, 58.0, 90.0, 106.0, 110.0, 95.0, 73.0, 66.0, 53.0, 26.0, 21.0, 11.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25623372197151184, -0.24541980028152466, -0.23460589349269867, -0.2237919718027115, -0.2129780650138855, -0.20216414332389832, -0.19135022163391113, -0.18053629994392395, -0.16972239315509796, -0.15890847146511078, -0.1480945646762848, -0.1372806429862976, -0.12646672129631042, -0.11565281450748444, -0.10483889281749725, -0.09402497857809067, -0.08321106433868408, -0.0723971500992775, -0.06158323213458061, -0.05076931416988373, -0.03995539993047714, -0.029141485691070557, -0.018327564001083374, -0.007513649761676788, 0.0033002644777297974, 0.014114180579781532, 0.024928096681833267, 0.03574201464653015, 0.04655592888593674, 0.05736984312534332, 0.0681837648153305, 0.07899767905473709, 0.08981156349182129, 0.10062547773122787, 0.11143939197063446, 0.12225331366062164, 0.13306722044944763, 0.14388114213943481, 0.154695063829422, 0.16550898551940918, 0.17632289230823517, 0.18713681399822235, 0.19795072078704834, 0.20876464247703552, 0.2195785641670227, 0.2303924709558487, 0.24120639264583588, 0.25202029943466187, 0.26283422112464905, 0.27364814281463623, 0.2844620645046234, 0.2952759861946106, 0.3060898780822754, 0.3169037997722626, 0.32771772146224976, 0.33853164315223694, 0.3493455648422241, 0.3601594865322113, 0.3709734082221985, 0.3817873001098633, 0.39260122179985046, 0.40341514348983765, 0.41422906517982483, 0.425042986869812, 0.4358568787574768]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 12.0, 5.0, 8.0, 8.0, 11.0, 11.0, 17.0, 19.0, 22.0, 19.0, 24.0, 26.0, 24.0, 21.0, 29.0, 35.0, 36.0, 39.0, 33.0, 41.0, 34.0, 38.0, 38.0, 39.0, 34.0, 29.0, 34.0, 36.0, 40.0, 21.0, 23.0, 27.0, 22.0, 14.0, 23.0, 12.0, 14.0, 18.0, 11.0, 11.0, 11.0, 5.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.2018650770187378, -0.19580957293510437, -0.18975405395030975, -0.18369854986667633, -0.1776430308818817, -0.1715875267982483, -0.16553202271461487, -0.15947651863098145, -0.15342099964618683, -0.1473654955625534, -0.1413099765777588, -0.13525447249412537, -0.12919896841049194, -0.12314344942569733, -0.1170879453420639, -0.11103243380784988, -0.10497692227363586, -0.09892141073942184, -0.09286589920520782, -0.0868103951215744, -0.08075488358736038, -0.07469937205314636, -0.06864386796951294, -0.06258835643529892, -0.0565328449010849, -0.05047733336687088, -0.04442182555794716, -0.03836631774902344, -0.03231080621480942, -0.026255296543240547, -0.020199786871671677, -0.014144279062747955, -0.008088767528533936, -0.002033257856965065, 0.0040222518146038055, 0.010077761486172676, 0.016133271157741547, 0.022188780829310417, 0.028244290500879288, 0.03429979830980301, 0.04035530984401703, 0.04641082137823105, 0.05246632918715477, 0.05852183699607849, 0.06457734853029251, 0.07063286006450653, 0.07668836414813995, 0.08274387568235397, 0.088799387216568, 0.09485489875078201, 0.10091041028499603, 0.10696591436862946, 0.11302142590284348, 0.1190769374370575, 0.12513244152069092, 0.13118794560432434, 0.13724346458911896, 0.14329896867275238, 0.149354487657547, 0.15540999174118042, 0.16146549582481384, 0.16752101480960846, 0.17357651889324188, 0.1796320378780365, 0.18568754196166992]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 12.0, 7.0, 13.0, 12.0, 15.0, 29.0, 34.0, 69.0, 128.0, 246.0, 381.0, 741.0, 1380.0, 3023.0, 6265.0, 13289.0, 28625.0, 61810.0, 126473.0, 219902.0, 250813.0, 169439.0, 87982.0, 41475.0, 19024.0, 8781.0, 4197.0, 2076.0, 1036.0, 521.0, 305.0, 182.0, 84.0, 61.0, 28.0, 14.0, 14.0, 9.0, 8.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.1739501953125, -0.1687164306640625, -0.163482666015625, -0.1582489013671875, -0.15301513671875, -0.1477813720703125, -0.142547607421875, -0.1373138427734375, -0.132080078125, -0.1268463134765625, -0.121612548828125, -0.1163787841796875, -0.11114501953125, -0.1059112548828125, -0.100677490234375, -0.0954437255859375, -0.0902099609375, -0.0849761962890625, -0.079742431640625, -0.0745086669921875, -0.06927490234375, -0.0640411376953125, -0.058807373046875, -0.0535736083984375, -0.04833984375, -0.0431060791015625, -0.037872314453125, -0.0326385498046875, -0.02740478515625, -0.0221710205078125, -0.016937255859375, -0.0117034912109375, -0.0064697265625, -0.0012359619140625, 0.003997802734375, 0.0092315673828125, 0.01446533203125, 0.0196990966796875, 0.024932861328125, 0.0301666259765625, 0.035400390625, 0.0406341552734375, 0.045867919921875, 0.0511016845703125, 0.05633544921875, 0.0615692138671875, 0.066802978515625, 0.0720367431640625, 0.0772705078125, 0.0825042724609375, 0.087738037109375, 0.0929718017578125, 0.09820556640625, 0.1034393310546875, 0.108673095703125, 0.1139068603515625, 0.119140625, 0.1243743896484375, 0.129608154296875, 0.1348419189453125, 0.14007568359375, 0.1453094482421875, 0.150543212890625, 0.1557769775390625, 0.1610107421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 9.0, 11.0, 12.0, 6.0, 12.0, 9.0, 21.0, 27.0, 20.0, 19.0, 19.0, 23.0, 29.0, 41.0, 26.0, 38.0, 35.0, 30.0, 52.0, 36.0, 34.0, 39.0, 49.0, 40.0, 31.0, 38.0, 34.0, 29.0, 29.0, 28.0, 31.0, 21.0, 16.0, 25.0, 13.0, 14.0, 9.0, 4.0, 6.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.07330322265625, -0.07108592987060547, -0.06886863708496094, -0.0666513442993164, -0.06443405151367188, -0.062216758728027344, -0.05999946594238281, -0.05778217315673828, -0.05556488037109375, -0.05334758758544922, -0.05113029479980469, -0.048913002014160156, -0.046695709228515625, -0.044478416442871094, -0.04226112365722656, -0.04004383087158203, -0.0378265380859375, -0.03560924530029297, -0.03339195251464844, -0.031174659729003906, -0.028957366943359375, -0.026740074157714844, -0.024522781372070312, -0.02230548858642578, -0.02008819580078125, -0.01787090301513672, -0.015653610229492188, -0.013436317443847656, -0.011219024658203125, -0.009001731872558594, -0.0067844390869140625, -0.004567146301269531, -0.002349853515625, -0.00013256072998046875, 0.0020847320556640625, 0.004302024841308594, 0.006519317626953125, 0.008736610412597656, 0.010953903198242188, 0.013171195983886719, 0.01538848876953125, 0.01760578155517578, 0.019823074340820312, 0.022040367126464844, 0.024257659912109375, 0.026474952697753906, 0.028692245483398438, 0.03090953826904297, 0.0331268310546875, 0.03534412384033203, 0.03756141662597656, 0.039778709411621094, 0.041996002197265625, 0.044213294982910156, 0.04643058776855469, 0.04864788055419922, 0.05086517333984375, 0.05308246612548828, 0.05529975891113281, 0.057517051696777344, 0.059734344482421875, 0.061951637268066406, 0.06416893005371094, 0.06638622283935547, 0.068603515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 7.0, 5.0, 13.0, 16.0, 16.0, 25.0, 32.0, 43.0, 57.0, 79.0, 107.0, 141.0, 212.0, 298.0, 523.0, 790.0, 1285.0, 2868.0, 8393.0, 34649.0, 185715.0, 563839.0, 197340.0, 36592.0, 8805.0, 3069.0, 1407.0, 728.0, 490.0, 277.0, 205.0, 125.0, 103.0, 66.0, 57.0, 46.0, 26.0, 25.0, 19.0, 9.0, 17.0, 9.0, 5.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.364013671875, -0.3531532287597656, -0.34229278564453125, -0.3314323425292969, -0.3205718994140625, -0.3097114562988281, -0.29885101318359375, -0.2879905700683594, -0.277130126953125, -0.2662696838378906, -0.25540924072265625, -0.24454879760742188, -0.2336883544921875, -0.22282791137695312, -0.21196746826171875, -0.20110702514648438, -0.19024658203125, -0.17938613891601562, -0.16852569580078125, -0.15766525268554688, -0.1468048095703125, -0.13594436645507812, -0.12508392333984375, -0.11422348022460938, -0.103363037109375, -0.09250259399414062, -0.08164215087890625, -0.07078170776367188, -0.0599212646484375, -0.049060821533203125, -0.03820037841796875, -0.027339935302734375, -0.0164794921875, -0.005619049072265625, 0.00524139404296875, 0.016101837158203125, 0.0269622802734375, 0.037822723388671875, 0.04868316650390625, 0.059543609619140625, 0.070404052734375, 0.08126449584960938, 0.09212493896484375, 0.10298538208007812, 0.1138458251953125, 0.12470626831054688, 0.13556671142578125, 0.14642715454101562, 0.15728759765625, 0.16814804077148438, 0.17900848388671875, 0.18986892700195312, 0.2007293701171875, 0.21158981323242188, 0.22245025634765625, 0.23331069946289062, 0.244171142578125, 0.2550315856933594, 0.26589202880859375, 0.2767524719238281, 0.2876129150390625, 0.2984733581542969, 0.30933380126953125, 0.3201942443847656, 0.3310546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 10.0, 8.0, 6.0, 12.0, 7.0, 12.0, 23.0, 27.0, 19.0, 29.0, 29.0, 24.0, 48.0, 47.0, 43.0, 35.0, 39.0, 51.0, 42.0, 39.0, 58.0, 41.0, 34.0, 46.0, 29.0, 38.0, 30.0, 28.0, 24.0, 20.0, 18.0, 16.0, 21.0, 9.0, 9.0, 10.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.392822265625, -0.37941741943359375, -0.3660125732421875, -0.35260772705078125, -0.339202880859375, -0.32579803466796875, -0.3123931884765625, -0.29898834228515625, -0.28558349609375, -0.27217864990234375, -0.2587738037109375, -0.24536895751953125, -0.231964111328125, -0.21855926513671875, -0.2051544189453125, -0.19174957275390625, -0.1783447265625, -0.16493988037109375, -0.1515350341796875, -0.13813018798828125, -0.124725341796875, -0.11132049560546875, -0.0979156494140625, -0.08451080322265625, -0.07110595703125, -0.05770111083984375, -0.0442962646484375, -0.03089141845703125, -0.017486572265625, -0.00408172607421875, 0.0093231201171875, 0.02272796630859375, 0.0361328125, 0.04953765869140625, 0.0629425048828125, 0.07634735107421875, 0.089752197265625, 0.10315704345703125, 0.1165618896484375, 0.12996673583984375, 0.14337158203125, 0.15677642822265625, 0.1701812744140625, 0.18358612060546875, 0.196990966796875, 0.21039581298828125, 0.2238006591796875, 0.23720550537109375, 0.2506103515625, 0.26401519775390625, 0.2774200439453125, 0.29082489013671875, 0.304229736328125, 0.31763458251953125, 0.3310394287109375, 0.34444427490234375, 0.35784912109375, 0.37125396728515625, 0.3846588134765625, 0.39806365966796875, 0.411468505859375, 0.42487335205078125, 0.4382781982421875, 0.45168304443359375, 0.465087890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 9.0, 13.0, 10.0, 18.0, 18.0, 35.0, 59.0, 73.0, 101.0, 152.0, 249.0, 434.0, 837.0, 1625.0, 3400.0, 8213.0, 24460.0, 92304.0, 374199.0, 400835.0, 99532.0, 25892.0, 8657.0, 3598.0, 1695.0, 839.0, 488.0, 293.0, 178.0, 103.0, 84.0, 44.0, 38.0, 18.0, 12.0, 11.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.14990234375, -0.14522171020507812, -0.14054107666015625, -0.13586044311523438, -0.1311798095703125, -0.12649917602539062, -0.12181854248046875, -0.11713790893554688, -0.112457275390625, -0.10777664184570312, -0.10309600830078125, -0.09841537475585938, -0.0937347412109375, -0.08905410766601562, -0.08437347412109375, -0.07969284057617188, -0.07501220703125, -0.07033157348632812, -0.06565093994140625, -0.060970306396484375, -0.0562896728515625, -0.051609039306640625, -0.04692840576171875, -0.042247772216796875, -0.037567138671875, -0.032886505126953125, -0.02820587158203125, -0.023525238037109375, -0.0188446044921875, -0.014163970947265625, -0.00948333740234375, -0.004802703857421875, -0.0001220703125, 0.004558563232421875, 0.00923919677734375, 0.013919830322265625, 0.0186004638671875, 0.023281097412109375, 0.02796173095703125, 0.032642364501953125, 0.037322998046875, 0.042003631591796875, 0.04668426513671875, 0.051364898681640625, 0.0560455322265625, 0.060726165771484375, 0.06540679931640625, 0.07008743286132812, 0.07476806640625, 0.07944869995117188, 0.08412933349609375, 0.08880996704101562, 0.0934906005859375, 0.09817123413085938, 0.10285186767578125, 0.10753250122070312, 0.112213134765625, 0.11689376831054688, 0.12157440185546875, 0.12625503540039062, 0.1309356689453125, 0.13561630249023438, 0.14029693603515625, 0.14497756958007812, 0.149658203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 17.0, 9.0, 9.0, 13.0, 17.0, 38.0, 18.0, 24.0, 26.0, 32.0, 34.0, 40.0, 45.0, 45.0, 49.0, 53.0, 50.0, 49.0, 50.0, 52.0, 56.0, 25.0, 43.0, 32.0, 38.0, 13.0, 23.0, 14.0, 8.0, 12.0, 8.0, 11.0, 9.0, 7.0, 9.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.0187110900878906e-05, -4.8590824007987976e-05, -4.6994537115097046e-05, -4.5398250222206116e-05, -4.3801963329315186e-05, -4.2205676436424255e-05, -4.0609389543533325e-05, -3.9013102650642395e-05, -3.7416815757751465e-05, -3.5820528864860535e-05, -3.4224241971969604e-05, -3.2627955079078674e-05, -3.1031668186187744e-05, -2.9435381293296814e-05, -2.7839094400405884e-05, -2.6242807507514954e-05, -2.4646520614624023e-05, -2.3050233721733093e-05, -2.1453946828842163e-05, -1.9857659935951233e-05, -1.8261373043060303e-05, -1.6665086150169373e-05, -1.5068799257278442e-05, -1.3472512364387512e-05, -1.1876225471496582e-05, -1.0279938578605652e-05, -8.683651685714722e-06, -7.0873647928237915e-06, -5.491077899932861e-06, -3.894791007041931e-06, -2.298504114151001e-06, -7.022172212600708e-07, 8.940696716308594e-07, 2.4903565645217896e-06, 4.08664345741272e-06, 5.68293035030365e-06, 7.27921724319458e-06, 8.87550413608551e-06, 1.047179102897644e-05, 1.206807792186737e-05, 1.36643648147583e-05, 1.526065170764923e-05, 1.685693860054016e-05, 1.845322549343109e-05, 2.004951238632202e-05, 2.164579927921295e-05, 2.3242086172103882e-05, 2.4838373064994812e-05, 2.6434659957885742e-05, 2.8030946850776672e-05, 2.9627233743667603e-05, 3.122352063655853e-05, 3.281980752944946e-05, 3.441609442234039e-05, 3.601238131523132e-05, 3.7608668208122253e-05, 3.9204955101013184e-05, 4.0801241993904114e-05, 4.2397528886795044e-05, 4.3993815779685974e-05, 4.5590102672576904e-05, 4.7186389565467834e-05, 4.8782676458358765e-05, 5.0378963351249695e-05, 5.1975250244140625e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 12.0, 14.0, 18.0, 23.0, 28.0, 56.0, 67.0, 91.0, 167.0, 270.0, 503.0, 1000.0, 2388.0, 7735.0, 38499.0, 311109.0, 579998.0, 86304.0, 13712.0, 3615.0, 1350.0, 669.0, 340.0, 201.0, 122.0, 70.0, 50.0, 32.0, 35.0, 20.0, 22.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1832275390625, -0.17695236206054688, -0.17067718505859375, -0.16440200805664062, -0.1581268310546875, -0.15185165405273438, -0.14557647705078125, -0.13930130004882812, -0.133026123046875, -0.12675094604492188, -0.12047576904296875, -0.11420059204101562, -0.1079254150390625, -0.10165023803710938, -0.09537506103515625, -0.08909988403320312, -0.08282470703125, -0.07654953002929688, -0.07027435302734375, -0.06399917602539062, -0.0577239990234375, -0.051448822021484375, -0.04517364501953125, -0.038898468017578125, -0.032623291015625, -0.026348114013671875, -0.02007293701171875, -0.013797760009765625, -0.0075225830078125, -0.001247406005859375, 0.00502777099609375, 0.011302947998046875, 0.017578125, 0.023853302001953125, 0.03012847900390625, 0.036403656005859375, 0.0426788330078125, 0.048954010009765625, 0.05522918701171875, 0.061504364013671875, 0.067779541015625, 0.07405471801757812, 0.08032989501953125, 0.08660507202148438, 0.0928802490234375, 0.09915542602539062, 0.10543060302734375, 0.11170578002929688, 0.11798095703125, 0.12425613403320312, 0.13053131103515625, 0.13680648803710938, 0.1430816650390625, 0.14935684204101562, 0.15563201904296875, 0.16190719604492188, 0.168182373046875, 0.17445755004882812, 0.18073272705078125, 0.18700790405273438, 0.1932830810546875, 0.19955825805664062, 0.20583343505859375, 0.21210861206054688, 0.2183837890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 9.0, 9.0, 20.0, 16.0, 27.0, 29.0, 45.0, 52.0, 73.0, 72.0, 82.0, 94.0, 78.0, 79.0, 64.0, 44.0, 52.0, 33.0, 27.0, 17.0, 16.0, 14.0, 15.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.16053009033203125, -0.1550445556640625, -0.14955902099609375, -0.144073486328125, -0.13858795166015625, -0.1331024169921875, -0.12761688232421875, -0.12213134765625, -0.11664581298828125, -0.1111602783203125, -0.10567474365234375, -0.100189208984375, -0.09470367431640625, -0.0892181396484375, -0.08373260498046875, -0.0782470703125, -0.07276153564453125, -0.0672760009765625, -0.06179046630859375, -0.056304931640625, -0.05081939697265625, -0.0453338623046875, -0.03984832763671875, -0.03436279296875, -0.02887725830078125, -0.0233917236328125, -0.01790618896484375, -0.012420654296875, -0.00693511962890625, -0.0014495849609375, 0.00403594970703125, 0.009521484375, 0.01500701904296875, 0.0204925537109375, 0.02597808837890625, 0.031463623046875, 0.03694915771484375, 0.0424346923828125, 0.04792022705078125, 0.05340576171875, 0.05889129638671875, 0.0643768310546875, 0.06986236572265625, 0.075347900390625, 0.08083343505859375, 0.0863189697265625, 0.09180450439453125, 0.0972900390625, 0.10277557373046875, 0.1082611083984375, 0.11374664306640625, 0.119232177734375, 0.12471771240234375, 0.1302032470703125, 0.13568878173828125, 0.14117431640625, 0.14665985107421875, 0.1521453857421875, 0.15763092041015625, 0.163116455078125, 0.16860198974609375, 0.1740875244140625, 0.17957305908203125, 0.18505859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 10.0, 31.0, 50.0, 106.0, 143.0, 188.0, 171.0, 140.0, 88.0, 44.0, 14.0, 8.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.472292900085449, -2.3467941284179688, -2.2212953567504883, -2.095796585083008, -1.970297932624817, -1.8447991609573364, -1.7193005084991455, -1.593801736831665, -1.4683029651641846, -1.342804193496704, -1.2173054218292236, -1.0918067693710327, -0.9663079977035522, -0.8408092260360718, -0.7153105139732361, -0.5898118019104004, -0.4643130302429199, -0.33881428837776184, -0.21331554651260376, -0.08781680464744568, 0.0376819372177124, 0.16318070888519287, 0.28867942094802856, 0.41417813301086426, 0.5396769046783447, 0.6651756763458252, 0.7906743884086609, 0.9161731004714966, 1.041671872138977, 1.1671706438064575, 1.2926692962646484, 1.418168067932129, 1.5436668395996094, 1.6691656112670898, 1.7946643829345703, 1.9201630353927612, 2.0456619262695312, 2.1711606979370117, 2.296659231185913, 2.4221580028533936, 2.547656774520874, 2.6731555461883545, 2.798654317855835, 2.9241530895233154, 3.049651622772217, 3.1751503944396973, 3.3006491661071777, 3.426147937774658, 3.5516467094421387, 3.677145481109619, 3.8026442527770996, 3.92814302444458, 4.0536417961120605, 4.179140567779541, 4.3046393394470215, 4.430137634277344, 4.555636405944824, 4.681135177612305, 4.806633949279785, 4.932132720947266, 5.057631492614746, 5.183130264282227, 5.308629035949707, 5.4341278076171875, 5.559626579284668]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 7.0, 5.0, 14.0, 14.0, 16.0, 21.0, 21.0, 25.0, 28.0, 33.0, 35.0, 38.0, 35.0, 33.0, 53.0, 44.0, 60.0, 52.0, 49.0, 48.0, 43.0, 34.0, 42.0, 38.0, 24.0, 30.0, 20.0, 22.0, 17.0, 15.0, 17.0, 14.0, 6.0, 8.0, 2.0, 3.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.229708671569824, -2.1599161624908447, -2.0901236534118652, -2.0203311443328857, -1.9505386352539062, -1.8807461261749268, -1.8109536170959473, -1.7411611080169678, -1.6713685989379883, -1.6015760898590088, -1.5317835807800293, -1.4619910717010498, -1.3921985626220703, -1.3224060535430908, -1.2526135444641113, -1.1828210353851318, -1.113028645515442, -1.0432361364364624, -0.9734436273574829, -0.9036511182785034, -0.8338586091995239, -0.7640661001205444, -0.6942736506462097, -0.6244811415672302, -0.5546886324882507, -0.48489612340927124, -0.41510361433029175, -0.34531113505363464, -0.27551862597465515, -0.20572611689567566, -0.13593363761901855, -0.06614112854003906, 0.0036513805389404297, 0.07344388216733932, 0.14323638379573822, 0.21302887797355652, 0.282821387052536, 0.3526138961315155, 0.4224063754081726, 0.4921988844871521, 0.5619913935661316, 0.6317839026451111, 0.7015764117240906, 0.7713688611984253, 0.8411613702774048, 0.9109538793563843, 0.9807463884353638, 1.0505388975143433, 1.1203314065933228, 1.1901239156723022, 1.2599164247512817, 1.3297089338302612, 1.3995014429092407, 1.4692939519882202, 1.5390863418579102, 1.6088788509368896, 1.6786713600158691, 1.7484638690948486, 1.8182563781738281, 1.8880488872528076, 1.957841396331787, 2.0276339054107666, 2.097426414489746, 2.1672189235687256, 2.237011432647705]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 13.0, 19.0, 37.0, 53.0, 88.0, 110.0, 259.0, 406.0, 682.0, 1164.0, 1979.0, 3813.0, 7517.0, 18462.0, 74654.0, 3864265.0, 171732.0, 28420.0, 9999.0, 4644.0, 2517.0, 1395.0, 821.0, 471.0, 299.0, 157.0, 111.0, 59.0, 39.0, 33.0, 21.0, 12.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294921875, -0.285614013671875, -0.27630615234375, -0.266998291015625, -0.2576904296875, -0.248382568359375, -0.23907470703125, -0.229766845703125, -0.220458984375, -0.211151123046875, -0.20184326171875, -0.192535400390625, -0.1832275390625, -0.173919677734375, -0.16461181640625, -0.155303955078125, -0.14599609375, -0.136688232421875, -0.12738037109375, -0.118072509765625, -0.1087646484375, -0.099456787109375, -0.09014892578125, -0.080841064453125, -0.071533203125, -0.062225341796875, -0.05291748046875, -0.043609619140625, -0.0343017578125, -0.024993896484375, -0.01568603515625, -0.006378173828125, 0.0029296875, 0.012237548828125, 0.02154541015625, 0.030853271484375, 0.0401611328125, 0.049468994140625, 0.05877685546875, 0.068084716796875, 0.077392578125, 0.086700439453125, 0.09600830078125, 0.105316162109375, 0.1146240234375, 0.123931884765625, 0.13323974609375, 0.142547607421875, 0.15185546875, 0.161163330078125, 0.17047119140625, 0.179779052734375, 0.1890869140625, 0.198394775390625, 0.20770263671875, 0.217010498046875, 0.226318359375, 0.235626220703125, 0.24493408203125, 0.254241943359375, 0.2635498046875, 0.272857666015625, 0.28216552734375, 0.291473388671875, 0.30078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 8.0, 8.0, 6.0, 12.0, 15.0, 22.0, 16.0, 26.0, 24.0, 37.0, 35.0, 32.0, 51.0, 42.0, 54.0, 50.0, 53.0, 46.0, 57.0, 55.0, 39.0, 43.0, 49.0, 36.0, 28.0, 23.0, 33.0, 9.0, 15.0, 13.0, 9.0, 10.0, 9.0, 8.0, 1.0, 3.0, 7.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10260009765625, -0.09972858428955078, -0.09685707092285156, -0.09398555755615234, -0.09111404418945312, -0.0882425308227539, -0.08537101745605469, -0.08249950408935547, -0.07962799072265625, -0.07675647735595703, -0.07388496398925781, -0.0710134506225586, -0.06814193725585938, -0.06527042388916016, -0.06239891052246094, -0.05952739715576172, -0.0566558837890625, -0.05378437042236328, -0.05091285705566406, -0.048041343688964844, -0.045169830322265625, -0.042298316955566406, -0.03942680358886719, -0.03655529022216797, -0.03368377685546875, -0.03081226348876953, -0.027940750122070312, -0.025069236755371094, -0.022197723388671875, -0.019326210021972656, -0.016454696655273438, -0.013583183288574219, -0.010711669921875, -0.007840156555175781, -0.0049686431884765625, -0.0020971298217773438, 0.000774383544921875, 0.0036458969116210938, 0.0065174102783203125, 0.009388923645019531, 0.01226043701171875, 0.015131950378417969, 0.018003463745117188, 0.020874977111816406, 0.023746490478515625, 0.026618003845214844, 0.029489517211914062, 0.03236103057861328, 0.0352325439453125, 0.03810405731201172, 0.04097557067871094, 0.043847084045410156, 0.046718597412109375, 0.049590110778808594, 0.05246162414550781, 0.05533313751220703, 0.05820465087890625, 0.06107616424560547, 0.06394767761230469, 0.0668191909790039, 0.06969070434570312, 0.07256221771240234, 0.07543373107910156, 0.07830524444580078, 0.0811767578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 20.0, 29.0, 35.0, 42.0, 65.0, 103.0, 168.0, 217.0, 337.0, 594.0, 988.0, 1800.0, 3271.0, 6528.0, 15826.0, 53264.0, 592962.0, 3418180.0, 65860.0, 18289.0, 7297.0, 3672.0, 1884.0, 1067.0, 659.0, 364.0, 247.0, 166.0, 118.0, 85.0, 47.0, 26.0, 20.0, 15.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.39434051513671875, -0.3834075927734375, -0.37247467041015625, -0.361541748046875, -0.35060882568359375, -0.3396759033203125, -0.32874298095703125, -0.31781005859375, -0.30687713623046875, -0.2959442138671875, -0.28501129150390625, -0.274078369140625, -0.26314544677734375, -0.2522125244140625, -0.24127960205078125, -0.2303466796875, -0.21941375732421875, -0.2084808349609375, -0.19754791259765625, -0.186614990234375, -0.17568206787109375, -0.1647491455078125, -0.15381622314453125, -0.14288330078125, -0.13195037841796875, -0.1210174560546875, -0.11008453369140625, -0.099151611328125, -0.08821868896484375, -0.0772857666015625, -0.06635284423828125, -0.055419921875, -0.04448699951171875, -0.0335540771484375, -0.02262115478515625, -0.011688232421875, -0.00075531005859375, 0.0101776123046875, 0.02111053466796875, 0.03204345703125, 0.04297637939453125, 0.0539093017578125, 0.06484222412109375, 0.075775146484375, 0.08670806884765625, 0.0976409912109375, 0.10857391357421875, 0.1195068359375, 0.13043975830078125, 0.1413726806640625, 0.15230560302734375, 0.163238525390625, 0.17417144775390625, 0.1851043701171875, 0.19603729248046875, 0.20697021484375, 0.21790313720703125, 0.2288360595703125, 0.23976898193359375, 0.250701904296875, 0.26163482666015625, 0.2725677490234375, 0.28350067138671875, 0.29443359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 1.0, 7.0, 10.0, 11.0, 18.0, 32.0, 48.0, 84.0, 152.0, 2473.0, 863.0, 166.0, 81.0, 32.0, 23.0, 23.0, 8.0, 7.0, 8.0, 6.0, 0.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09080886840820312, -0.08756256103515625, -0.08431625366210938, -0.0810699462890625, -0.07782363891601562, -0.07457733154296875, -0.07133102416992188, -0.068084716796875, -0.06483840942382812, -0.06159210205078125, -0.058345794677734375, -0.0550994873046875, -0.051853179931640625, -0.04860687255859375, -0.045360565185546875, -0.0421142578125, -0.038867950439453125, -0.03562164306640625, -0.032375335693359375, -0.0291290283203125, -0.025882720947265625, -0.02263641357421875, -0.019390106201171875, -0.016143798828125, -0.012897491455078125, -0.00965118408203125, -0.006404876708984375, -0.0031585693359375, 8.7738037109375e-05, 0.00333404541015625, 0.006580352783203125, 0.00982666015625, 0.013072967529296875, 0.01631927490234375, 0.019565582275390625, 0.0228118896484375, 0.026058197021484375, 0.02930450439453125, 0.032550811767578125, 0.035797119140625, 0.039043426513671875, 0.04228973388671875, 0.045536041259765625, 0.0487823486328125, 0.052028656005859375, 0.05527496337890625, 0.058521270751953125, 0.061767578125, 0.06501388549804688, 0.06826019287109375, 0.07150650024414062, 0.0747528076171875, 0.07799911499023438, 0.08124542236328125, 0.08449172973632812, 0.087738037109375, 0.09098434448242188, 0.09423065185546875, 0.09747695922851562, 0.1007232666015625, 0.10396957397460938, 0.10721588134765625, 0.11046218872070312, 0.11370849609375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 4.0, 11.0, 9.0, 12.0, 19.0, 32.0, 47.0, 42.0, 69.0, 75.0, 103.0, 98.0, 78.0, 83.0, 67.0, 58.0, 46.0, 48.0, 32.0, 12.0, 18.0, 7.0, 5.0, 5.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342792272567749, -0.3319152593612671, -0.32103821635246277, -0.31016120314598083, -0.2992841601371765, -0.2884071469306946, -0.27753013372421265, -0.2666530907154083, -0.2557760775089264, -0.24489904940128326, -0.23402202129364014, -0.2231450080871582, -0.21226797997951508, -0.20139095187187195, -0.19051392376422882, -0.1796368956565857, -0.16875986754894257, -0.15788283944129944, -0.1470058113336563, -0.13612878322601318, -0.12525177001953125, -0.11437474191188812, -0.103497713804245, -0.09262069314718246, -0.08174366503953934, -0.07086663693189621, -0.05998961627483368, -0.04911258816719055, -0.03823556378483772, -0.027358539402484894, -0.016481511294841766, -0.005604490637779236, 0.005272537469863892, 0.01614956185221672, 0.0270265880972147, 0.03790361434221268, 0.048780638724565506, 0.059657663106918335, 0.07053469121456146, 0.08141171187162399, 0.09228873997926712, 0.10316576808691025, 0.11404278874397278, 0.1249198168516159, 0.13579684495925903, 0.14667385816574097, 0.1575509011745453, 0.16842791438102722, 0.17930494248867035, 0.19018197059631348, 0.2010589987039566, 0.21193602681159973, 0.22281304001808167, 0.2336900681257248, 0.24456709623336792, 0.25544410943984985, 0.2663211524486542, 0.2771981656551361, 0.28807520866394043, 0.29895222187042236, 0.3098292648792267, 0.3207062780857086, 0.33158332109451294, 0.3424603343009949, 0.3533373475074768]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 0.0, 6.0, 7.0, 4.0, 8.0, 9.0, 8.0, 10.0, 19.0, 16.0, 18.0, 29.0, 32.0, 26.0, 25.0, 33.0, 37.0, 32.0, 45.0, 49.0, 38.0, 32.0, 34.0, 46.0, 51.0, 46.0, 33.0, 34.0, 30.0, 38.0, 22.0, 28.0, 26.0, 17.0, 17.0, 15.0, 14.0, 12.0, 7.0, 9.0, 8.0, 6.0, 7.0, 4.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.23529881238937378, -0.2280694842338562, -0.22084017097949982, -0.21361084282398224, -0.20638152956962585, -0.19915220141410828, -0.1919228732585907, -0.18469354510307312, -0.17746423184871674, -0.17023490369319916, -0.16300559043884277, -0.1557762622833252, -0.14854693412780762, -0.14131762087345123, -0.13408829271793365, -0.12685897946357727, -0.11962965130805969, -0.11240033060312271, -0.10517100989818573, -0.09794168174266815, -0.09071236103773117, -0.08348304033279419, -0.07625371217727661, -0.06902439147233963, -0.06179507076740265, -0.05456575006246567, -0.04733642563223839, -0.04010710120201111, -0.03287778049707413, -0.025648459792137146, -0.018419135361909866, -0.011189810931682587, -0.0039604902267456055, 0.003268832340836525, 0.010498154908418655, 0.017727477476000786, 0.024956800043582916, 0.0321861207485199, 0.03941544517874718, 0.04664476960897446, 0.05387409031391144, 0.06110341101884842, 0.0683327317237854, 0.07556205987930298, 0.08279138058423996, 0.09002070128917694, 0.09725002944469452, 0.1044793501496315, 0.11170867085456848, 0.11893799155950546, 0.12616731226444244, 0.13339664041996002, 0.1406259536743164, 0.14785528182983398, 0.15508460998535156, 0.16231393814086914, 0.16954325139522552, 0.1767725795507431, 0.1840018928050995, 0.19123122096061707, 0.19846054911613464, 0.20568986237049103, 0.2129191905260086, 0.220148503780365, 0.22737783193588257]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 15.0, 11.0, 19.0, 36.0, 42.0, 94.0, 166.0, 261.0, 601.0, 1179.0, 2419.0, 5292.0, 12211.0, 27793.0, 65738.0, 151572.0, 280425.0, 263886.0, 134965.0, 57762.0, 24468.0, 10551.0, 4708.0, 2138.0, 1060.0, 504.0, 264.0, 147.0, 73.0, 48.0, 33.0, 16.0, 11.0, 11.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17845535278320312, -0.17319488525390625, -0.16793441772460938, -0.1626739501953125, -0.15741348266601562, -0.15215301513671875, -0.14689254760742188, -0.141632080078125, -0.13637161254882812, -0.13111114501953125, -0.12585067749023438, -0.1205902099609375, -0.11532974243164062, -0.11006927490234375, -0.10480880737304688, -0.09954833984375, -0.09428787231445312, -0.08902740478515625, -0.08376693725585938, -0.0785064697265625, -0.07324600219726562, -0.06798553466796875, -0.06272506713867188, -0.057464599609375, -0.052204132080078125, -0.04694366455078125, -0.041683197021484375, -0.0364227294921875, -0.031162261962890625, -0.02590179443359375, -0.020641326904296875, -0.015380859375, -0.010120391845703125, -0.00485992431640625, 0.000400543212890625, 0.0056610107421875, 0.010921478271484375, 0.01618194580078125, 0.021442413330078125, 0.026702880859375, 0.031963348388671875, 0.03722381591796875, 0.042484283447265625, 0.0477447509765625, 0.053005218505859375, 0.05826568603515625, 0.06352615356445312, 0.06878662109375, 0.07404708862304688, 0.07930755615234375, 0.08456802368164062, 0.0898284912109375, 0.09508895874023438, 0.10034942626953125, 0.10560989379882812, 0.110870361328125, 0.11613082885742188, 0.12139129638671875, 0.12665176391601562, 0.1319122314453125, 0.13717269897460938, 0.14243316650390625, 0.14769363403320312, 0.1529541015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 13.0, 11.0, 16.0, 13.0, 26.0, 28.0, 39.0, 41.0, 37.0, 46.0, 58.0, 59.0, 61.0, 59.0, 49.0, 63.0, 58.0, 62.0, 38.0, 30.0, 34.0, 28.0, 31.0, 16.0, 13.0, 16.0, 11.0, 7.0, 7.0, 7.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1104736328125, -0.10685920715332031, -0.10324478149414062, -0.09963035583496094, -0.09601593017578125, -0.09240150451660156, -0.08878707885742188, -0.08517265319824219, -0.0815582275390625, -0.07794380187988281, -0.07432937622070312, -0.07071495056152344, -0.06710052490234375, -0.06348609924316406, -0.059871673583984375, -0.05625724792480469, -0.052642822265625, -0.04902839660644531, -0.045413970947265625, -0.04179954528808594, -0.03818511962890625, -0.03457069396972656, -0.030956268310546875, -0.027341842651367188, -0.0237274169921875, -0.020112991333007812, -0.016498565673828125, -0.012884140014648438, -0.00926971435546875, -0.0056552886962890625, -0.002040863037109375, 0.0015735626220703125, 0.00518798828125, 0.008802413940429688, 0.012416839599609375, 0.016031265258789062, 0.01964569091796875, 0.023260116577148438, 0.026874542236328125, 0.030488967895507812, 0.0341033935546875, 0.03771781921386719, 0.041332244873046875, 0.04494667053222656, 0.04856109619140625, 0.05217552185058594, 0.055789947509765625, 0.05940437316894531, 0.063018798828125, 0.06663322448730469, 0.07024765014648438, 0.07386207580566406, 0.07747650146484375, 0.08109092712402344, 0.08470535278320312, 0.08831977844238281, 0.0919342041015625, 0.09554862976074219, 0.09916305541992188, 0.10277748107910156, 0.10639190673828125, 0.11000633239746094, 0.11362075805664062, 0.11723518371582031, 0.120849609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 5.0, 2.0, 3.0, 8.0, 9.0, 6.0, 18.0, 34.0, 41.0, 57.0, 68.0, 105.0, 117.0, 172.0, 260.0, 414.0, 653.0, 1087.0, 2431.0, 7831.0, 42756.0, 357773.0, 545822.0, 70867.0, 11497.0, 3079.0, 1350.0, 706.0, 442.0, 277.0, 190.0, 130.0, 83.0, 76.0, 54.0, 39.0, 31.0, 24.0, 15.0, 10.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.390380859375, -0.3789405822753906, -0.36750030517578125, -0.3560600280761719, -0.3446197509765625, -0.3331794738769531, -0.32173919677734375, -0.3102989196777344, -0.298858642578125, -0.2874183654785156, -0.27597808837890625, -0.2645378112792969, -0.2530975341796875, -0.24165725708007812, -0.23021697998046875, -0.21877670288085938, -0.20733642578125, -0.19589614868164062, -0.18445587158203125, -0.17301559448242188, -0.1615753173828125, -0.15013504028320312, -0.13869476318359375, -0.12725448608398438, -0.115814208984375, -0.10437393188476562, -0.09293365478515625, -0.08149337768554688, -0.0700531005859375, -0.058612823486328125, -0.04717254638671875, -0.035732269287109375, -0.0242919921875, -0.012851715087890625, -0.00141143798828125, 0.010028839111328125, 0.0214691162109375, 0.032909393310546875, 0.04434967041015625, 0.055789947509765625, 0.067230224609375, 0.07867050170898438, 0.09011077880859375, 0.10155105590820312, 0.1129913330078125, 0.12443161010742188, 0.13587188720703125, 0.14731216430664062, 0.15875244140625, 0.17019271850585938, 0.18163299560546875, 0.19307327270507812, 0.2045135498046875, 0.21595382690429688, 0.22739410400390625, 0.23883438110351562, 0.250274658203125, 0.2617149353027344, 0.27315521240234375, 0.2845954895019531, 0.2960357666015625, 0.3074760437011719, 0.31891632080078125, 0.3303565979003906, 0.341796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 1.0, 9.0, 8.0, 13.0, 17.0, 18.0, 15.0, 21.0, 18.0, 24.0, 21.0, 31.0, 31.0, 50.0, 40.0, 24.0, 41.0, 41.0, 44.0, 46.0, 49.0, 43.0, 41.0, 46.0, 42.0, 34.0, 24.0, 36.0, 34.0, 18.0, 14.0, 12.0, 14.0, 17.0, 15.0, 12.0, 8.0, 5.0, 8.0, 9.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.42236328125, -0.4081764221191406, -0.39398956298828125, -0.3798027038574219, -0.3656158447265625, -0.3514289855957031, -0.33724212646484375, -0.3230552673339844, -0.308868408203125, -0.2946815490722656, -0.28049468994140625, -0.2663078308105469, -0.2521209716796875, -0.23793411254882812, -0.22374725341796875, -0.20956039428710938, -0.19537353515625, -0.18118667602539062, -0.16699981689453125, -0.15281295776367188, -0.1386260986328125, -0.12443923950195312, -0.11025238037109375, -0.09606552124023438, -0.081878662109375, -0.06769180297851562, -0.05350494384765625, -0.039318084716796875, -0.0251312255859375, -0.010944366455078125, 0.00324249267578125, 0.017429351806640625, 0.0316162109375, 0.045803070068359375, 0.05998992919921875, 0.07417678833007812, 0.0883636474609375, 0.10255050659179688, 0.11673736572265625, 0.13092422485351562, 0.145111083984375, 0.15929794311523438, 0.17348480224609375, 0.18767166137695312, 0.2018585205078125, 0.21604537963867188, 0.23023223876953125, 0.24441909790039062, 0.25860595703125, 0.2727928161621094, 0.28697967529296875, 0.3011665344238281, 0.3153533935546875, 0.3295402526855469, 0.34372711181640625, 0.3579139709472656, 0.372100830078125, 0.3862876892089844, 0.40047454833984375, 0.4146614074707031, 0.4288482666015625, 0.4430351257324219, 0.45722198486328125, 0.4714088439941406, 0.485595703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 1.0, 10.0, 14.0, 28.0, 34.0, 45.0, 69.0, 133.0, 219.0, 398.0, 865.0, 2224.0, 8808.0, 55843.0, 553876.0, 378830.0, 37300.0, 6407.0, 1865.0, 702.0, 342.0, 204.0, 117.0, 76.0, 40.0, 26.0, 22.0, 16.0, 11.0, 5.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1405029296875, -0.13408851623535156, -0.12767410278320312, -0.12125968933105469, -0.11484527587890625, -0.10843086242675781, -0.10201644897460938, -0.09560203552246094, -0.0891876220703125, -0.08277320861816406, -0.07635879516601562, -0.06994438171386719, -0.06352996826171875, -0.05711555480957031, -0.050701141357421875, -0.04428672790527344, -0.037872314453125, -0.03145790100097656, -0.025043487548828125, -0.018629074096679688, -0.01221466064453125, -0.0058002471923828125, 0.000614166259765625, 0.0070285797119140625, 0.0134429931640625, 0.019857406616210938, 0.026271820068359375, 0.03268623352050781, 0.03910064697265625, 0.04551506042480469, 0.051929473876953125, 0.05834388732910156, 0.06475830078125, 0.07117271423339844, 0.07758712768554688, 0.08400154113769531, 0.09041595458984375, 0.09683036804199219, 0.10324478149414062, 0.10965919494628906, 0.1160736083984375, 0.12248802185058594, 0.12890243530273438, 0.1353168487548828, 0.14173126220703125, 0.1481456756591797, 0.15456008911132812, 0.16097450256347656, 0.167388916015625, 0.17380332946777344, 0.18021774291992188, 0.1866321563720703, 0.19304656982421875, 0.1994609832763672, 0.20587539672851562, 0.21228981018066406, 0.2187042236328125, 0.22511863708496094, 0.23153305053710938, 0.2379474639892578, 0.24436187744140625, 0.2507762908935547, 0.2571907043457031, 0.26360511779785156, 0.27001953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 12.0, 9.0, 14.0, 21.0, 22.0, 36.0, 48.0, 51.0, 67.0, 74.0, 80.0, 74.0, 85.0, 83.0, 79.0, 81.0, 44.0, 40.0, 25.0, 20.0, 10.0, 5.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.178285598754883e-05, -3.941543400287628e-05, -3.7048012018203735e-05, -3.468059003353119e-05, -3.231316804885864e-05, -2.9945746064186096e-05, -2.757832407951355e-05, -2.5210902094841003e-05, -2.2843480110168457e-05, -2.047605812549591e-05, -1.8108636140823364e-05, -1.5741214156150818e-05, -1.3373792171478271e-05, -1.1006370186805725e-05, -8.638948202133179e-06, -6.271526217460632e-06, -3.904104232788086e-06, -1.5366822481155396e-06, 8.307397365570068e-07, 3.1981617212295532e-06, 5.5655837059021e-06, 7.933005690574646e-06, 1.0300427675247192e-05, 1.2667849659919739e-05, 1.5035271644592285e-05, 1.740269362926483e-05, 1.9770115613937378e-05, 2.2137537598609924e-05, 2.450495958328247e-05, 2.6872381567955017e-05, 2.9239803552627563e-05, 3.160722553730011e-05, 3.3974647521972656e-05, 3.63420695066452e-05, 3.870949149131775e-05, 4.1076913475990295e-05, 4.344433546066284e-05, 4.581175744533539e-05, 4.8179179430007935e-05, 5.054660141468048e-05, 5.291402339935303e-05, 5.5281445384025574e-05, 5.764886736869812e-05, 6.0016289353370667e-05, 6.238371133804321e-05, 6.475113332271576e-05, 6.71185553073883e-05, 6.948597729206085e-05, 7.18533992767334e-05, 7.422082126140594e-05, 7.658824324607849e-05, 7.895566523075104e-05, 8.132308721542358e-05, 8.369050920009613e-05, 8.605793118476868e-05, 8.842535316944122e-05, 9.079277515411377e-05, 9.316019713878632e-05, 9.552761912345886e-05, 9.789504110813141e-05, 0.00010026246309280396, 0.0001026298850774765, 0.00010499730706214905, 0.0001073647290468216, 0.00010973215103149414]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 7.0, 8.0, 11.0, 21.0, 47.0, 90.0, 181.0, 507.0, 1505.0, 7903.0, 212198.0, 797738.0, 24248.0, 2761.0, 756.0, 308.0, 131.0, 58.0, 29.0, 25.0, 18.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.329193115234375, -0.31829833984375, -0.307403564453125, -0.2965087890625, -0.285614013671875, -0.27471923828125, -0.263824462890625, -0.2529296875, -0.242034912109375, -0.23114013671875, -0.220245361328125, -0.2093505859375, -0.198455810546875, -0.18756103515625, -0.176666259765625, -0.165771484375, -0.154876708984375, -0.14398193359375, -0.133087158203125, -0.1221923828125, -0.111297607421875, -0.10040283203125, -0.089508056640625, -0.07861328125, -0.067718505859375, -0.05682373046875, -0.045928955078125, -0.0350341796875, -0.024139404296875, -0.01324462890625, -0.002349853515625, 0.008544921875, 0.019439697265625, 0.03033447265625, 0.041229248046875, 0.0521240234375, 0.063018798828125, 0.07391357421875, 0.084808349609375, 0.095703125, 0.106597900390625, 0.11749267578125, 0.128387451171875, 0.1392822265625, 0.150177001953125, 0.16107177734375, 0.171966552734375, 0.182861328125, 0.193756103515625, 0.20465087890625, 0.215545654296875, 0.2264404296875, 0.237335205078125, 0.24822998046875, 0.259124755859375, 0.27001953125, 0.280914306640625, 0.29180908203125, 0.302703857421875, 0.3135986328125, 0.324493408203125, 0.33538818359375, 0.346282958984375, 0.357177734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 11.0, 19.0, 45.0, 77.0, 137.0, 159.0, 159.0, 136.0, 107.0, 68.0, 39.0, 15.0, 10.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.12723922729492188, -0.11775970458984375, -0.10828018188476562, -0.0988006591796875, -0.08932113647460938, -0.07984161376953125, -0.07036209106445312, -0.060882568359375, -0.051403045654296875, -0.04192352294921875, -0.032444000244140625, -0.0229644775390625, -0.013484954833984375, -0.00400543212890625, 0.005474090576171875, 0.01495361328125, 0.024433135986328125, 0.03391265869140625, 0.043392181396484375, 0.0528717041015625, 0.062351226806640625, 0.07183074951171875, 0.08131027221679688, 0.090789794921875, 0.10026931762695312, 0.10974884033203125, 0.11922836303710938, 0.1287078857421875, 0.13818740844726562, 0.14766693115234375, 0.15714645385742188, 0.1666259765625, 0.17610549926757812, 0.18558502197265625, 0.19506454467773438, 0.2045440673828125, 0.21402359008789062, 0.22350311279296875, 0.23298263549804688, 0.242462158203125, 0.2519416809082031, 0.26142120361328125, 0.2709007263183594, 0.2803802490234375, 0.2898597717285156, 0.29933929443359375, 0.3088188171386719, 0.31829833984375, 0.3277778625488281, 0.33725738525390625, 0.3467369079589844, 0.3562164306640625, 0.3656959533691406, 0.37517547607421875, 0.3846549987792969, 0.394134521484375, 0.4036140441894531, 0.41309356689453125, 0.4225730895996094, 0.4320526123046875, 0.4415321350097656, 0.45101165771484375, 0.4604911804199219, 0.469970703125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 9.0, 7.0, 15.0, 37.0, 43.0, 88.0, 100.0, 113.0, 118.0, 108.0, 109.0, 95.0, 50.0, 38.0, 26.0, 17.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0187923908233643, -0.9427394866943359, -0.8666865825653076, -0.7906336784362793, -0.714580774307251, -0.6385278701782227, -0.5624749660491943, -0.486422061920166, -0.4103691577911377, -0.3343162536621094, -0.25826334953308105, -0.18221044540405273, -0.10615754127502441, -0.030104637145996094, 0.04594826698303223, 0.12200117111206055, 0.19805407524108887, 0.2741069793701172, 0.3501598834991455, 0.42621278762817383, 0.5022656917572021, 0.5783185958862305, 0.6543715000152588, 0.7304244041442871, 0.8064773082733154, 0.8825302124023438, 0.9585831165313721, 1.0346360206604004, 1.1106889247894287, 1.186741828918457, 1.2627947330474854, 1.3388476371765137, 1.414900779724121, 1.4909536838531494, 1.5670065879821777, 1.643059492111206, 1.7191123962402344, 1.7951653003692627, 1.871218204498291, 1.9472711086273193, 2.0233240127563477, 2.099376916885376, 2.1754298210144043, 2.2514827251434326, 2.327535629272461, 2.4035885334014893, 2.4796414375305176, 2.555694341659546, 2.631747245788574, 2.7078001499176025, 2.783853054046631, 2.859905958175659, 2.9359588623046875, 3.012011766433716, 3.088064670562744, 3.1641175746917725, 3.240170478820801, 3.316223382949829, 3.3922762870788574, 3.4683291912078857, 3.544382095336914, 3.6204349994659424, 3.6964879035949707, 3.772540807723999, 3.8485937118530273]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 4.0, 3.0, 8.0, 4.0, 11.0, 8.0, 11.0, 13.0, 13.0, 19.0, 24.0, 34.0, 35.0, 36.0, 48.0, 46.0, 44.0, 37.0, 54.0, 50.0, 57.0, 46.0, 38.0, 48.0, 43.0, 46.0, 40.0, 31.0, 23.0, 28.0, 30.0, 12.0, 9.0, 15.0, 11.0, 5.0, 6.0, 4.0, 1.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2285633087158203, -2.160181760787964, -2.0918002128601074, -2.023418664932251, -1.955036997795105, -1.8866554498672485, -1.818273901939392, -1.7498923540115356, -1.6815106868743896, -1.6131291389465332, -1.5447475910186768, -1.4763660430908203, -1.4079843759536743, -1.3396028280258179, -1.2712212800979614, -1.202839732170105, -1.1344581842422485, -1.066076636314392, -0.9976950287818909, -0.9293134808540344, -0.8609318733215332, -0.7925503253936768, -0.7241687774658203, -0.6557872295379639, -0.5874056220054626, -0.5190240740776062, -0.450642466545105, -0.38226091861724854, -0.3138793408870697, -0.24549776315689087, -0.17711621522903442, -0.10873463749885559, -0.04035305976867676, 0.02802851051092148, 0.09641008079051971, 0.16479164361953735, 0.2331732213497162, 0.301554799079895, 0.36993634700775146, 0.4383179247379303, 0.5066995024681091, 0.5750810503959656, 0.6434626579284668, 0.7118442058563232, 0.7802257537841797, 0.8486073613166809, 0.9169889092445374, 0.9853705167770386, 1.053752064704895, 1.1221336126327515, 1.190515160560608, 1.258896827697754, 1.3272783756256104, 1.3956599235534668, 1.4640414714813232, 1.5324230194091797, 1.6008045673370361, 1.6691861152648926, 1.737567663192749, 1.8059492111206055, 1.8743308782577515, 1.942712426185608, 2.011094093322754, 2.0794756412506104, 2.147857189178467]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 20.0, 14.0, 21.0, 41.0, 41.0, 70.0, 107.0, 203.0, 282.0, 569.0, 922.0, 1769.0, 3784.0, 8388.0, 25997.0, 3717734.0, 394931.0, 23998.0, 7989.0, 3476.0, 1715.0, 905.0, 516.0, 328.0, 144.0, 126.0, 52.0, 48.0, 26.0, 19.0, 10.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328857421875, -0.3175048828125, -0.30615234375, -0.2947998046875, -0.283447265625, -0.2720947265625, -0.2607421875, -0.2493896484375, -0.238037109375, -0.2266845703125, -0.21533203125, -0.2039794921875, -0.192626953125, -0.1812744140625, -0.169921875, -0.1585693359375, -0.147216796875, -0.1358642578125, -0.12451171875, -0.1131591796875, -0.101806640625, -0.0904541015625, -0.0791015625, -0.0677490234375, -0.056396484375, -0.0450439453125, -0.03369140625, -0.0223388671875, -0.010986328125, 0.0003662109375, 0.01171875, 0.0230712890625, 0.034423828125, 0.0457763671875, 0.05712890625, 0.0684814453125, 0.079833984375, 0.0911865234375, 0.1025390625, 0.1138916015625, 0.125244140625, 0.1365966796875, 0.14794921875, 0.1593017578125, 0.170654296875, 0.1820068359375, 0.193359375, 0.2047119140625, 0.216064453125, 0.2274169921875, 0.23876953125, 0.2501220703125, 0.261474609375, 0.2728271484375, 0.2841796875, 0.2955322265625, 0.306884765625, 0.3182373046875, 0.32958984375, 0.3409423828125, 0.352294921875, 0.3636474609375, 0.375, 0.3863525390625, 0.397705078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 10.0, 16.0, 10.0, 18.0, 25.0, 24.0, 31.0, 40.0, 47.0, 46.0, 55.0, 49.0, 54.0, 56.0, 68.0, 55.0, 55.0, 44.0, 54.0, 49.0, 23.0, 29.0, 25.0, 22.0, 17.0, 12.0, 10.0, 9.0, 15.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1337890625, -0.1301727294921875, -0.126556396484375, -0.1229400634765625, -0.11932373046875, -0.1157073974609375, -0.112091064453125, -0.1084747314453125, -0.1048583984375, -0.1012420654296875, -0.097625732421875, -0.0940093994140625, -0.09039306640625, -0.0867767333984375, -0.083160400390625, -0.0795440673828125, -0.075927734375, -0.0723114013671875, -0.068695068359375, -0.0650787353515625, -0.06146240234375, -0.0578460693359375, -0.054229736328125, -0.0506134033203125, -0.0469970703125, -0.0433807373046875, -0.039764404296875, -0.0361480712890625, -0.03253173828125, -0.0289154052734375, -0.025299072265625, -0.0216827392578125, -0.01806640625, -0.0144500732421875, -0.010833740234375, -0.0072174072265625, -0.00360107421875, 1.52587890625e-05, 0.003631591796875, 0.0072479248046875, 0.0108642578125, 0.0144805908203125, 0.018096923828125, 0.0217132568359375, 0.02532958984375, 0.0289459228515625, 0.032562255859375, 0.0361785888671875, 0.039794921875, 0.0434112548828125, 0.047027587890625, 0.0506439208984375, 0.05426025390625, 0.0578765869140625, 0.061492919921875, 0.0651092529296875, 0.0687255859375, 0.0723419189453125, 0.075958251953125, 0.0795745849609375, 0.08319091796875, 0.0868072509765625, 0.090423583984375, 0.0940399169921875, 0.09765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 5.0, 16.0, 20.0, 21.0, 25.0, 43.0, 58.0, 90.0, 120.0, 163.0, 226.0, 405.0, 844.0, 1590.0, 3962.0, 15873.0, 327568.0, 3814307.0, 20378.0, 4606.0, 1740.0, 848.0, 454.0, 295.0, 157.0, 124.0, 73.0, 56.0, 39.0, 31.0, 20.0, 19.0, 18.0, 12.0, 14.0, 10.0, 7.0, 8.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6671829223632812, -0.6463775634765625, -0.6255722045898438, -0.604766845703125, -0.5839614868164062, -0.5631561279296875, -0.5423507690429688, -0.52154541015625, -0.5007400512695312, -0.4799346923828125, -0.45912933349609375, -0.438323974609375, -0.41751861572265625, -0.3967132568359375, -0.37590789794921875, -0.3551025390625, -0.33429718017578125, -0.3134918212890625, -0.29268646240234375, -0.271881103515625, -0.25107574462890625, -0.2302703857421875, -0.20946502685546875, -0.18865966796875, -0.16785430908203125, -0.1470489501953125, -0.12624359130859375, -0.105438232421875, -0.08463287353515625, -0.0638275146484375, -0.04302215576171875, -0.022216796875, -0.00141143798828125, 0.0193939208984375, 0.04019927978515625, 0.061004638671875, 0.08180999755859375, 0.1026153564453125, 0.12342071533203125, 0.14422607421875, 0.16503143310546875, 0.1858367919921875, 0.20664215087890625, 0.227447509765625, 0.24825286865234375, 0.2690582275390625, 0.28986358642578125, 0.3106689453125, 0.33147430419921875, 0.3522796630859375, 0.37308502197265625, 0.393890380859375, 0.41469573974609375, 0.4355010986328125, 0.45630645751953125, 0.47711181640625, 0.49791717529296875, 0.5187225341796875, 0.5395278930664062, 0.560333251953125, 0.5811386108398438, 0.6019439697265625, 0.6227493286132812, 0.6435546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 10.0, 22.0, 48.0, 143.0, 3571.0, 164.0, 61.0, 22.0, 12.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.170806884765625, -0.16461181640625, -0.158416748046875, -0.1522216796875, -0.146026611328125, -0.13983154296875, -0.133636474609375, -0.12744140625, -0.121246337890625, -0.11505126953125, -0.108856201171875, -0.1026611328125, -0.096466064453125, -0.09027099609375, -0.084075927734375, -0.077880859375, -0.071685791015625, -0.06549072265625, -0.059295654296875, -0.0531005859375, -0.046905517578125, -0.04071044921875, -0.034515380859375, -0.0283203125, -0.022125244140625, -0.01593017578125, -0.009735107421875, -0.0035400390625, 0.002655029296875, 0.00885009765625, 0.015045166015625, 0.021240234375, 0.027435302734375, 0.03363037109375, 0.039825439453125, 0.0460205078125, 0.052215576171875, 0.05841064453125, 0.064605712890625, 0.07080078125, 0.076995849609375, 0.08319091796875, 0.089385986328125, 0.0955810546875, 0.101776123046875, 0.10797119140625, 0.114166259765625, 0.120361328125, 0.126556396484375, 0.13275146484375, 0.138946533203125, 0.1451416015625, 0.151336669921875, 0.15753173828125, 0.163726806640625, 0.169921875, 0.176116943359375, 0.18231201171875, 0.188507080078125, 0.1947021484375, 0.200897216796875, 0.20709228515625, 0.213287353515625, 0.219482421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 10.0, 8.0, 6.0, 16.0, 23.0, 38.0, 40.0, 53.0, 53.0, 70.0, 84.0, 105.0, 94.0, 84.0, 75.0, 58.0, 52.0, 40.0, 22.0, 23.0, 9.0, 12.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3961038589477539, -0.38502028584480286, -0.3739367127418518, -0.36285313963890076, -0.3517695665359497, -0.34068599343299866, -0.3296024203300476, -0.31851884722709656, -0.3074352741241455, -0.29635170102119446, -0.2852681279182434, -0.27418455481529236, -0.2631009817123413, -0.25201740860939026, -0.2409338355064392, -0.22985026240348816, -0.2187667042016983, -0.20768313109874725, -0.1965995579957962, -0.18551598489284515, -0.1744324117898941, -0.16334883868694305, -0.1522652804851532, -0.14118170738220215, -0.1300981342792511, -0.11901456117630005, -0.107930988073349, -0.09684741497039795, -0.0857638418674469, -0.07468026876449585, -0.0635967031121254, -0.05251313000917435, -0.0414295494556427, -0.03034597635269165, -0.01926240511238575, -0.00817883387207985, 0.0029047392308712006, 0.01398831233382225, 0.025071881711483, 0.03615545481443405, 0.0472390279173851, 0.05832260102033615, 0.0694061741232872, 0.08048973977565765, 0.0915733128786087, 0.10265688598155975, 0.1137404590845108, 0.12482403218746185, 0.1359076052904129, 0.14699117839336395, 0.158074751496315, 0.16915832459926605, 0.1802418977022171, 0.19132547080516815, 0.202409029006958, 0.21349260210990906, 0.2245761752128601, 0.23565974831581116, 0.2467433214187622, 0.25782689452171326, 0.2689104676246643, 0.27999404072761536, 0.2910776138305664, 0.30216118693351746, 0.3132447600364685]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 10.0, 7.0, 7.0, 7.0, 8.0, 8.0, 18.0, 21.0, 18.0, 18.0, 19.0, 25.0, 31.0, 22.0, 29.0, 38.0, 38.0, 31.0, 48.0, 42.0, 34.0, 30.0, 34.0, 36.0, 37.0, 39.0, 40.0, 38.0, 32.0, 23.0, 23.0, 24.0, 25.0, 19.0, 19.0, 13.0, 11.0, 11.0, 9.0, 9.0, 7.0, 6.0, 7.0, 3.0, 0.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.24584299325942993, -0.23785537481307983, -0.22986775636672974, -0.22188012301921844, -0.21389250457286835, -0.20590488612651825, -0.19791725277900696, -0.18992963433265686, -0.18194201588630676, -0.17395439743995667, -0.16596677899360657, -0.15797914564609528, -0.14999152719974518, -0.14200390875339508, -0.1340162754058838, -0.1260286569595337, -0.1180410385131836, -0.1100534200668335, -0.1020657941699028, -0.0940781682729721, -0.08609054982662201, -0.07810293138027191, -0.07011530548334122, -0.06212768331170082, -0.054140061140060425, -0.04615243896842003, -0.03816481679677963, -0.030177194625139236, -0.02218957245349884, -0.014201950281858444, -0.006214328110218048, 0.001773294061422348, 0.009760916233062744, 0.01774853840470314, 0.025736160576343536, 0.03372378274798393, 0.04171140491962433, 0.049699027091264725, 0.05768664926290512, 0.06567427515983582, 0.07366189360618591, 0.08164951205253601, 0.0896371379494667, 0.0976247638463974, 0.1056123822927475, 0.1136000007390976, 0.12158762663602829, 0.12957525253295898, 0.13756287097930908, 0.14555048942565918, 0.15353810787200928, 0.16152574121952057, 0.16951335966587067, 0.17750097811222076, 0.18548861145973206, 0.19347622990608215, 0.20146384835243225, 0.20945146679878235, 0.21743908524513245, 0.22542671859264374, 0.23341433703899384, 0.24140195548534393, 0.24938958883285522, 0.2573772072792053, 0.2653648257255554]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 11.0, 16.0, 32.0, 34.0, 49.0, 66.0, 126.0, 246.0, 420.0, 655.0, 1251.0, 2580.0, 5164.0, 10967.0, 25008.0, 58428.0, 136417.0, 283623.0, 282887.0, 135859.0, 58057.0, 24921.0, 11057.0, 5068.0, 2546.0, 1316.0, 710.0, 396.0, 232.0, 128.0, 83.0, 61.0, 44.0, 25.0, 10.0, 13.0, 9.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.151123046875, -0.14624786376953125, -0.1413726806640625, -0.13649749755859375, -0.131622314453125, -0.12674713134765625, -0.1218719482421875, -0.11699676513671875, -0.11212158203125, -0.10724639892578125, -0.1023712158203125, -0.09749603271484375, -0.092620849609375, -0.08774566650390625, -0.0828704833984375, -0.07799530029296875, -0.0731201171875, -0.06824493408203125, -0.0633697509765625, -0.05849456787109375, -0.053619384765625, -0.04874420166015625, -0.0438690185546875, -0.03899383544921875, -0.03411865234375, -0.02924346923828125, -0.0243682861328125, -0.01949310302734375, -0.014617919921875, -0.00974273681640625, -0.0048675537109375, 7.62939453125e-06, 0.0048828125, 0.00975799560546875, 0.0146331787109375, 0.01950836181640625, 0.024383544921875, 0.02925872802734375, 0.0341339111328125, 0.03900909423828125, 0.04388427734375, 0.04875946044921875, 0.0536346435546875, 0.05850982666015625, 0.063385009765625, 0.06826019287109375, 0.0731353759765625, 0.07801055908203125, 0.0828857421875, 0.08776092529296875, 0.0926361083984375, 0.09751129150390625, 0.102386474609375, 0.10726165771484375, 0.1121368408203125, 0.11701202392578125, 0.12188720703125, 0.12676239013671875, 0.1316375732421875, 0.13651275634765625, 0.141387939453125, 0.14626312255859375, 0.1511383056640625, 0.15601348876953125, 0.160888671875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 9.0, 3.0, 6.0, 7.0, 11.0, 8.0, 13.0, 11.0, 18.0, 25.0, 23.0, 41.0, 51.0, 40.0, 45.0, 47.0, 46.0, 59.0, 57.0, 53.0, 45.0, 54.0, 48.0, 47.0, 34.0, 34.0, 26.0, 24.0, 21.0, 23.0, 12.0, 10.0, 11.0, 10.0, 8.0, 4.0, 2.0, 6.0, 6.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1190185546875, -0.11527347564697266, -0.11152839660644531, -0.10778331756591797, -0.10403823852539062, -0.10029315948486328, -0.09654808044433594, -0.0928030014038086, -0.08905792236328125, -0.0853128433227539, -0.08156776428222656, -0.07782268524169922, -0.07407760620117188, -0.07033252716064453, -0.06658744812011719, -0.06284236907958984, -0.0590972900390625, -0.055352210998535156, -0.05160713195800781, -0.04786205291748047, -0.044116973876953125, -0.04037189483642578, -0.03662681579589844, -0.032881736755371094, -0.02913665771484375, -0.025391578674316406, -0.021646499633789062, -0.01790142059326172, -0.014156341552734375, -0.010411262512207031, -0.0066661834716796875, -0.0029211044311523438, 0.000823974609375, 0.004569053649902344, 0.008314132690429688, 0.012059211730957031, 0.015804290771484375, 0.01954936981201172, 0.023294448852539062, 0.027039527893066406, 0.03078460693359375, 0.034529685974121094, 0.03827476501464844, 0.04201984405517578, 0.045764923095703125, 0.04951000213623047, 0.05325508117675781, 0.057000160217285156, 0.0607452392578125, 0.06449031829833984, 0.06823539733886719, 0.07198047637939453, 0.07572555541992188, 0.07947063446044922, 0.08321571350097656, 0.0869607925415039, 0.09070587158203125, 0.0944509506225586, 0.09819602966308594, 0.10194110870361328, 0.10568618774414062, 0.10943126678466797, 0.11317634582519531, 0.11692142486572266, 0.12066650390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 10.0, 12.0, 8.0, 22.0, 24.0, 40.0, 52.0, 89.0, 127.0, 193.0, 280.0, 489.0, 834.0, 1564.0, 4500.0, 29300.0, 452135.0, 517109.0, 32897.0, 4940.0, 1664.0, 878.0, 469.0, 288.0, 216.0, 132.0, 90.0, 50.0, 43.0, 31.0, 25.0, 10.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351318359375, -0.33831787109375, -0.3253173828125, -0.31231689453125, -0.29931640625, -0.28631591796875, -0.2733154296875, -0.26031494140625, -0.247314453125, -0.23431396484375, -0.2213134765625, -0.20831298828125, -0.1953125, -0.18231201171875, -0.1693115234375, -0.15631103515625, -0.143310546875, -0.13031005859375, -0.1173095703125, -0.10430908203125, -0.09130859375, -0.07830810546875, -0.0653076171875, -0.05230712890625, -0.039306640625, -0.02630615234375, -0.0133056640625, -0.00030517578125, 0.0126953125, 0.02569580078125, 0.0386962890625, 0.05169677734375, 0.064697265625, 0.07769775390625, 0.0906982421875, 0.10369873046875, 0.11669921875, 0.12969970703125, 0.1427001953125, 0.15570068359375, 0.168701171875, 0.18170166015625, 0.1947021484375, 0.20770263671875, 0.220703125, 0.23370361328125, 0.2467041015625, 0.25970458984375, 0.272705078125, 0.28570556640625, 0.2987060546875, 0.31170654296875, 0.32470703125, 0.33770751953125, 0.3507080078125, 0.36370849609375, 0.376708984375, 0.38970947265625, 0.4027099609375, 0.41571044921875, 0.4287109375, 0.44171142578125, 0.4547119140625, 0.46771240234375, 0.480712890625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 12.0, 5.0, 10.0, 16.0, 13.0, 18.0, 18.0, 26.0, 32.0, 40.0, 41.0, 41.0, 54.0, 47.0, 44.0, 49.0, 41.0, 47.0, 39.0, 37.0, 44.0, 44.0, 34.0, 34.0, 31.0, 28.0, 22.0, 28.0, 17.0, 8.0, 10.0, 13.0, 8.0, 5.0, 5.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55078125, -0.5348014831542969, -0.5188217163085938, -0.5028419494628906, -0.4868621826171875, -0.4708824157714844, -0.45490264892578125, -0.4389228820800781, -0.422943115234375, -0.4069633483886719, -0.39098358154296875, -0.3750038146972656, -0.3590240478515625, -0.3430442810058594, -0.32706451416015625, -0.3110847473144531, -0.29510498046875, -0.2791252136230469, -0.26314544677734375, -0.24716567993164062, -0.2311859130859375, -0.21520614624023438, -0.19922637939453125, -0.18324661254882812, -0.167266845703125, -0.15128707885742188, -0.13530731201171875, -0.11932754516601562, -0.1033477783203125, -0.08736801147460938, -0.07138824462890625, -0.055408477783203125, -0.0394287109375, -0.023448944091796875, -0.00746917724609375, 0.008510589599609375, 0.0244903564453125, 0.040470123291015625, 0.05644989013671875, 0.07242965698242188, 0.088409423828125, 0.10438919067382812, 0.12036895751953125, 0.13634872436523438, 0.1523284912109375, 0.16830825805664062, 0.18428802490234375, 0.20026779174804688, 0.21624755859375, 0.23222732543945312, 0.24820709228515625, 0.2641868591308594, 0.2801666259765625, 0.2961463928222656, 0.31212615966796875, 0.3281059265136719, 0.344085693359375, 0.3600654602050781, 0.37604522705078125, 0.3920249938964844, 0.4080047607421875, 0.4239845275878906, 0.43996429443359375, 0.4559440612792969, 0.471923828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 12.0, 8.0, 18.0, 18.0, 44.0, 70.0, 120.0, 256.0, 686.0, 2312.0, 17229.0, 547814.0, 461142.0, 15492.0, 2179.0, 630.0, 260.0, 100.0, 68.0, 36.0, 15.0, 8.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.2543373107910156, -0.24524688720703125, -0.23615646362304688, -0.2270660400390625, -0.21797561645507812, -0.20888519287109375, -0.19979476928710938, -0.190704345703125, -0.18161392211914062, -0.17252349853515625, -0.16343307495117188, -0.1543426513671875, -0.14525222778320312, -0.13616180419921875, -0.12707138061523438, -0.11798095703125, -0.10889053344726562, -0.09980010986328125, -0.09070968627929688, -0.0816192626953125, -0.07252883911132812, -0.06343841552734375, -0.054347991943359375, -0.045257568359375, -0.036167144775390625, -0.02707672119140625, -0.017986297607421875, -0.0088958740234375, 0.000194549560546875, 0.00928497314453125, 0.018375396728515625, 0.0274658203125, 0.036556243896484375, 0.04564666748046875, 0.054737091064453125, 0.0638275146484375, 0.07291793823242188, 0.08200836181640625, 0.09109878540039062, 0.100189208984375, 0.10927963256835938, 0.11837005615234375, 0.12746047973632812, 0.1365509033203125, 0.14564132690429688, 0.15473175048828125, 0.16382217407226562, 0.17291259765625, 0.18200302124023438, 0.19109344482421875, 0.20018386840820312, 0.2092742919921875, 0.21836471557617188, 0.22745513916015625, 0.23654556274414062, 0.245635986328125, 0.2547264099121094, 0.26381683349609375, 0.2729072570800781, 0.2819976806640625, 0.2910881042480469, 0.30017852783203125, 0.3092689514160156, 0.318359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 13.0, 8.0, 14.0, 11.0, 18.0, 23.0, 29.0, 40.0, 54.0, 58.0, 78.0, 74.0, 73.0, 66.0, 75.0, 54.0, 54.0, 40.0, 35.0, 19.0, 22.0, 18.0, 18.0, 12.0, 16.0, 7.0, 10.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.756450653076172e-05, -4.602503031492233e-05, -4.448555409908295e-05, -4.294607788324356e-05, -4.1406601667404175e-05, -3.986712545156479e-05, -3.83276492357254e-05, -3.678817301988602e-05, -3.524869680404663e-05, -3.3709220588207245e-05, -3.216974437236786e-05, -3.063026815652847e-05, -2.9090791940689087e-05, -2.75513157248497e-05, -2.6011839509010315e-05, -2.447236329317093e-05, -2.2932887077331543e-05, -2.1393410861492157e-05, -1.985393464565277e-05, -1.8314458429813385e-05, -1.6774982213974e-05, -1.5235505998134613e-05, -1.3696029782295227e-05, -1.2156553566455841e-05, -1.0617077350616455e-05, -9.077601134777069e-06, -7.538124918937683e-06, -5.998648703098297e-06, -4.459172487258911e-06, -2.919696271419525e-06, -1.3802200555801392e-06, 1.5925616025924683e-07, 1.6987323760986328e-06, 3.238208591938019e-06, 4.777684807777405e-06, 6.317161023616791e-06, 7.856637239456177e-06, 9.396113455295563e-06, 1.0935589671134949e-05, 1.2475065886974335e-05, 1.401454210281372e-05, 1.5554018318653107e-05, 1.7093494534492493e-05, 1.863297075033188e-05, 2.0172446966171265e-05, 2.171192318201065e-05, 2.3251399397850037e-05, 2.4790875613689423e-05, 2.633035182952881e-05, 2.7869828045368195e-05, 2.940930426120758e-05, 3.0948780477046967e-05, 3.248825669288635e-05, 3.402773290872574e-05, 3.5567209124565125e-05, 3.710668534040451e-05, 3.8646161556243896e-05, 4.018563777208328e-05, 4.172511398792267e-05, 4.3264590203762054e-05, 4.480406641960144e-05, 4.6343542635440826e-05, 4.788301885128021e-05, 4.94224950671196e-05, 5.0961971282958984e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 12.0, 13.0, 16.0, 35.0, 40.0, 61.0, 110.0, 185.0, 313.0, 573.0, 1127.0, 2843.0, 9704.0, 59346.0, 563640.0, 360983.0, 37655.0, 7338.0, 2372.0, 1013.0, 466.0, 266.0, 151.0, 83.0, 64.0, 35.0, 39.0, 20.0, 9.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.18888473510742188, -0.18331146240234375, -0.17773818969726562, -0.1721649169921875, -0.16659164428710938, -0.16101837158203125, -0.15544509887695312, -0.149871826171875, -0.14429855346679688, -0.13872528076171875, -0.13315200805664062, -0.1275787353515625, -0.12200546264648438, -0.11643218994140625, -0.11085891723632812, -0.10528564453125, -0.09971237182617188, -0.09413909912109375, -0.08856582641601562, -0.0829925537109375, -0.07741928100585938, -0.07184600830078125, -0.06627273559570312, -0.060699462890625, -0.055126190185546875, -0.04955291748046875, -0.043979644775390625, -0.0384063720703125, -0.032833099365234375, -0.02725982666015625, -0.021686553955078125, -0.01611328125, -0.010540008544921875, -0.00496673583984375, 0.000606536865234375, 0.0061798095703125, 0.011753082275390625, 0.01732635498046875, 0.022899627685546875, 0.028472900390625, 0.034046173095703125, 0.03961944580078125, 0.045192718505859375, 0.0507659912109375, 0.056339263916015625, 0.06191253662109375, 0.06748580932617188, 0.07305908203125, 0.07863235473632812, 0.08420562744140625, 0.08977890014648438, 0.0953521728515625, 0.10092544555664062, 0.10649871826171875, 0.11207199096679688, 0.117645263671875, 0.12321853637695312, 0.12879180908203125, 0.13436508178710938, 0.1399383544921875, 0.14551162719726562, 0.15108489990234375, 0.15665817260742188, 0.1622314453125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 8.0, 14.0, 20.0, 24.0, 30.0, 26.0, 64.0, 70.0, 109.0, 103.0, 106.0, 102.0, 82.0, 85.0, 60.0, 25.0, 26.0, 16.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.22261810302734375, -0.2164764404296875, -0.21033477783203125, -0.204193115234375, -0.19805145263671875, -0.1919097900390625, -0.18576812744140625, -0.17962646484375, -0.17348480224609375, -0.1673431396484375, -0.16120147705078125, -0.155059814453125, -0.14891815185546875, -0.1427764892578125, -0.13663482666015625, -0.1304931640625, -0.12435150146484375, -0.1182098388671875, -0.11206817626953125, -0.105926513671875, -0.09978485107421875, -0.0936431884765625, -0.08750152587890625, -0.08135986328125, -0.07521820068359375, -0.0690765380859375, -0.06293487548828125, -0.056793212890625, -0.05065155029296875, -0.0445098876953125, -0.03836822509765625, -0.0322265625, -0.02608489990234375, -0.0199432373046875, -0.01380157470703125, -0.007659912109375, -0.00151824951171875, 0.0046234130859375, 0.01076507568359375, 0.01690673828125, 0.02304840087890625, 0.0291900634765625, 0.03533172607421875, 0.041473388671875, 0.04761505126953125, 0.0537567138671875, 0.05989837646484375, 0.0660400390625, 0.07218170166015625, 0.0783233642578125, 0.08446502685546875, 0.090606689453125, 0.09674835205078125, 0.1028900146484375, 0.10903167724609375, 0.11517333984375, 0.12131500244140625, 0.1274566650390625, 0.13359832763671875, 0.139739990234375, 0.14588165283203125, 0.1520233154296875, 0.15816497802734375, 0.164306640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 6.0, 17.0, 46.0, 74.0, 151.0, 186.0, 173.0, 141.0, 103.0, 42.0, 35.0, 18.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1499881744384766, -2.0461342334747314, -1.9422802925109863, -1.8384263515472412, -1.7345725297927856, -1.6307185888290405, -1.5268646478652954, -1.4230108261108398, -1.3191568851470947, -1.2153029441833496, -1.1114490032196045, -1.0075950622558594, -0.9037412405014038, -0.7998872995376587, -0.6960333585739136, -0.5921794772148132, -0.48832547664642334, -0.3844715654850006, -0.2806176543235779, -0.17676371335983276, -0.07290980219841003, 0.030944108963012695, 0.1347980499267578, 0.23865193128585815, 0.34250587224960327, 0.446359783411026, 0.5502136945724487, 0.6540676355361938, 0.757921576499939, 0.8617754578590393, 0.9656293988227844, 1.0694832801818848, 1.1733372211456299, 1.277191162109375, 1.3810451030731201, 1.4848990440368652, 1.5887528657913208, 1.692606806755066, 1.796460747718811, 1.9003145694732666, 2.0041685104370117, 2.108022451400757, 2.211876392364502, 2.315730333328247, 2.419584274291992, 2.523437976837158, 2.6272921562194824, 2.7311458587646484, 2.8350000381469727, 2.9388539791107178, 3.042707920074463, 3.146561861038208, 3.250415802001953, 3.354269504547119, 3.4581236839294434, 3.5619773864746094, 3.6658313274383545, 3.7696852684020996, 3.8735392093658447, 3.97739315032959, 4.081246852874756, 4.18510103225708, 4.288954734802246, 4.39280891418457, 4.496662616729736]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 10.0, 11.0, 21.0, 20.0, 30.0, 40.0, 42.0, 56.0, 60.0, 66.0, 55.0, 73.0, 81.0, 76.0, 64.0, 60.0, 49.0, 32.0, 30.0, 27.0, 18.0, 19.0, 10.0, 14.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.448465585708618, -3.346440315246582, -3.244414806365967, -3.1423892974853516, -3.0403640270233154, -2.9383387565612793, -2.836313247680664, -2.734287738800049, -2.6322624683380127, -2.5302371978759766, -2.4282116889953613, -2.326186180114746, -2.22416090965271, -2.122135639190674, -2.0201101303100586, -1.918084740638733, -1.8160593509674072, -1.7140339612960815, -1.6120085716247559, -1.5099831819534302, -1.4079577922821045, -1.3059324026107788, -1.2039070129394531, -1.1018816232681274, -0.9998562335968018, -0.8978308439254761, -0.7958054542541504, -0.6937800645828247, -0.591754674911499, -0.48972928524017334, -0.38770389556884766, -0.285678505897522, -0.1836533546447754, -0.08162796497344971, 0.020397424697875977, 0.12242281436920166, 0.22444820404052734, 0.326473593711853, 0.4284989833831787, 0.5305243730545044, 0.6325497627258301, 0.7345751523971558, 0.8366005420684814, 0.9386259317398071, 1.0406513214111328, 1.1426767110824585, 1.2447021007537842, 1.3467274904251099, 1.4487528800964355, 1.5507782697677612, 1.652803659439087, 1.7548290491104126, 1.8568544387817383, 1.958879828453064, 2.0609052181243896, 2.162930488586426, 2.264955997467041, 2.3669815063476562, 2.4690067768096924, 2.5710320472717285, 2.6730575561523438, 2.775083065032959, 2.877108335494995, 2.9791336059570312, 3.0811591148376465]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 5.0, 6.0, 5.0, 8.0, 20.0, 22.0, 27.0, 44.0, 63.0, 88.0, 146.0, 169.0, 271.0, 404.0, 585.0, 989.0, 1573.0, 2886.0, 5665.0, 14227.0, 48686.0, 1776052.0, 2266472.0, 48711.0, 14034.0, 5807.0, 2877.0, 1589.0, 961.0, 598.0, 415.0, 268.0, 187.0, 128.0, 96.0, 61.0, 43.0, 31.0, 25.0, 10.0, 7.0, 14.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.30615234375, -0.2974052429199219, -0.28865814208984375, -0.2799110412597656, -0.2711639404296875, -0.2624168395996094, -0.25366973876953125, -0.24492263793945312, -0.236175537109375, -0.22742843627929688, -0.21868133544921875, -0.20993423461914062, -0.2011871337890625, -0.19244003295898438, -0.18369293212890625, -0.17494583129882812, -0.16619873046875, -0.15745162963867188, -0.14870452880859375, -0.13995742797851562, -0.1312103271484375, -0.12246322631835938, -0.11371612548828125, -0.10496902465820312, -0.096221923828125, -0.08747482299804688, -0.07872772216796875, -0.06998062133789062, -0.0612335205078125, -0.052486419677734375, -0.04373931884765625, -0.034992218017578125, -0.0262451171875, -0.017498016357421875, -0.00875091552734375, -3.814697265625e-06, 0.0087432861328125, 0.017490386962890625, 0.02623748779296875, 0.034984588623046875, 0.043731689453125, 0.052478790283203125, 0.06122589111328125, 0.06997299194335938, 0.0787200927734375, 0.08746719360351562, 0.09621429443359375, 0.10496139526367188, 0.11370849609375, 0.12245559692382812, 0.13120269775390625, 0.13994979858398438, 0.1486968994140625, 0.15744400024414062, 0.16619110107421875, 0.17493820190429688, 0.183685302734375, 0.19243240356445312, 0.20117950439453125, 0.20992660522460938, 0.2186737060546875, 0.22742080688476562, 0.23616790771484375, 0.24491500854492188, 0.253662109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 5.0, 6.0, 11.0, 11.0, 13.0, 26.0, 34.0, 36.0, 35.0, 52.0, 51.0, 67.0, 65.0, 56.0, 68.0, 67.0, 47.0, 59.0, 47.0, 40.0, 44.0, 29.0, 27.0, 24.0, 13.0, 11.0, 14.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.12845802307128906, -0.12410354614257812, -0.11974906921386719, -0.11539459228515625, -0.11104011535644531, -0.10668563842773438, -0.10233116149902344, -0.0979766845703125, -0.09362220764160156, -0.08926773071289062, -0.08491325378417969, -0.08055877685546875, -0.07620429992675781, -0.07184982299804688, -0.06749534606933594, -0.063140869140625, -0.05878639221191406, -0.054431915283203125, -0.05007743835449219, -0.04572296142578125, -0.04136848449707031, -0.037014007568359375, -0.03265953063964844, -0.0283050537109375, -0.023950576782226562, -0.019596099853515625, -0.015241622924804688, -0.01088714599609375, -0.0065326690673828125, -0.002178192138671875, 0.0021762847900390625, 0.00653076171875, 0.010885238647460938, 0.015239715576171875, 0.019594192504882812, 0.02394866943359375, 0.028303146362304688, 0.032657623291015625, 0.03701210021972656, 0.0413665771484375, 0.04572105407714844, 0.050075531005859375, 0.05443000793457031, 0.05878448486328125, 0.06313896179199219, 0.06749343872070312, 0.07184791564941406, 0.076202392578125, 0.08055686950683594, 0.08491134643554688, 0.08926582336425781, 0.09362030029296875, 0.09797477722167969, 0.10232925415039062, 0.10668373107910156, 0.1110382080078125, 0.11539268493652344, 0.11974716186523438, 0.12410163879394531, 0.12845611572265625, 0.1328105926513672, 0.13716506958007812, 0.14151954650878906, 0.1458740234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 9.0, 8.0, 26.0, 26.0, 20.0, 34.0, 31.0, 59.0, 67.0, 98.0, 157.0, 375.0, 712.0, 1883.0, 7053.0, 55074.0, 4000047.0, 113681.0, 10464.0, 2468.0, 870.0, 423.0, 204.0, 121.0, 86.0, 68.0, 39.0, 31.0, 20.0, 19.0, 16.0, 14.0, 13.0, 10.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6396484375, -0.6206207275390625, -0.601593017578125, -0.5825653076171875, -0.56353759765625, -0.5445098876953125, -0.525482177734375, -0.5064544677734375, -0.4874267578125, -0.4683990478515625, -0.449371337890625, -0.4303436279296875, -0.41131591796875, -0.3922882080078125, -0.373260498046875, -0.3542327880859375, -0.335205078125, -0.3161773681640625, -0.297149658203125, -0.2781219482421875, -0.25909423828125, -0.2400665283203125, -0.221038818359375, -0.2020111083984375, -0.1829833984375, -0.1639556884765625, -0.144927978515625, -0.1259002685546875, -0.10687255859375, -0.0878448486328125, -0.068817138671875, -0.0497894287109375, -0.03076171875, -0.0117340087890625, 0.007293701171875, 0.0263214111328125, 0.04534912109375, 0.0643768310546875, 0.083404541015625, 0.1024322509765625, 0.1214599609375, 0.1404876708984375, 0.159515380859375, 0.1785430908203125, 0.19757080078125, 0.2165985107421875, 0.235626220703125, 0.2546539306640625, 0.273681640625, 0.2927093505859375, 0.311737060546875, 0.3307647705078125, 0.34979248046875, 0.3688201904296875, 0.387847900390625, 0.4068756103515625, 0.4259033203125, 0.4449310302734375, 0.463958740234375, 0.4829864501953125, 0.50201416015625, 0.5210418701171875, 0.540069580078125, 0.5590972900390625, 0.578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 10.0, 27.0, 60.0, 110.0, 561.0, 2984.0, 200.0, 55.0, 29.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2200927734375, -0.21060752868652344, -0.20112228393554688, -0.1916370391845703, -0.18215179443359375, -0.1726665496826172, -0.16318130493164062, -0.15369606018066406, -0.1442108154296875, -0.13472557067871094, -0.12524032592773438, -0.11575508117675781, -0.10626983642578125, -0.09678459167480469, -0.08729934692382812, -0.07781410217285156, -0.068328857421875, -0.05884361267089844, -0.049358367919921875, -0.03987312316894531, -0.03038787841796875, -0.020902633666992188, -0.011417388916015625, -0.0019321441650390625, 0.0075531005859375, 0.017038345336914062, 0.026523590087890625, 0.03600883483886719, 0.04549407958984375, 0.05497932434082031, 0.06446456909179688, 0.07394981384277344, 0.08343505859375, 0.09292030334472656, 0.10240554809570312, 0.11189079284667969, 0.12137603759765625, 0.1308612823486328, 0.14034652709960938, 0.14983177185058594, 0.1593170166015625, 0.16880226135253906, 0.17828750610351562, 0.1877727508544922, 0.19725799560546875, 0.2067432403564453, 0.21622848510742188, 0.22571372985839844, 0.235198974609375, 0.24468421936035156, 0.2541694641113281, 0.2636547088623047, 0.27313995361328125, 0.2826251983642578, 0.2921104431152344, 0.30159568786621094, 0.3110809326171875, 0.32056617736816406, 0.3300514221191406, 0.3395366668701172, 0.34902191162109375, 0.3585071563720703, 0.3679924011230469, 0.37747764587402344, 0.386962890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 10.0, 28.0, 36.0, 69.0, 89.0, 100.0, 130.0, 129.0, 105.0, 96.0, 55.0, 40.0, 31.0, 17.0, 20.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6400371789932251, -0.6159711480140686, -0.5919051170349121, -0.5678390264511108, -0.5437729954719543, -0.5197069644927979, -0.49564090371131897, -0.4715748429298401, -0.4475088119506836, -0.4234427809715271, -0.3993767201900482, -0.37531065940856934, -0.35124462842941284, -0.32717859745025635, -0.30311253666877747, -0.2790464758872986, -0.2549804449081421, -0.2309143990278244, -0.2068483531475067, -0.18278230726718903, -0.15871626138687134, -0.13465021550655365, -0.11058416962623596, -0.08651812374591827, -0.062452077865600586, -0.0383860319852829, -0.01431998610496521, 0.009746059775352478, 0.033812105655670166, 0.057878151535987854, 0.08194419741630554, 0.10601024329662323, 0.13007628917694092, 0.1541423350572586, 0.1782083809375763, 0.20227442681789398, 0.22634047269821167, 0.25040650367736816, 0.27447256445884705, 0.2985386252403259, 0.3226046562194824, 0.3466706871986389, 0.3707367479801178, 0.3948028087615967, 0.4188688397407532, 0.44293487071990967, 0.46700093150138855, 0.49106699228286743, 0.5151330232620239, 0.5391990542411804, 0.5632650852203369, 0.5873311758041382, 0.6113972067832947, 0.6354632377624512, 0.6595293283462524, 0.6835953593254089, 0.7076613903045654, 0.7317274212837219, 0.7557934522628784, 0.7798595428466797, 0.8039255738258362, 0.8279916048049927, 0.852057695388794, 0.8761237263679504, 0.9001897573471069]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 12.0, 11.0, 12.0, 9.0, 12.0, 17.0, 27.0, 27.0, 34.0, 35.0, 39.0, 34.0, 37.0, 40.0, 53.0, 42.0, 57.0, 43.0, 56.0, 47.0, 40.0, 31.0, 39.0, 29.0, 22.0, 29.0, 19.0, 25.0, 21.0, 19.0, 16.0, 15.0, 14.0, 14.0, 3.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48975038528442383, -0.47480884194374084, -0.45986732840538025, -0.44492578506469727, -0.42998427152633667, -0.4150427281856537, -0.4001011848449707, -0.3851596713066101, -0.3702181279659271, -0.35527658462524414, -0.34033507108688354, -0.32539352774620056, -0.3104519844055176, -0.295510470867157, -0.280568927526474, -0.265627384185791, -0.2506858706474304, -0.23574434220790863, -0.22080281376838684, -0.20586127042770386, -0.19091974198818207, -0.17597821354866028, -0.1610366702079773, -0.1460951417684555, -0.13115361332893372, -0.11621208488941193, -0.10127054899930954, -0.08632901310920715, -0.07138748466968536, -0.056445956230163574, -0.04150442034006119, -0.0265628844499588, -0.011621356010437012, 0.0033201761543750763, 0.018261708319187164, 0.03320324048399925, 0.04814477264881134, 0.06308630108833313, 0.07802783697843552, 0.0929693728685379, 0.10791090130805969, 0.12285242974758148, 0.13779395818710327, 0.15273550152778625, 0.16767702996730804, 0.18261855840682983, 0.19756010174751282, 0.2125016301870346, 0.2274431586265564, 0.24238468706607819, 0.2573262155056, 0.27226775884628296, 0.28720927238464355, 0.30215081572532654, 0.3170923590660095, 0.3320338726043701, 0.3469754159450531, 0.3619169592857361, 0.3768584728240967, 0.39180001616477966, 0.40674155950546265, 0.42168307304382324, 0.4366246163845062, 0.4515661597251892, 0.4665076732635498]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 11.0, 16.0, 16.0, 46.0, 59.0, 76.0, 138.0, 213.0, 431.0, 812.0, 1488.0, 2973.0, 6415.0, 14439.0, 32453.0, 77755.0, 191703.0, 382725.0, 196866.0, 79546.0, 33131.0, 14297.0, 6536.0, 3111.0, 1528.0, 736.0, 409.0, 233.0, 144.0, 94.0, 43.0, 39.0, 25.0, 12.0, 4.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2498779296875, -0.24263763427734375, -0.2353973388671875, -0.22815704345703125, -0.220916748046875, -0.21367645263671875, -0.2064361572265625, -0.19919586181640625, -0.19195556640625, -0.18471527099609375, -0.1774749755859375, -0.17023468017578125, -0.162994384765625, -0.15575408935546875, -0.1485137939453125, -0.14127349853515625, -0.134033203125, -0.12679290771484375, -0.1195526123046875, -0.11231231689453125, -0.105072021484375, -0.09783172607421875, -0.0905914306640625, -0.08335113525390625, -0.07611083984375, -0.06887054443359375, -0.0616302490234375, -0.05438995361328125, -0.047149658203125, -0.03990936279296875, -0.0326690673828125, -0.02542877197265625, -0.0181884765625, -0.01094818115234375, -0.0037078857421875, 0.00353240966796875, 0.010772705078125, 0.01801300048828125, 0.0252532958984375, 0.03249359130859375, 0.03973388671875, 0.04697418212890625, 0.0542144775390625, 0.06145477294921875, 0.068695068359375, 0.07593536376953125, 0.0831756591796875, 0.09041595458984375, 0.09765625, 0.10489654541015625, 0.1121368408203125, 0.11937713623046875, 0.126617431640625, 0.13385772705078125, 0.1410980224609375, 0.14833831787109375, 0.15557861328125, 0.16281890869140625, 0.1700592041015625, 0.17729949951171875, 0.184539794921875, 0.19178009033203125, 0.1990203857421875, 0.20626068115234375, 0.2135009765625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 10.0, 16.0, 13.0, 20.0, 17.0, 25.0, 44.0, 32.0, 40.0, 43.0, 46.0, 51.0, 44.0, 47.0, 49.0, 50.0, 65.0, 49.0, 50.0, 38.0, 41.0, 30.0, 24.0, 19.0, 22.0, 23.0, 10.0, 18.0, 9.0, 7.0, 4.0, 11.0, 8.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125244140625, -0.12140560150146484, -0.11756706237792969, -0.11372852325439453, -0.10988998413085938, -0.10605144500732422, -0.10221290588378906, -0.0983743667602539, -0.09453582763671875, -0.0906972885131836, -0.08685874938964844, -0.08302021026611328, -0.07918167114257812, -0.07534313201904297, -0.07150459289550781, -0.06766605377197266, -0.0638275146484375, -0.059988975524902344, -0.05615043640136719, -0.05231189727783203, -0.048473358154296875, -0.04463481903076172, -0.04079627990722656, -0.036957740783691406, -0.03311920166015625, -0.029280662536621094, -0.025442123413085938, -0.02160358428955078, -0.017765045166015625, -0.013926506042480469, -0.010087966918945312, -0.006249427795410156, -0.002410888671875, 0.0014276504516601562, 0.0052661895751953125, 0.009104728698730469, 0.012943267822265625, 0.01678180694580078, 0.020620346069335938, 0.024458885192871094, 0.02829742431640625, 0.032135963439941406, 0.03597450256347656, 0.03981304168701172, 0.043651580810546875, 0.04749011993408203, 0.05132865905761719, 0.055167198181152344, 0.0590057373046875, 0.06284427642822266, 0.06668281555175781, 0.07052135467529297, 0.07435989379882812, 0.07819843292236328, 0.08203697204589844, 0.0858755111694336, 0.08971405029296875, 0.0935525894165039, 0.09739112854003906, 0.10122966766357422, 0.10506820678710938, 0.10890674591064453, 0.11274528503417969, 0.11658382415771484, 0.12042236328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 7.0, 6.0, 14.0, 13.0, 26.0, 36.0, 43.0, 58.0, 79.0, 112.0, 214.0, 260.0, 417.0, 720.0, 1187.0, 2491.0, 6404.0, 27639.0, 208071.0, 673426.0, 102061.0, 16147.0, 4453.0, 1900.0, 1007.0, 584.0, 366.0, 263.0, 161.0, 100.0, 74.0, 67.0, 40.0, 31.0, 19.0, 12.0, 16.0, 9.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353271484375, -0.3408050537109375, -0.328338623046875, -0.3158721923828125, -0.30340576171875, -0.2909393310546875, -0.278472900390625, -0.2660064697265625, -0.2535400390625, -0.2410736083984375, -0.228607177734375, -0.2161407470703125, -0.20367431640625, -0.1912078857421875, -0.178741455078125, -0.1662750244140625, -0.15380859375, -0.1413421630859375, -0.128875732421875, -0.1164093017578125, -0.10394287109375, -0.0914764404296875, -0.079010009765625, -0.0665435791015625, -0.0540771484375, -0.0416107177734375, -0.029144287109375, -0.0166778564453125, -0.00421142578125, 0.0082550048828125, 0.020721435546875, 0.0331878662109375, 0.045654296875, 0.0581207275390625, 0.070587158203125, 0.0830535888671875, 0.09552001953125, 0.1079864501953125, 0.120452880859375, 0.1329193115234375, 0.1453857421875, 0.1578521728515625, 0.170318603515625, 0.1827850341796875, 0.19525146484375, 0.2077178955078125, 0.220184326171875, 0.2326507568359375, 0.2451171875, 0.2575836181640625, 0.270050048828125, 0.2825164794921875, 0.29498291015625, 0.3074493408203125, 0.319915771484375, 0.3323822021484375, 0.3448486328125, 0.3573150634765625, 0.369781494140625, 0.3822479248046875, 0.39471435546875, 0.4071807861328125, 0.419647216796875, 0.4321136474609375, 0.444580078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 5.0, 6.0, 8.0, 8.0, 11.0, 13.0, 19.0, 22.0, 29.0, 31.0, 25.0, 34.0, 32.0, 32.0, 39.0, 51.0, 52.0, 42.0, 50.0, 39.0, 45.0, 39.0, 35.0, 43.0, 28.0, 30.0, 29.0, 42.0, 35.0, 22.0, 18.0, 14.0, 16.0, 8.0, 9.0, 8.0, 8.0, 9.0, 5.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.50732421875, -0.4927558898925781, -0.47818756103515625, -0.4636192321777344, -0.4490509033203125, -0.4344825744628906, -0.41991424560546875, -0.4053459167480469, -0.390777587890625, -0.3762092590332031, -0.36164093017578125, -0.3470726013183594, -0.3325042724609375, -0.3179359436035156, -0.30336761474609375, -0.2887992858886719, -0.27423095703125, -0.2596626281738281, -0.24509429931640625, -0.23052597045898438, -0.2159576416015625, -0.20138931274414062, -0.18682098388671875, -0.17225265502929688, -0.157684326171875, -0.14311599731445312, -0.12854766845703125, -0.11397933959960938, -0.0994110107421875, -0.08484268188476562, -0.07027435302734375, -0.055706024169921875, -0.0411376953125, -0.026569366455078125, -0.01200103759765625, 0.002567291259765625, 0.0171356201171875, 0.031703948974609375, 0.04627227783203125, 0.060840606689453125, 0.075408935546875, 0.08997726440429688, 0.10454559326171875, 0.11911392211914062, 0.1336822509765625, 0.14825057983398438, 0.16281890869140625, 0.17738723754882812, 0.19195556640625, 0.20652389526367188, 0.22109222412109375, 0.23566055297851562, 0.2502288818359375, 0.2647972106933594, 0.27936553955078125, 0.2939338684082031, 0.308502197265625, 0.3230705261230469, 0.33763885498046875, 0.3522071838378906, 0.3667755126953125, 0.3813438415527344, 0.39591217041015625, 0.4104804992675781, 0.425048828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 10.0, 20.0, 27.0, 47.0, 59.0, 88.0, 130.0, 203.0, 332.0, 547.0, 1050.0, 2058.0, 4922.0, 13190.0, 43790.0, 167780.0, 533523.0, 202642.0, 52160.0, 15156.0, 5646.0, 2285.0, 1136.0, 651.0, 359.0, 231.0, 161.0, 99.0, 70.0, 44.0, 28.0, 26.0, 15.0, 14.0, 10.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09375, -0.0904684066772461, -0.08718681335449219, -0.08390522003173828, -0.08062362670898438, -0.07734203338623047, -0.07406044006347656, -0.07077884674072266, -0.06749725341796875, -0.06421566009521484, -0.06093406677246094, -0.05765247344970703, -0.054370880126953125, -0.05108928680419922, -0.04780769348144531, -0.044526100158691406, -0.0412445068359375, -0.037962913513183594, -0.03468132019042969, -0.03139972686767578, -0.028118133544921875, -0.02483654022216797, -0.021554946899414062, -0.018273353576660156, -0.01499176025390625, -0.011710166931152344, -0.008428573608398438, -0.005146980285644531, -0.001865386962890625, 0.0014162063598632812, 0.0046977996826171875, 0.007979393005371094, 0.011260986328125, 0.014542579650878906, 0.017824172973632812, 0.02110576629638672, 0.024387359619140625, 0.02766895294189453, 0.030950546264648438, 0.034232139587402344, 0.03751373291015625, 0.040795326232910156, 0.04407691955566406, 0.04735851287841797, 0.050640106201171875, 0.05392169952392578, 0.05720329284667969, 0.060484886169433594, 0.0637664794921875, 0.0670480728149414, 0.07032966613769531, 0.07361125946044922, 0.07689285278320312, 0.08017444610595703, 0.08345603942871094, 0.08673763275146484, 0.09001922607421875, 0.09330081939697266, 0.09658241271972656, 0.09986400604248047, 0.10314559936523438, 0.10642719268798828, 0.10970878601074219, 0.1129903793334961, 0.11627197265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 4.0, 7.0, 18.0, 16.0, 18.0, 15.0, 12.0, 20.0, 25.0, 43.0, 59.0, 62.0, 74.0, 81.0, 101.0, 61.0, 52.0, 49.0, 47.0, 38.0, 25.0, 26.0, 28.0, 26.0, 19.0, 14.0, 9.0, 10.0, 4.0, 4.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.7756900787353516e-05, -5.601998418569565e-05, -5.428306758403778e-05, -5.254615098237991e-05, -5.0809234380722046e-05, -4.907231777906418e-05, -4.733540117740631e-05, -4.5598484575748444e-05, -4.3861567974090576e-05, -4.212465137243271e-05, -4.038773477077484e-05, -3.8650818169116974e-05, -3.6913901567459106e-05, -3.517698496580124e-05, -3.344006836414337e-05, -3.1703151762485504e-05, -2.9966235160827637e-05, -2.822931855916977e-05, -2.6492401957511902e-05, -2.4755485355854034e-05, -2.3018568754196167e-05, -2.12816521525383e-05, -1.9544735550880432e-05, -1.7807818949222565e-05, -1.6070902347564697e-05, -1.433398574590683e-05, -1.2597069144248962e-05, -1.0860152542591095e-05, -9.123235940933228e-06, -7.38631933927536e-06, -5.649402737617493e-06, -3.912486135959625e-06, -2.175569534301758e-06, -4.386529326438904e-07, 1.298263669013977e-06, 3.0351802706718445e-06, 4.772096872329712e-06, 6.509013473987579e-06, 8.245930075645447e-06, 9.982846677303314e-06, 1.1719763278961182e-05, 1.3456679880619049e-05, 1.5193596482276917e-05, 1.6930513083934784e-05, 1.866742968559265e-05, 2.040434628725052e-05, 2.2141262888908386e-05, 2.3878179490566254e-05, 2.561509609222412e-05, 2.735201269388199e-05, 2.9088929295539856e-05, 3.0825845897197723e-05, 3.256276249885559e-05, 3.429967910051346e-05, 3.6036595702171326e-05, 3.777351230382919e-05, 3.951042890548706e-05, 4.124734550714493e-05, 4.2984262108802795e-05, 4.472117871046066e-05, 4.645809531211853e-05, 4.81950119137764e-05, 4.9931928515434265e-05, 5.166884511709213e-05, 5.340576171875e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 7.0, 18.0, 24.0, 45.0, 66.0, 155.0, 240.0, 472.0, 1153.0, 3454.0, 16878.0, 192524.0, 744443.0, 75962.0, 9189.0, 2176.0, 861.0, 415.0, 195.0, 108.0, 65.0, 29.0, 20.0, 13.0, 8.0, 4.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1632080078125, -0.15723609924316406, -0.15126419067382812, -0.1452922821044922, -0.13932037353515625, -0.1333484649658203, -0.12737655639648438, -0.12140464782714844, -0.1154327392578125, -0.10946083068847656, -0.10348892211914062, -0.09751701354980469, -0.09154510498046875, -0.08557319641113281, -0.07960128784179688, -0.07362937927246094, -0.067657470703125, -0.06168556213378906, -0.055713653564453125, -0.04974174499511719, -0.04376983642578125, -0.03779792785644531, -0.031826019287109375, -0.025854110717773438, -0.0198822021484375, -0.013910293579101562, -0.007938385009765625, -0.0019664764404296875, 0.00400543212890625, 0.009977340698242188, 0.015949249267578125, 0.021921157836914062, 0.02789306640625, 0.03386497497558594, 0.039836883544921875, 0.04580879211425781, 0.05178070068359375, 0.05775260925292969, 0.06372451782226562, 0.06969642639160156, 0.0756683349609375, 0.08164024353027344, 0.08761215209960938, 0.09358406066894531, 0.09955596923828125, 0.10552787780761719, 0.11149978637695312, 0.11747169494628906, 0.123443603515625, 0.12941551208496094, 0.13538742065429688, 0.1413593292236328, 0.14733123779296875, 0.1533031463623047, 0.15927505493164062, 0.16524696350097656, 0.1712188720703125, 0.17719078063964844, 0.18316268920898438, 0.1891345977783203, 0.19510650634765625, 0.2010784149169922, 0.20705032348632812, 0.21302223205566406, 0.218994140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 11.0, 6.0, 12.0, 19.0, 19.0, 25.0, 31.0, 35.0, 42.0, 56.0, 69.0, 80.0, 77.0, 76.0, 80.0, 68.0, 60.0, 44.0, 42.0, 47.0, 22.0, 15.0, 18.0, 15.0, 9.0, 6.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.184814453125, -0.18032455444335938, -0.17583465576171875, -0.17134475708007812, -0.1668548583984375, -0.16236495971679688, -0.15787506103515625, -0.15338516235351562, -0.148895263671875, -0.14440536499023438, -0.13991546630859375, -0.13542556762695312, -0.1309356689453125, -0.12644577026367188, -0.12195587158203125, -0.11746597290039062, -0.11297607421875, -0.10848617553710938, -0.10399627685546875, -0.09950637817382812, -0.0950164794921875, -0.09052658081054688, -0.08603668212890625, -0.08154678344726562, -0.077056884765625, -0.07256698608398438, -0.06807708740234375, -0.06358718872070312, -0.0590972900390625, -0.054607391357421875, -0.05011749267578125, -0.045627593994140625, -0.0411376953125, -0.036647796630859375, -0.03215789794921875, -0.027667999267578125, -0.0231781005859375, -0.018688201904296875, -0.01419830322265625, -0.009708404541015625, -0.005218505859375, -0.000728607177734375, 0.00376129150390625, 0.008251190185546875, 0.0127410888671875, 0.017230987548828125, 0.02172088623046875, 0.026210784912109375, 0.03070068359375, 0.035190582275390625, 0.03968048095703125, 0.044170379638671875, 0.0486602783203125, 0.053150177001953125, 0.05764007568359375, 0.062129974365234375, 0.066619873046875, 0.07110977172851562, 0.07559967041015625, 0.08008956909179688, 0.0845794677734375, 0.08906936645507812, 0.09355926513671875, 0.09804916381835938, 0.1025390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 10.0, 19.0, 34.0, 49.0, 74.0, 93.0, 98.0, 140.0, 125.0, 110.0, 88.0, 56.0, 34.0, 17.0, 22.0, 8.0, 4.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.698230504989624, -2.6213791370391846, -2.544527769088745, -2.4676764011383057, -2.390825033187866, -2.3139736652374268, -2.2371222972869873, -2.160270929336548, -2.0834195613861084, -2.006568193435669, -1.9297168254852295, -1.85286545753479, -1.7760140895843506, -1.6991627216339111, -1.6223113536834717, -1.5454599857330322, -1.4686086177825928, -1.3917572498321533, -1.3149058818817139, -1.2380545139312744, -1.161203145980835, -1.0843517780303955, -1.007500410079956, -0.9306490421295166, -0.8537976741790771, -0.7769463062286377, -0.7000949382781982, -0.6232435703277588, -0.5463922023773193, -0.4695408344268799, -0.39268946647644043, -0.315838098526001, -0.23898696899414062, -0.16213560104370117, -0.08528423309326172, -0.008432865142822266, 0.06841850280761719, 0.14526987075805664, 0.2221212387084961, 0.29897260665893555, 0.375823974609375, 0.45267534255981445, 0.5295267105102539, 0.6063780784606934, 0.6832294464111328, 0.7600808143615723, 0.8369321823120117, 0.9137835502624512, 0.9906349182128906, 1.06748628616333, 1.1443376541137695, 1.221189022064209, 1.2980403900146484, 1.374891757965088, 1.4517431259155273, 1.5285944938659668, 1.6054458618164062, 1.6822972297668457, 1.7591485977172852, 1.8359999656677246, 1.912851333618164, 1.9897027015686035, 2.066554069519043, 2.1434054374694824, 2.220256805419922]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 6.0, 7.0, 12.0, 10.0, 15.0, 19.0, 30.0, 34.0, 38.0, 36.0, 42.0, 47.0, 47.0, 52.0, 66.0, 57.0, 67.0, 69.0, 45.0, 46.0, 55.0, 34.0, 22.0, 28.0, 25.0, 11.0, 17.0, 13.0, 8.0, 9.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.6690609455108643, -2.5888559818267822, -2.5086510181427, -2.428445816040039, -2.348240852355957, -2.268035888671875, -2.187830924987793, -2.107625961303711, -2.027420997619629, -1.9472160339355469, -1.8670109510421753, -1.7868059873580933, -1.7066009044647217, -1.6263959407806396, -1.5461909770965576, -1.4659860134124756, -1.3857808113098145, -1.3055758476257324, -1.2253707647323608, -1.1451658010482788, -1.0649607181549072, -0.9847557544708252, -0.9045507907867432, -0.8243457674980164, -0.7441407442092896, -0.6639357209205627, -0.5837306976318359, -0.5035257339477539, -0.4233207106590271, -0.3431156873703003, -0.2629106938838959, -0.18270570039749146, -0.10250043869018555, -0.022295430302619934, 0.05790957808494568, 0.1381145864725113, 0.2183195948600769, 0.2985246181488037, 0.37872961163520813, 0.45893460512161255, 0.5391396284103394, 0.6193446516990662, 0.699549674987793, 0.779754638671875, 0.8599596619606018, 0.9401646852493286, 1.0203696489334106, 1.1005747318267822, 1.1807796955108643, 1.2609846591949463, 1.3411897420883179, 1.4213947057724, 1.5015997886657715, 1.5818047523498535, 1.6620097160339355, 1.7422146797180176, 1.8224197626113892, 1.9026247262954712, 1.9828298091888428, 2.063034772872925, 2.143239736557007, 2.223444938659668, 2.30364990234375, 2.383854866027832, 2.464059829711914]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 11.0, 25.0, 20.0, 38.0, 39.0, 60.0, 81.0, 143.0, 244.0, 381.0, 731.0, 1245.0, 2344.0, 4602.0, 9979.0, 23620.0, 67940.0, 306300.0, 2507142.0, 1056663.0, 142270.0, 40254.0, 15700.0, 6850.0, 3292.0, 1770.0, 973.0, 587.0, 338.0, 184.0, 129.0, 85.0, 62.0, 40.0, 30.0, 29.0, 14.0, 10.0, 9.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1614990234375, -0.15588760375976562, -0.15027618408203125, -0.14466476440429688, -0.1390533447265625, -0.13344192504882812, -0.12783050537109375, -0.12221908569335938, -0.116607666015625, -0.11099624633789062, -0.10538482666015625, -0.09977340698242188, -0.0941619873046875, -0.08855056762695312, -0.08293914794921875, -0.07732772827148438, -0.07171630859375, -0.06610488891601562, -0.06049346923828125, -0.054882049560546875, -0.0492706298828125, -0.043659210205078125, -0.03804779052734375, -0.032436370849609375, -0.026824951171875, -0.021213531494140625, -0.01560211181640625, -0.009990692138671875, -0.0043792724609375, 0.001232147216796875, 0.00684356689453125, 0.012454986572265625, 0.01806640625, 0.023677825927734375, 0.02928924560546875, 0.034900665283203125, 0.0405120849609375, 0.046123504638671875, 0.05173492431640625, 0.057346343994140625, 0.062957763671875, 0.06856918334960938, 0.07418060302734375, 0.07979202270507812, 0.0854034423828125, 0.09101486206054688, 0.09662628173828125, 0.10223770141601562, 0.10784912109375, 0.11346054077148438, 0.11907196044921875, 0.12468338012695312, 0.1302947998046875, 0.13590621948242188, 0.14151763916015625, 0.14712905883789062, 0.152740478515625, 0.15835189819335938, 0.16396331787109375, 0.16957473754882812, 0.1751861572265625, 0.18079757690429688, 0.18640899658203125, 0.19202041625976562, 0.1976318359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 8.0, 5.0, 12.0, 16.0, 12.0, 22.0, 33.0, 17.0, 29.0, 34.0, 26.0, 41.0, 47.0, 42.0, 46.0, 53.0, 52.0, 51.0, 50.0, 51.0, 45.0, 43.0, 39.0, 35.0, 25.0, 27.0, 26.0, 18.0, 18.0, 15.0, 16.0, 10.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0947265625, -0.09137535095214844, -0.08802413940429688, -0.08467292785644531, -0.08132171630859375, -0.07797050476074219, -0.07461929321289062, -0.07126808166503906, -0.0679168701171875, -0.06456565856933594, -0.061214447021484375, -0.05786323547363281, -0.05451202392578125, -0.05116081237792969, -0.047809600830078125, -0.04445838928222656, -0.041107177734375, -0.03775596618652344, -0.034404754638671875, -0.031053543090820312, -0.02770233154296875, -0.024351119995117188, -0.020999908447265625, -0.017648696899414062, -0.0142974853515625, -0.010946273803710938, -0.007595062255859375, -0.0042438507080078125, -0.00089263916015625, 0.0024585723876953125, 0.005809783935546875, 0.009160995483398438, 0.01251220703125, 0.015863418579101562, 0.019214630126953125, 0.022565841674804688, 0.02591705322265625, 0.029268264770507812, 0.032619476318359375, 0.03597068786621094, 0.0393218994140625, 0.04267311096191406, 0.046024322509765625, 0.04937553405761719, 0.05272674560546875, 0.05607795715332031, 0.059429168701171875, 0.06278038024902344, 0.066131591796875, 0.06948280334472656, 0.07283401489257812, 0.07618522644042969, 0.07953643798828125, 0.08288764953613281, 0.08623886108398438, 0.08959007263183594, 0.0929412841796875, 0.09629249572753906, 0.09964370727539062, 0.10299491882324219, 0.10634613037109375, 0.10969734191894531, 0.11304855346679688, 0.11639976501464844, 0.1197509765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 6.0, 14.0, 25.0, 25.0, 37.0, 58.0, 90.0, 141.0, 232.0, 393.0, 695.0, 1366.0, 2880.0, 6638.0, 19475.0, 70948.0, 494011.0, 3190663.0, 325366.0, 54830.0, 15745.0, 5575.0, 2349.0, 1167.0, 604.0, 320.0, 200.0, 124.0, 84.0, 63.0, 37.0, 26.0, 19.0, 23.0, 6.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2332763671875, -0.22476768493652344, -0.21625900268554688, -0.2077503204345703, -0.19924163818359375, -0.1907329559326172, -0.18222427368164062, -0.17371559143066406, -0.1652069091796875, -0.15669822692871094, -0.14818954467773438, -0.1396808624267578, -0.13117218017578125, -0.12266349792480469, -0.11415481567382812, -0.10564613342285156, -0.097137451171875, -0.08862876892089844, -0.08012008666992188, -0.07161140441894531, -0.06310272216796875, -0.05459403991699219, -0.046085357666015625, -0.03757667541503906, -0.0290679931640625, -0.020559310913085938, -0.012050628662109375, -0.0035419464111328125, 0.00496673583984375, 0.013475418090820312, 0.021984100341796875, 0.030492782592773438, 0.03900146484375, 0.04751014709472656, 0.056018829345703125, 0.06452751159667969, 0.07303619384765625, 0.08154487609863281, 0.09005355834960938, 0.09856224060058594, 0.1070709228515625, 0.11557960510253906, 0.12408828735351562, 0.1325969696044922, 0.14110565185546875, 0.1496143341064453, 0.15812301635742188, 0.16663169860839844, 0.175140380859375, 0.18364906311035156, 0.19215774536132812, 0.2006664276123047, 0.20917510986328125, 0.2176837921142578, 0.22619247436523438, 0.23470115661621094, 0.2432098388671875, 0.25171852111816406, 0.2602272033691406, 0.2687358856201172, 0.27724456787109375, 0.2857532501220703, 0.2942619323730469, 0.30277061462402344, 0.311279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 12.0, 12.0, 8.0, 17.0, 22.0, 30.0, 34.0, 74.0, 76.0, 127.0, 262.0, 427.0, 861.0, 862.0, 484.0, 277.0, 175.0, 79.0, 61.0, 40.0, 29.0, 24.0, 22.0, 16.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3366851806640625, -0.326202392578125, -0.3157196044921875, -0.30523681640625, -0.2947540283203125, -0.284271240234375, -0.2737884521484375, -0.2633056640625, -0.2528228759765625, -0.242340087890625, -0.2318572998046875, -0.22137451171875, -0.2108917236328125, -0.200408935546875, -0.1899261474609375, -0.179443359375, -0.1689605712890625, -0.158477783203125, -0.1479949951171875, -0.13751220703125, -0.1270294189453125, -0.116546630859375, -0.1060638427734375, -0.0955810546875, -0.0850982666015625, -0.074615478515625, -0.0641326904296875, -0.05364990234375, -0.0431671142578125, -0.032684326171875, -0.0222015380859375, -0.01171875, -0.0012359619140625, 0.009246826171875, 0.0197296142578125, 0.03021240234375, 0.0406951904296875, 0.051177978515625, 0.0616607666015625, 0.0721435546875, 0.0826263427734375, 0.093109130859375, 0.1035919189453125, 0.11407470703125, 0.1245574951171875, 0.135040283203125, 0.1455230712890625, 0.156005859375, 0.1664886474609375, 0.176971435546875, 0.1874542236328125, 0.19793701171875, 0.2084197998046875, 0.218902587890625, 0.2293853759765625, 0.2398681640625, 0.2503509521484375, 0.260833740234375, 0.2713165283203125, 0.28179931640625, 0.2922821044921875, 0.302764892578125, 0.3132476806640625, 0.32373046875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 8.0, 23.0, 77.0, 168.0, 323.0, 271.0, 87.0, 18.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.902897834777832, -4.725628852844238, -4.5483598709106445, -4.371090888977051, -4.193821907043457, -4.0165534019470215, -3.8392844200134277, -3.662015438079834, -3.4847464561462402, -3.3074774742126465, -3.1302084922790527, -2.952939748764038, -2.7756707668304443, -2.5984017848968506, -2.421133041381836, -2.243864059448242, -2.0665950775146484, -1.8893260955810547, -1.7120572328567505, -1.5347883701324463, -1.3575193881988525, -1.1802504062652588, -1.0029815435409546, -0.8257126808166504, -0.6484436988830566, -0.47117477655410767, -0.2939058542251587, -0.11663693189620972, 0.06063199043273926, 0.23790091276168823, 0.4151698350906372, 0.5924386978149414, 0.7697076797485352, 0.9469766020774841, 1.124245524406433, 1.3015143871307373, 1.478783369064331, 1.6560523509979248, 1.833321213722229, 2.010590076446533, 2.187859058380127, 2.3651280403137207, 2.5423970222473145, 2.719665765762329, 2.896934747695923, 3.0742037296295166, 3.2514724731445312, 3.428741455078125, 3.6060104370117188, 3.7832794189453125, 3.9605484008789062, 4.1378173828125, 4.315086364746094, 4.492354869842529, 4.669623851776123, 4.846892833709717, 5.0241618156433105, 5.201430797576904, 5.378699779510498, 5.555968761444092, 5.733237266540527, 5.910506248474121, 6.087775230407715, 6.265044212341309, 6.442313194274902]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 4.0, 12.0, 7.0, 7.0, 12.0, 18.0, 17.0, 21.0, 31.0, 34.0, 35.0, 43.0, 41.0, 38.0, 49.0, 47.0, 51.0, 41.0, 48.0, 54.0, 44.0, 33.0, 37.0, 37.0, 24.0, 37.0, 19.0, 21.0, 23.0, 22.0, 17.0, 14.0, 14.0, 14.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5907424688339233, -1.5431251525878906, -1.4955079555511475, -1.4478906393051147, -1.400273323059082, -1.3526561260223389, -1.3050388097763062, -1.2574214935302734, -1.2098042964935303, -1.1621869802474976, -1.1145697832107544, -1.0669524669647217, -1.0193352699279785, -0.9717179536819458, -0.9241006374359131, -0.8764833807945251, -0.8288661241531372, -0.7812488675117493, -0.7336316108703613, -0.6860142946243286, -0.6383970379829407, -0.5907797813415527, -0.54316246509552, -0.4955452084541321, -0.44792795181274414, -0.4003106951713562, -0.3526934087276459, -0.30507612228393555, -0.2574588656425476, -0.20984159409999847, -0.16222432255744934, -0.11460703611373901, -0.06698989868164062, -0.01937262713909149, 0.02824464440345764, 0.07586191594600677, 0.12347918748855591, 0.17109645903110504, 0.21871373057365417, 0.2663310170173645, 0.31394827365875244, 0.3615655303001404, 0.4091828167438507, 0.45680010318756104, 0.504417359828949, 0.5520346164703369, 0.5996519327163696, 0.6472691893577576, 0.6948864459991455, 0.7425037026405334, 0.7901209592819214, 0.8377382755279541, 0.885355532169342, 0.93297278881073, 0.9805901050567627, 1.0282073020935059, 1.0758246183395386, 1.1234419345855713, 1.1710591316223145, 1.2186764478683472, 1.2662937641143799, 1.313910961151123, 1.3615282773971558, 1.4091455936431885, 1.4567627906799316]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 17.0, 14.0, 15.0, 28.0, 37.0, 62.0, 92.0, 130.0, 205.0, 268.0, 437.0, 631.0, 938.0, 1582.0, 2432.0, 3991.0, 6822.0, 11689.0, 20536.0, 38006.0, 78665.0, 199680.0, 360356.0, 171976.0, 69749.0, 34400.0, 18721.0, 10568.0, 6100.0, 3733.0, 2313.0, 1444.0, 959.0, 668.0, 423.0, 261.0, 190.0, 130.0, 84.0, 54.0, 37.0, 32.0, 19.0, 13.0, 11.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1771240234375, -0.171661376953125, -0.16619873046875, -0.160736083984375, -0.1552734375, -0.149810791015625, -0.14434814453125, -0.138885498046875, -0.1334228515625, -0.127960205078125, -0.12249755859375, -0.117034912109375, -0.111572265625, -0.106109619140625, -0.10064697265625, -0.095184326171875, -0.0897216796875, -0.084259033203125, -0.07879638671875, -0.073333740234375, -0.06787109375, -0.062408447265625, -0.05694580078125, -0.051483154296875, -0.0460205078125, -0.040557861328125, -0.03509521484375, -0.029632568359375, -0.024169921875, -0.018707275390625, -0.01324462890625, -0.007781982421875, -0.0023193359375, 0.003143310546875, 0.00860595703125, 0.014068603515625, 0.01953125, 0.024993896484375, 0.03045654296875, 0.035919189453125, 0.0413818359375, 0.046844482421875, 0.05230712890625, 0.057769775390625, 0.063232421875, 0.068695068359375, 0.07415771484375, 0.079620361328125, 0.0850830078125, 0.090545654296875, 0.09600830078125, 0.101470947265625, 0.10693359375, 0.112396240234375, 0.11785888671875, 0.123321533203125, 0.1287841796875, 0.134246826171875, 0.13970947265625, 0.145172119140625, 0.150634765625, 0.156097412109375, 0.16156005859375, 0.167022705078125, 0.1724853515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 9.0, 5.0, 8.0, 7.0, 17.0, 14.0, 7.0, 22.0, 22.0, 25.0, 20.0, 27.0, 34.0, 38.0, 48.0, 43.0, 38.0, 27.0, 64.0, 49.0, 46.0, 43.0, 37.0, 38.0, 40.0, 34.0, 25.0, 27.0, 22.0, 27.0, 23.0, 14.0, 13.0, 8.0, 14.0, 8.0, 6.0, 13.0, 12.0, 10.0, 2.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0919189453125, -0.08893299102783203, -0.08594703674316406, -0.0829610824584961, -0.07997512817382812, -0.07698917388916016, -0.07400321960449219, -0.07101726531982422, -0.06803131103515625, -0.06504535675048828, -0.06205940246582031, -0.059073448181152344, -0.056087493896484375, -0.053101539611816406, -0.05011558532714844, -0.04712963104248047, -0.0441436767578125, -0.04115772247314453, -0.03817176818847656, -0.035185813903808594, -0.032199859619140625, -0.029213905334472656, -0.026227951049804688, -0.02324199676513672, -0.02025604248046875, -0.01727008819580078, -0.014284133911132812, -0.011298179626464844, -0.008312225341796875, -0.005326271057128906, -0.0023403167724609375, 0.0006456375122070312, 0.003631591796875, 0.006617546081542969, 0.009603500366210938, 0.012589454650878906, 0.015575408935546875, 0.018561363220214844, 0.021547317504882812, 0.02453327178955078, 0.02751922607421875, 0.03050518035888672, 0.03349113464355469, 0.036477088928222656, 0.039463043212890625, 0.042448997497558594, 0.04543495178222656, 0.04842090606689453, 0.0514068603515625, 0.05439281463623047, 0.05737876892089844, 0.060364723205566406, 0.06335067749023438, 0.06633663177490234, 0.06932258605957031, 0.07230854034423828, 0.07529449462890625, 0.07828044891357422, 0.08126640319824219, 0.08425235748291016, 0.08723831176757812, 0.0902242660522461, 0.09321022033691406, 0.09619617462158203, 0.09918212890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 6.0, 8.0, 13.0, 19.0, 25.0, 28.0, 37.0, 67.0, 78.0, 134.0, 226.0, 352.0, 599.0, 1198.0, 2632.0, 8148.0, 43927.0, 704815.0, 253012.0, 23533.0, 5306.0, 1967.0, 999.0, 498.0, 294.0, 201.0, 128.0, 77.0, 69.0, 36.0, 27.0, 34.0, 14.0, 9.0, 12.0, 3.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.50537109375, -0.488983154296875, -0.47259521484375, -0.456207275390625, -0.4398193359375, -0.423431396484375, -0.40704345703125, -0.390655517578125, -0.374267578125, -0.357879638671875, -0.34149169921875, -0.325103759765625, -0.3087158203125, -0.292327880859375, -0.27593994140625, -0.259552001953125, -0.2431640625, -0.226776123046875, -0.21038818359375, -0.194000244140625, -0.1776123046875, -0.161224365234375, -0.14483642578125, -0.128448486328125, -0.112060546875, -0.095672607421875, -0.07928466796875, -0.062896728515625, -0.0465087890625, -0.030120849609375, -0.01373291015625, 0.002655029296875, 0.01904296875, 0.035430908203125, 0.05181884765625, 0.068206787109375, 0.0845947265625, 0.100982666015625, 0.11737060546875, 0.133758544921875, 0.150146484375, 0.166534423828125, 0.18292236328125, 0.199310302734375, 0.2156982421875, 0.232086181640625, 0.24847412109375, 0.264862060546875, 0.28125, 0.297637939453125, 0.31402587890625, 0.330413818359375, 0.3468017578125, 0.363189697265625, 0.37957763671875, 0.395965576171875, 0.412353515625, 0.428741455078125, 0.44512939453125, 0.461517333984375, 0.4779052734375, 0.494293212890625, 0.51068115234375, 0.527069091796875, 0.54345703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 7.0, 5.0, 6.0, 13.0, 20.0, 19.0, 28.0, 26.0, 33.0, 29.0, 42.0, 41.0, 32.0, 37.0, 41.0, 42.0, 39.0, 48.0, 42.0, 51.0, 44.0, 33.0, 30.0, 21.0, 30.0, 44.0, 29.0, 19.0, 21.0, 17.0, 17.0, 13.0, 12.0, 6.0, 8.0, 8.0, 6.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.50146484375, -0.487396240234375, -0.47332763671875, -0.459259033203125, -0.4451904296875, -0.431121826171875, -0.41705322265625, -0.402984619140625, -0.388916015625, -0.374847412109375, -0.36077880859375, -0.346710205078125, -0.3326416015625, -0.318572998046875, -0.30450439453125, -0.290435791015625, -0.2763671875, -0.262298583984375, -0.24822998046875, -0.234161376953125, -0.2200927734375, -0.206024169921875, -0.19195556640625, -0.177886962890625, -0.163818359375, -0.149749755859375, -0.13568115234375, -0.121612548828125, -0.1075439453125, -0.093475341796875, -0.07940673828125, -0.065338134765625, -0.05126953125, -0.037200927734375, -0.02313232421875, -0.009063720703125, 0.0050048828125, 0.019073486328125, 0.03314208984375, 0.047210693359375, 0.061279296875, 0.075347900390625, 0.08941650390625, 0.103485107421875, 0.1175537109375, 0.131622314453125, 0.14569091796875, 0.159759521484375, 0.173828125, 0.187896728515625, 0.20196533203125, 0.216033935546875, 0.2301025390625, 0.244171142578125, 0.25823974609375, 0.272308349609375, 0.286376953125, 0.300445556640625, 0.31451416015625, 0.328582763671875, 0.3426513671875, 0.356719970703125, 0.37078857421875, 0.384857177734375, 0.39892578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 16.0, 9.0, 27.0, 30.0, 39.0, 75.0, 94.0, 184.0, 273.0, 473.0, 941.0, 1818.0, 4130.0, 10735.0, 32882.0, 168411.0, 691524.0, 98437.0, 23762.0, 8054.0, 3215.0, 1476.0, 861.0, 385.0, 236.0, 147.0, 95.0, 63.0, 42.0, 31.0, 25.0, 9.0, 8.0, 14.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.14697265625, -0.1419677734375, -0.136962890625, -0.1319580078125, -0.126953125, -0.1219482421875, -0.116943359375, -0.1119384765625, -0.10693359375, -0.1019287109375, -0.096923828125, -0.0919189453125, -0.0869140625, -0.0819091796875, -0.076904296875, -0.0718994140625, -0.06689453125, -0.0618896484375, -0.056884765625, -0.0518798828125, -0.046875, -0.0418701171875, -0.036865234375, -0.0318603515625, -0.02685546875, -0.0218505859375, -0.016845703125, -0.0118408203125, -0.0068359375, -0.0018310546875, 0.003173828125, 0.0081787109375, 0.01318359375, 0.0181884765625, 0.023193359375, 0.0281982421875, 0.033203125, 0.0382080078125, 0.043212890625, 0.0482177734375, 0.05322265625, 0.0582275390625, 0.063232421875, 0.0682373046875, 0.0732421875, 0.0782470703125, 0.083251953125, 0.0882568359375, 0.09326171875, 0.0982666015625, 0.103271484375, 0.1082763671875, 0.11328125, 0.1182861328125, 0.123291015625, 0.1282958984375, 0.13330078125, 0.1383056640625, 0.143310546875, 0.1483154296875, 0.1533203125, 0.1583251953125, 0.163330078125, 0.1683349609375, 0.17333984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 10.0, 14.0, 20.0, 20.0, 34.0, 41.0, 42.0, 54.0, 59.0, 70.0, 83.0, 90.0, 73.0, 62.0, 49.0, 27.0, 32.0, 26.0, 16.0, 19.0, 13.0, 13.0, 9.0, 8.0, 10.0, 6.0, 5.0, 12.0, 6.0, 3.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0], "bins": [-4.595518112182617e-05, -4.450324922800064e-05, -4.305131733417511e-05, -4.159938544034958e-05, -4.014745354652405e-05, -3.869552165269852e-05, -3.7243589758872986e-05, -3.5791657865047455e-05, -3.4339725971221924e-05, -3.288779407739639e-05, -3.143586218357086e-05, -2.998393028974533e-05, -2.85319983959198e-05, -2.708006650209427e-05, -2.5628134608268738e-05, -2.4176202714443207e-05, -2.2724270820617676e-05, -2.1272338926792145e-05, -1.9820407032966614e-05, -1.8368475139141083e-05, -1.6916543245315552e-05, -1.546461135149002e-05, -1.401267945766449e-05, -1.2560747563838959e-05, -1.1108815670013428e-05, -9.656883776187897e-06, -8.204951882362366e-06, -6.753019988536835e-06, -5.301088094711304e-06, -3.849156200885773e-06, -2.3972243070602417e-06, -9.452924132347107e-07, 5.066394805908203e-07, 1.9585713744163513e-06, 3.4105032682418823e-06, 4.862435162067413e-06, 6.314367055892944e-06, 7.766298949718475e-06, 9.218230843544006e-06, 1.0670162737369537e-05, 1.2122094631195068e-05, 1.35740265250206e-05, 1.502595841884613e-05, 1.647789031267166e-05, 1.7929822206497192e-05, 1.9381754100322723e-05, 2.0833685994148254e-05, 2.2285617887973785e-05, 2.3737549781799316e-05, 2.5189481675624847e-05, 2.664141356945038e-05, 2.809334546327591e-05, 2.954527735710144e-05, 3.099720925092697e-05, 3.24491411447525e-05, 3.3901073038578033e-05, 3.5353004932403564e-05, 3.6804936826229095e-05, 3.8256868720054626e-05, 3.970880061388016e-05, 4.116073250770569e-05, 4.261266440153122e-05, 4.406459629535675e-05, 4.551652818918228e-05, 4.696846008300781e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 5.0, 18.0, 12.0, 22.0, 25.0, 40.0, 55.0, 88.0, 132.0, 186.0, 346.0, 616.0, 1138.0, 2497.0, 6173.0, 21691.0, 137523.0, 739509.0, 109359.0, 18741.0, 5507.0, 2242.0, 1076.0, 584.0, 331.0, 203.0, 114.0, 79.0, 55.0, 44.0, 21.0, 24.0, 19.0, 17.0, 9.0, 7.0, 12.0, 5.0, 2.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1705322265625, -0.16510963439941406, -0.15968704223632812, -0.1542644500732422, -0.14884185791015625, -0.1434192657470703, -0.13799667358398438, -0.13257408142089844, -0.1271514892578125, -0.12172889709472656, -0.11630630493164062, -0.11088371276855469, -0.10546112060546875, -0.10003852844238281, -0.09461593627929688, -0.08919334411621094, -0.083770751953125, -0.07834815979003906, -0.07292556762695312, -0.06750297546386719, -0.06208038330078125, -0.05665779113769531, -0.051235198974609375, -0.04581260681152344, -0.0403900146484375, -0.03496742248535156, -0.029544830322265625, -0.024122238159179688, -0.01869964599609375, -0.013277053833007812, -0.007854461669921875, -0.0024318695068359375, 0.00299072265625, 0.008413314819335938, 0.013835906982421875, 0.019258499145507812, 0.02468109130859375, 0.030103683471679688, 0.035526275634765625, 0.04094886779785156, 0.0463714599609375, 0.05179405212402344, 0.057216644287109375, 0.06263923645019531, 0.06806182861328125, 0.07348442077636719, 0.07890701293945312, 0.08432960510253906, 0.089752197265625, 0.09517478942871094, 0.10059738159179688, 0.10601997375488281, 0.11144256591796875, 0.11686515808105469, 0.12228775024414062, 0.12771034240722656, 0.1331329345703125, 0.13855552673339844, 0.14397811889648438, 0.1494007110595703, 0.15482330322265625, 0.1602458953857422, 0.16566848754882812, 0.17109107971191406, 0.176513671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 8.0, 11.0, 19.0, 10.0, 23.0, 22.0, 16.0, 33.0, 54.0, 47.0, 60.0, 69.0, 74.0, 83.0, 74.0, 67.0, 59.0, 65.0, 31.0, 33.0, 30.0, 22.0, 15.0, 19.0, 6.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10870552062988281, -0.10425186157226562, -0.09979820251464844, -0.09534454345703125, -0.09089088439941406, -0.08643722534179688, -0.08198356628417969, -0.0775299072265625, -0.07307624816894531, -0.06862258911132812, -0.06416893005371094, -0.05971527099609375, -0.05526161193847656, -0.050807952880859375, -0.04635429382324219, -0.041900634765625, -0.03744697570800781, -0.032993316650390625, -0.028539657592773438, -0.02408599853515625, -0.019632339477539062, -0.015178680419921875, -0.010725021362304688, -0.0062713623046875, -0.0018177032470703125, 0.002635955810546875, 0.0070896148681640625, 0.01154327392578125, 0.015996932983398438, 0.020450592041015625, 0.024904251098632812, 0.02935791015625, 0.03381156921386719, 0.038265228271484375, 0.04271888732910156, 0.04717254638671875, 0.05162620544433594, 0.056079864501953125, 0.06053352355957031, 0.0649871826171875, 0.06944084167480469, 0.07389450073242188, 0.07834815979003906, 0.08280181884765625, 0.08725547790527344, 0.09170913696289062, 0.09616279602050781, 0.100616455078125, 0.10507011413574219, 0.10952377319335938, 0.11397743225097656, 0.11843109130859375, 0.12288475036621094, 0.12733840942382812, 0.1317920684814453, 0.1362457275390625, 0.1406993865966797, 0.14515304565429688, 0.14960670471191406, 0.15406036376953125, 0.15851402282714844, 0.16296768188476562, 0.1674213409423828, 0.171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 5.0, 10.0, 11.0, 43.0, 63.0, 99.0, 149.0, 212.0, 165.0, 109.0, 53.0, 35.0, 10.0, 12.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661623001098633, -2.5535011291503906, -2.4453794956207275, -2.3372576236724854, -2.2291359901428223, -2.12101411819458, -2.012892246246338, -1.9047706127166748, -1.7966487407684326, -1.68852698802948, -1.5804052352905273, -1.4722833633422852, -1.3641616106033325, -1.2560398578643799, -1.1479181051254272, -1.0397963523864746, -0.931674599647522, -0.8235528469085693, -0.7154310345649719, -0.6073092818260193, -0.49918749928474426, -0.39106571674346924, -0.2829439640045166, -0.1748221516609192, -0.06670039892196655, 0.041421376168727875, 0.1495431512594223, 0.25766491889953613, 0.36578670144081116, 0.4739084839820862, 0.5820302367210388, 0.6901520490646362, 0.7982738018035889, 0.9063955545425415, 1.0145173072814941, 1.1226391792297363, 1.230760931968689, 1.3388826847076416, 1.4470044374465942, 1.5551261901855469, 1.663248062133789, 1.7713698148727417, 1.8794915676116943, 1.9876134395599365, 2.0957350730895996, 2.203856945037842, 2.311978816986084, 2.420100450515747, 2.52822208404541, 2.6363439559936523, 2.7444655895233154, 2.8525874614715576, 2.9607090950012207, 3.068830966949463, 3.176952838897705, 3.285074472427368, 3.3931963443756104, 3.5013182163238525, 3.6094398498535156, 3.717561721801758, 3.825683355331421, 3.933805227279663, 4.041926860809326, 4.150048732757568, 4.2581706047058105]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 9.0, 3.0, 7.0, 4.0, 7.0, 14.0, 15.0, 14.0, 12.0, 17.0, 16.0, 32.0, 21.0, 25.0, 38.0, 44.0, 38.0, 36.0, 62.0, 56.0, 48.0, 45.0, 45.0, 49.0, 46.0, 30.0, 32.0, 35.0, 22.0, 35.0, 27.0, 23.0, 11.0, 13.0, 17.0, 6.0, 8.0, 7.0, 7.0, 1.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.1636312007904053, -2.1042208671569824, -2.0448105335235596, -1.9854000806808472, -1.9259897470474243, -1.8665794134140015, -1.8071690797805786, -1.7477586269378662, -1.6883482933044434, -1.6289379596710205, -1.5695276260375977, -1.5101171731948853, -1.4507068395614624, -1.3912965059280396, -1.3318861722946167, -1.2724757194519043, -1.2130653858184814, -1.1536550521850586, -1.0942447185516357, -1.0348342657089233, -0.9754239320755005, -0.9160135984420776, -0.8566032648086548, -0.7971928715705872, -0.7377825975418091, -0.6783722639083862, -0.6189618706703186, -0.5595515370368958, -0.5001411437988281, -0.4407308101654053, -0.38132044672966003, -0.3219100832939148, -0.26249969005584717, -0.20308932662010193, -0.1436789631843567, -0.08426861464977264, -0.024858251214027405, 0.03455209732055664, 0.09396246075630188, 0.15337282419204712, 0.21278318762779236, 0.2721935510635376, 0.33160391449928284, 0.3910142779350281, 0.4504246115684509, 0.5098350048065186, 0.5692453384399414, 0.6286556720733643, 0.6880660653114319, 0.7474763989448547, 0.8068867921829224, 0.8662971258163452, 0.9257075190544128, 0.9851178526878357, 1.0445282459259033, 1.1039385795593262, 1.163348913192749, 1.2227592468261719, 1.2821695804595947, 1.3415800333023071, 1.40099036693573, 1.4604007005691528, 1.5198110342025757, 1.579221487045288, 1.638631820678711]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 8.0, 4.0, 11.0, 14.0, 21.0, 24.0, 45.0, 54.0, 89.0, 172.0, 320.0, 728.0, 1696.0, 4621.0, 14819.0, 75555.0, 1213364.0, 2719962.0, 131114.0, 21756.0, 5965.0, 2074.0, 858.0, 419.0, 224.0, 98.0, 84.0, 43.0, 29.0, 28.0, 16.0, 13.0, 6.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2625617980957031, -0.25412750244140625, -0.24569320678710938, -0.2372589111328125, -0.22882461547851562, -0.22039031982421875, -0.21195602416992188, -0.203521728515625, -0.19508743286132812, -0.18665313720703125, -0.17821884155273438, -0.1697845458984375, -0.16135025024414062, -0.15291595458984375, -0.14448165893554688, -0.13604736328125, -0.12761306762695312, -0.11917877197265625, -0.11074447631835938, -0.1023101806640625, -0.09387588500976562, -0.08544158935546875, -0.07700729370117188, -0.068572998046875, -0.060138702392578125, -0.05170440673828125, -0.043270111083984375, -0.0348358154296875, -0.026401519775390625, -0.01796722412109375, -0.009532928466796875, -0.0010986328125, 0.007335662841796875, 0.01576995849609375, 0.024204254150390625, 0.0326385498046875, 0.041072845458984375, 0.04950714111328125, 0.057941436767578125, 0.066375732421875, 0.07481002807617188, 0.08324432373046875, 0.09167861938476562, 0.1001129150390625, 0.10854721069335938, 0.11698150634765625, 0.12541580200195312, 0.13385009765625, 0.14228439331054688, 0.15071868896484375, 0.15915298461914062, 0.1675872802734375, 0.17602157592773438, 0.18445587158203125, 0.19289016723632812, 0.201324462890625, 0.20975875854492188, 0.21819305419921875, 0.22662734985351562, 0.2350616455078125, 0.24349594116210938, 0.25193023681640625, 0.2603645324707031, 0.268798828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 12.0, 18.0, 17.0, 29.0, 33.0, 46.0, 57.0, 43.0, 58.0, 80.0, 55.0, 68.0, 76.0, 73.0, 60.0, 52.0, 41.0, 38.0, 39.0, 16.0, 16.0, 14.0, 12.0, 6.0, 11.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14346694946289062, -0.13874053955078125, -0.13401412963867188, -0.1292877197265625, -0.12456130981445312, -0.11983489990234375, -0.11510848999023438, -0.110382080078125, -0.10565567016601562, -0.10092926025390625, -0.09620285034179688, -0.0914764404296875, -0.08675003051757812, -0.08202362060546875, -0.07729721069335938, -0.07257080078125, -0.06784439086914062, -0.06311798095703125, -0.058391571044921875, -0.0536651611328125, -0.048938751220703125, -0.04421234130859375, -0.039485931396484375, -0.034759521484375, -0.030033111572265625, -0.02530670166015625, -0.020580291748046875, -0.0158538818359375, -0.011127471923828125, -0.00640106201171875, -0.001674652099609375, 0.0030517578125, 0.007778167724609375, 0.01250457763671875, 0.017230987548828125, 0.0219573974609375, 0.026683807373046875, 0.03141021728515625, 0.036136627197265625, 0.040863037109375, 0.045589447021484375, 0.05031585693359375, 0.055042266845703125, 0.0597686767578125, 0.06449508666992188, 0.06922149658203125, 0.07394790649414062, 0.07867431640625, 0.08340072631835938, 0.08812713623046875, 0.09285354614257812, 0.0975799560546875, 0.10230636596679688, 0.10703277587890625, 0.11175918579101562, 0.116485595703125, 0.12121200561523438, 0.12593841552734375, 0.13066482543945312, 0.1353912353515625, 0.14011764526367188, 0.14484405517578125, 0.14957046508789062, 0.154296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 8.0, 18.0, 18.0, 34.0, 50.0, 99.0, 167.0, 250.0, 457.0, 796.0, 1556.0, 3315.0, 6806.0, 16530.0, 46498.0, 183244.0, 1551741.0, 2075879.0, 222980.0, 51840.0, 17943.0, 7180.0, 3278.0, 1552.0, 886.0, 421.0, 274.0, 180.0, 109.0, 57.0, 36.0, 28.0, 13.0, 12.0, 11.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.24755859375, -0.2406940460205078, -0.23382949829101562, -0.22696495056152344, -0.22010040283203125, -0.21323585510253906, -0.20637130737304688, -0.1995067596435547, -0.1926422119140625, -0.1857776641845703, -0.17891311645507812, -0.17204856872558594, -0.16518402099609375, -0.15831947326660156, -0.15145492553710938, -0.1445903778076172, -0.137725830078125, -0.1308612823486328, -0.12399673461914062, -0.11713218688964844, -0.11026763916015625, -0.10340309143066406, -0.09653854370117188, -0.08967399597167969, -0.0828094482421875, -0.07594490051269531, -0.06908035278320312, -0.06221580505371094, -0.05535125732421875, -0.04848670959472656, -0.041622161865234375, -0.03475761413574219, -0.02789306640625, -0.021028518676757812, -0.014163970947265625, -0.0072994232177734375, -0.00043487548828125, 0.0064296722412109375, 0.013294219970703125, 0.020158767700195312, 0.0270233154296875, 0.03388786315917969, 0.040752410888671875, 0.04761695861816406, 0.05448150634765625, 0.06134605407714844, 0.06821060180664062, 0.07507514953613281, 0.081939697265625, 0.08880424499511719, 0.09566879272460938, 0.10253334045410156, 0.10939788818359375, 0.11626243591308594, 0.12312698364257812, 0.1299915313720703, 0.1368560791015625, 0.1437206268310547, 0.15058517456054688, 0.15744972229003906, 0.16431427001953125, 0.17117881774902344, 0.17804336547851562, 0.1849079132080078, 0.1917724609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 5.0, 6.0, 11.0, 17.0, 12.0, 16.0, 21.0, 25.0, 36.0, 69.0, 91.0, 112.0, 174.0, 278.0, 435.0, 702.0, 728.0, 464.0, 331.0, 170.0, 101.0, 60.0, 48.0, 37.0, 28.0, 20.0, 12.0, 14.0, 11.0, 9.0, 6.0, 4.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.284423828125, -0.2760581970214844, -0.26769256591796875, -0.2593269348144531, -0.2509613037109375, -0.24259567260742188, -0.23423004150390625, -0.22586441040039062, -0.217498779296875, -0.20913314819335938, -0.20076751708984375, -0.19240188598632812, -0.1840362548828125, -0.17567062377929688, -0.16730499267578125, -0.15893936157226562, -0.15057373046875, -0.14220809936523438, -0.13384246826171875, -0.12547683715820312, -0.1171112060546875, -0.10874557495117188, -0.10037994384765625, -0.09201431274414062, -0.083648681640625, -0.07528305053710938, -0.06691741943359375, -0.058551788330078125, -0.0501861572265625, -0.041820526123046875, -0.03345489501953125, -0.025089263916015625, -0.0167236328125, -0.008358001708984375, 7.62939453125e-06, 0.008373260498046875, 0.0167388916015625, 0.025104522705078125, 0.03347015380859375, 0.041835784912109375, 0.050201416015625, 0.058567047119140625, 0.06693267822265625, 0.07529830932617188, 0.0836639404296875, 0.09202957153320312, 0.10039520263671875, 0.10876083374023438, 0.11712646484375, 0.12549209594726562, 0.13385772705078125, 0.14222335815429688, 0.1505889892578125, 0.15895462036132812, 0.16732025146484375, 0.17568588256835938, 0.184051513671875, 0.19241714477539062, 0.20078277587890625, 0.20914840698242188, 0.2175140380859375, 0.22587966918945312, 0.23424530029296875, 0.24261093139648438, 0.2509765625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 15.0, 17.0, 65.0, 119.0, 242.0, 246.0, 165.0, 66.0, 26.0, 10.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50014591217041, -5.373208999633789, -5.24627161026001, -5.1193342208862305, -4.992397308349609, -4.865460395812988, -4.738523006439209, -4.61158561706543, -4.484648704528809, -4.3577117919921875, -4.230774402618408, -4.103837013244629, -3.976900100708008, -3.8499629497528076, -3.7230257987976074, -3.5960886478424072, -3.469151496887207, -3.342214345932007, -3.2152771949768066, -3.0883400440216064, -2.9614028930664062, -2.834465742111206, -2.707528591156006, -2.5805914402008057, -2.4536542892456055, -2.3267171382904053, -2.199779987335205, -2.072842836380005, -1.9459056854248047, -1.8189685344696045, -1.6920313835144043, -1.565094232559204, -1.438157081604004, -1.3112199306488037, -1.1842827796936035, -1.0573456287384033, -0.9304084777832031, -0.8034713268280029, -0.6765341758728027, -0.5495970249176025, -0.42265987396240234, -0.29572272300720215, -0.16878557205200195, -0.04184842109680176, 0.08508872985839844, 0.21202588081359863, 0.33896303176879883, 0.465900182723999, 0.5928373336791992, 0.7197744846343994, 0.8467116355895996, 0.9736487865447998, 1.1005859375, 1.2275230884552002, 1.3544602394104004, 1.4813973903656006, 1.6083345413208008, 1.735271692276001, 1.8622088432312012, 1.9891459941864014, 2.1160831451416016, 2.2430202960968018, 2.369957447052002, 2.496894598007202, 2.6238317489624023]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 6.0, 14.0, 14.0, 25.0, 27.0, 22.0, 37.0, 42.0, 36.0, 46.0, 40.0, 52.0, 48.0, 62.0, 65.0, 57.0, 51.0, 55.0, 39.0, 38.0, 34.0, 29.0, 27.0, 23.0, 19.0, 15.0, 9.0, 12.0, 10.0, 4.0, 4.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5750240087509155, -1.5291730165481567, -1.4833221435546875, -1.4374711513519287, -1.39162015914917, -1.3457691669464111, -1.299918293952942, -1.254067301750183, -1.2082164287567139, -1.162365436553955, -1.1165145635604858, -1.070663571357727, -1.0248125791549683, -0.9789616465568542, -0.9331107139587402, -0.8872597217559814, -0.8414087295532227, -0.7955577969551086, -0.7497068047523499, -0.7038558721542358, -0.658004879951477, -0.612153947353363, -0.566303014755249, -0.5204520225524902, -0.4746010899543762, -0.4287501275539398, -0.3828991651535034, -0.3370482325553894, -0.291197270154953, -0.2453463077545166, -0.1994953751564026, -0.1536444127559662, -0.10779345035552979, -0.06194249540567398, -0.016091540455818176, 0.02975940704345703, 0.07561036944389343, 0.12146133184432983, 0.16731226444244385, 0.21316322684288025, 0.25901418924331665, 0.30486515164375305, 0.35071611404418945, 0.39656704664230347, 0.44241800904273987, 0.48826897144317627, 0.5341199040412903, 0.5799708366394043, 0.6258218288421631, 0.6716727614402771, 0.7175237536430359, 0.7633746862411499, 0.8092256784439087, 0.8550766110420227, 0.9009275436401367, 0.9467785358428955, 0.9926294684410095, 1.0384804010391235, 1.0843313932418823, 1.1301822662353516, 1.1760332584381104, 1.2218842506408691, 1.267735242843628, 1.3135861158370972, 1.359437108039856]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 12.0, 15.0, 17.0, 27.0, 41.0, 61.0, 99.0, 136.0, 198.0, 386.0, 574.0, 856.0, 1383.0, 2257.0, 3690.0, 6558.0, 12295.0, 22965.0, 49836.0, 131136.0, 349574.0, 284315.0, 98631.0, 39669.0, 19256.0, 10178.0, 5664.0, 3282.0, 2040.0, 1219.0, 732.0, 500.0, 336.0, 202.0, 134.0, 93.0, 62.0, 49.0, 24.0, 13.0, 7.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.1807861328125, -0.17528533935546875, -0.1697845458984375, -0.16428375244140625, -0.158782958984375, -0.15328216552734375, -0.1477813720703125, -0.14228057861328125, -0.13677978515625, -0.13127899169921875, -0.1257781982421875, -0.12027740478515625, -0.114776611328125, -0.10927581787109375, -0.1037750244140625, -0.09827423095703125, -0.0927734375, -0.08727264404296875, -0.0817718505859375, -0.07627105712890625, -0.070770263671875, -0.06526947021484375, -0.0597686767578125, -0.05426788330078125, -0.04876708984375, -0.04326629638671875, -0.0377655029296875, -0.03226470947265625, -0.026763916015625, -0.02126312255859375, -0.0157623291015625, -0.01026153564453125, -0.0047607421875, 0.00074005126953125, 0.0062408447265625, 0.01174163818359375, 0.017242431640625, 0.02274322509765625, 0.0282440185546875, 0.03374481201171875, 0.03924560546875, 0.04474639892578125, 0.0502471923828125, 0.05574798583984375, 0.061248779296875, 0.06674957275390625, 0.0722503662109375, 0.07775115966796875, 0.083251953125, 0.08875274658203125, 0.0942535400390625, 0.09975433349609375, 0.105255126953125, 0.11075592041015625, 0.1162567138671875, 0.12175750732421875, 0.12725830078125, 0.13275909423828125, 0.1382598876953125, 0.14376068115234375, 0.149261474609375, 0.15476226806640625, 0.1602630615234375, 0.16576385498046875, 0.1712646484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 6.0, 9.0, 5.0, 11.0, 12.0, 19.0, 15.0, 26.0, 29.0, 22.0, 35.0, 28.0, 36.0, 45.0, 40.0, 50.0, 38.0, 38.0, 53.0, 49.0, 43.0, 40.0, 35.0, 35.0, 32.0, 39.0, 34.0, 23.0, 22.0, 24.0, 25.0, 11.0, 14.0, 12.0, 6.0, 5.0, 8.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.10479736328125, -0.10155773162841797, -0.09831809997558594, -0.0950784683227539, -0.09183883666992188, -0.08859920501708984, -0.08535957336425781, -0.08211994171142578, -0.07888031005859375, -0.07564067840576172, -0.07240104675292969, -0.06916141510009766, -0.06592178344726562, -0.0626821517944336, -0.05944252014160156, -0.05620288848876953, -0.0529632568359375, -0.04972362518310547, -0.04648399353027344, -0.043244361877441406, -0.040004730224609375, -0.036765098571777344, -0.03352546691894531, -0.03028583526611328, -0.02704620361328125, -0.02380657196044922, -0.020566940307617188, -0.017327308654785156, -0.014087677001953125, -0.010848045349121094, -0.0076084136962890625, -0.004368782043457031, -0.001129150390625, 0.0021104812622070312, 0.0053501129150390625, 0.008589744567871094, 0.011829376220703125, 0.015069007873535156, 0.018308639526367188, 0.02154827117919922, 0.02478790283203125, 0.02802753448486328, 0.03126716613769531, 0.034506797790527344, 0.037746429443359375, 0.040986061096191406, 0.04422569274902344, 0.04746532440185547, 0.0507049560546875, 0.05394458770751953, 0.05718421936035156, 0.060423851013183594, 0.06366348266601562, 0.06690311431884766, 0.07014274597167969, 0.07338237762451172, 0.07662200927734375, 0.07986164093017578, 0.08310127258300781, 0.08634090423583984, 0.08958053588867188, 0.0928201675415039, 0.09605979919433594, 0.09929943084716797, 0.1025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 11.0, 9.0, 25.0, 28.0, 31.0, 40.0, 64.0, 123.0, 158.0, 331.0, 613.0, 1243.0, 2882.0, 9557.0, 48180.0, 694315.0, 254192.0, 26207.0, 6330.0, 2100.0, 890.0, 502.0, 258.0, 160.0, 96.0, 69.0, 35.0, 25.0, 19.0, 17.0, 16.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.438720703125, -0.4240150451660156, -0.40930938720703125, -0.3946037292480469, -0.3798980712890625, -0.3651924133300781, -0.35048675537109375, -0.3357810974121094, -0.321075439453125, -0.3063697814941406, -0.29166412353515625, -0.2769584655761719, -0.2622528076171875, -0.24754714965820312, -0.23284149169921875, -0.21813583374023438, -0.20343017578125, -0.18872451782226562, -0.17401885986328125, -0.15931320190429688, -0.1446075439453125, -0.12990188598632812, -0.11519622802734375, -0.10049057006835938, -0.085784912109375, -0.07107925415039062, -0.05637359619140625, -0.041667938232421875, -0.0269622802734375, -0.012256622314453125, 0.00244903564453125, 0.017154693603515625, 0.0318603515625, 0.046566009521484375, 0.06127166748046875, 0.07597732543945312, 0.0906829833984375, 0.10538864135742188, 0.12009429931640625, 0.13479995727539062, 0.149505615234375, 0.16421127319335938, 0.17891693115234375, 0.19362258911132812, 0.2083282470703125, 0.22303390502929688, 0.23773956298828125, 0.2524452209472656, 0.26715087890625, 0.2818565368652344, 0.29656219482421875, 0.3112678527832031, 0.3259735107421875, 0.3406791687011719, 0.35538482666015625, 0.3700904846191406, 0.384796142578125, 0.3995018005371094, 0.41420745849609375, 0.4289131164550781, 0.4436187744140625, 0.4583244323730469, 0.47303009033203125, 0.4877357482910156, 0.50244140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 9.0, 3.0, 6.0, 4.0, 12.0, 16.0, 23.0, 21.0, 28.0, 38.0, 31.0, 44.0, 47.0, 53.0, 58.0, 54.0, 66.0, 59.0, 58.0, 44.0, 50.0, 48.0, 41.0, 30.0, 39.0, 21.0, 30.0, 17.0, 10.0, 8.0, 7.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.57568359375, -0.5591812133789062, -0.5426788330078125, -0.5261764526367188, -0.509674072265625, -0.49317169189453125, -0.4766693115234375, -0.46016693115234375, -0.44366455078125, -0.42716217041015625, -0.4106597900390625, -0.39415740966796875, -0.377655029296875, -0.36115264892578125, -0.3446502685546875, -0.32814788818359375, -0.3116455078125, -0.29514312744140625, -0.2786407470703125, -0.26213836669921875, -0.245635986328125, -0.22913360595703125, -0.2126312255859375, -0.19612884521484375, -0.17962646484375, -0.16312408447265625, -0.1466217041015625, -0.13011932373046875, -0.113616943359375, -0.09711456298828125, -0.0806121826171875, -0.06410980224609375, -0.047607421875, -0.03110504150390625, -0.0146026611328125, 0.00189971923828125, 0.018402099609375, 0.03490447998046875, 0.0514068603515625, 0.06790924072265625, 0.08441162109375, 0.10091400146484375, 0.1174163818359375, 0.13391876220703125, 0.150421142578125, 0.16692352294921875, 0.1834259033203125, 0.19992828369140625, 0.2164306640625, 0.23293304443359375, 0.2494354248046875, 0.26593780517578125, 0.282440185546875, 0.29894256591796875, 0.3154449462890625, 0.33194732666015625, 0.34844970703125, 0.36495208740234375, 0.3814544677734375, 0.39795684814453125, 0.414459228515625, 0.43096160888671875, 0.4474639892578125, 0.46396636962890625, 0.48046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 8.0, 3.0, 5.0, 11.0, 14.0, 27.0, 38.0, 65.0, 91.0, 125.0, 194.0, 451.0, 921.0, 2129.0, 6293.0, 23568.0, 159366.0, 729027.0, 100394.0, 17379.0, 4995.0, 1760.0, 716.0, 411.0, 185.0, 119.0, 73.0, 70.0, 26.0, 27.0, 18.0, 12.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.16901206970214844, -0.16260910034179688, -0.1562061309814453, -0.14980316162109375, -0.1434001922607422, -0.13699722290039062, -0.13059425354003906, -0.1241912841796875, -0.11778831481933594, -0.11138534545898438, -0.10498237609863281, -0.09857940673828125, -0.09217643737792969, -0.08577346801757812, -0.07937049865722656, -0.072967529296875, -0.06656455993652344, -0.060161590576171875, -0.05375862121582031, -0.04735565185546875, -0.04095268249511719, -0.034549713134765625, -0.028146743774414062, -0.0217437744140625, -0.015340805053710938, -0.008937835693359375, -0.0025348663330078125, 0.00386810302734375, 0.010271072387695312, 0.016674041748046875, 0.023077011108398438, 0.02947998046875, 0.03588294982910156, 0.042285919189453125, 0.04868888854980469, 0.05509185791015625, 0.06149482727050781, 0.06789779663085938, 0.07430076599121094, 0.0807037353515625, 0.08710670471191406, 0.09350967407226562, 0.09991264343261719, 0.10631561279296875, 0.11271858215332031, 0.11912155151367188, 0.12552452087402344, 0.131927490234375, 0.13833045959472656, 0.14473342895507812, 0.1511363983154297, 0.15753936767578125, 0.1639423370361328, 0.17034530639648438, 0.17674827575683594, 0.1831512451171875, 0.18955421447753906, 0.19595718383789062, 0.2023601531982422, 0.20876312255859375, 0.2151660919189453, 0.22156906127929688, 0.22797203063964844, 0.234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 7.0, 11.0, 15.0, 11.0, 17.0, 17.0, 25.0, 26.0, 42.0, 51.0, 61.0, 70.0, 87.0, 112.0, 79.0, 72.0, 63.0, 58.0, 41.0, 26.0, 14.0, 10.0, 18.0, 10.0, 5.0, 5.0, 6.0, 6.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.513429641723633e-05, -5.342625081539154e-05, -5.171820521354675e-05, -5.0010159611701965e-05, -4.830211400985718e-05, -4.659406840801239e-05, -4.48860228061676e-05, -4.3177977204322815e-05, -4.146993160247803e-05, -3.976188600063324e-05, -3.805384039878845e-05, -3.6345794796943665e-05, -3.463774919509888e-05, -3.292970359325409e-05, -3.12216579914093e-05, -2.9513612389564514e-05, -2.7805566787719727e-05, -2.609752118587494e-05, -2.438947558403015e-05, -2.2681429982185364e-05, -2.0973384380340576e-05, -1.926533877849579e-05, -1.7557293176651e-05, -1.5849247574806213e-05, -1.4141201972961426e-05, -1.2433156371116638e-05, -1.072511076927185e-05, -9.017065167427063e-06, -7.309019565582275e-06, -5.600973963737488e-06, -3.8929283618927e-06, -2.1848827600479126e-06, -4.76837158203125e-07, 1.2312084436416626e-06, 2.93925404548645e-06, 4.647299647331238e-06, 6.355345249176025e-06, 8.063390851020813e-06, 9.7714364528656e-06, 1.1479482054710388e-05, 1.3187527656555176e-05, 1.4895573258399963e-05, 1.660361886024475e-05, 1.831166446208954e-05, 2.0019710063934326e-05, 2.1727755665779114e-05, 2.34358012676239e-05, 2.514384686946869e-05, 2.6851892471313477e-05, 2.8559938073158264e-05, 3.0267983675003052e-05, 3.197602927684784e-05, 3.368407487869263e-05, 3.5392120480537415e-05, 3.71001660823822e-05, 3.880821168422699e-05, 4.051625728607178e-05, 4.2224302887916565e-05, 4.393234848976135e-05, 4.564039409160614e-05, 4.734843969345093e-05, 4.9056485295295715e-05, 5.07645308971405e-05, 5.247257649898529e-05, 5.418062210083008e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 9.0, 18.0, 21.0, 33.0, 58.0, 97.0, 178.0, 363.0, 764.0, 2064.0, 7410.0, 47481.0, 722429.0, 240396.0, 20374.0, 4337.0, 1391.0, 579.0, 238.0, 117.0, 79.0, 43.0, 27.0, 13.0, 10.0, 8.0, 3.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2454833984375, -0.23751258850097656, -0.22954177856445312, -0.2215709686279297, -0.21360015869140625, -0.2056293487548828, -0.19765853881835938, -0.18968772888183594, -0.1817169189453125, -0.17374610900878906, -0.16577529907226562, -0.1578044891357422, -0.14983367919921875, -0.1418628692626953, -0.13389205932617188, -0.12592124938964844, -0.117950439453125, -0.10997962951660156, -0.10200881958007812, -0.09403800964355469, -0.08606719970703125, -0.07809638977050781, -0.07012557983398438, -0.06215476989746094, -0.0541839599609375, -0.04621315002441406, -0.038242340087890625, -0.030271530151367188, -0.02230072021484375, -0.014329910278320312, -0.006359100341796875, 0.0016117095947265625, 0.00958251953125, 0.017553329467773438, 0.025524139404296875, 0.03349494934082031, 0.04146575927734375, 0.04943656921386719, 0.057407379150390625, 0.06537818908691406, 0.0733489990234375, 0.08131980895996094, 0.08929061889648438, 0.09726142883300781, 0.10523223876953125, 0.11320304870605469, 0.12117385864257812, 0.12914466857910156, 0.137115478515625, 0.14508628845214844, 0.15305709838867188, 0.1610279083251953, 0.16899871826171875, 0.1769695281982422, 0.18494033813476562, 0.19291114807128906, 0.2008819580078125, 0.20885276794433594, 0.21682357788085938, 0.2247943878173828, 0.23276519775390625, 0.2407360076904297, 0.24870681762695312, 0.25667762756347656, 0.2646484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 14.0, 9.0, 13.0, 19.0, 22.0, 27.0, 46.0, 71.0, 75.0, 103.0, 118.0, 109.0, 84.0, 71.0, 58.0, 40.0, 26.0, 23.0, 17.0, 19.0, 8.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2354736328125, -0.2294139862060547, -0.22335433959960938, -0.21729469299316406, -0.21123504638671875, -0.20517539978027344, -0.19911575317382812, -0.1930561065673828, -0.1869964599609375, -0.1809368133544922, -0.17487716674804688, -0.16881752014160156, -0.16275787353515625, -0.15669822692871094, -0.15063858032226562, -0.1445789337158203, -0.138519287109375, -0.1324596405029297, -0.12639999389648438, -0.12034034729003906, -0.11428070068359375, -0.10822105407714844, -0.10216140747070312, -0.09610176086425781, -0.0900421142578125, -0.08398246765136719, -0.07792282104492188, -0.07186317443847656, -0.06580352783203125, -0.05974388122558594, -0.053684234619140625, -0.04762458801269531, -0.04156494140625, -0.03550529479980469, -0.029445648193359375, -0.023386001586914062, -0.01732635498046875, -0.011266708374023438, -0.005207061767578125, 0.0008525848388671875, 0.0069122314453125, 0.012971878051757812, 0.019031524658203125, 0.025091171264648438, 0.03115081787109375, 0.03721046447753906, 0.043270111083984375, 0.04932975769042969, 0.055389404296875, 0.06144905090332031, 0.06750869750976562, 0.07356834411621094, 0.07962799072265625, 0.08568763732910156, 0.09174728393554688, 0.09780693054199219, 0.1038665771484375, 0.10992622375488281, 0.11598587036132812, 0.12204551696777344, 0.12810516357421875, 0.13416481018066406, 0.14022445678710938, 0.1462841033935547, 0.15234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 6.0, 15.0, 25.0, 61.0, 145.0, 250.0, 267.0, 131.0, 56.0, 25.0, 6.0, 4.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.136523723602295, -3.000941276550293, -2.865358829498291, -2.72977614402771, -2.594193696975708, -2.458611249923706, -2.323028564453125, -2.187446117401123, -2.051863670349121, -1.9162812232971191, -1.7806986570358276, -1.6451160907745361, -1.5095336437225342, -1.3739511966705322, -1.2383686304092407, -1.1027860641479492, -0.9672036170959473, -0.8316211104393005, -0.6960386037826538, -0.5604560971260071, -0.42487359046936035, -0.2892910838127136, -0.1537085771560669, -0.018126070499420166, 0.11745643615722656, 0.2530389428138733, 0.38862144947052, 0.5242039561271667, 0.6597864627838135, 0.7953689694404602, 0.9309514760971069, 1.0665340423583984, 1.2021164894104004, 1.3376989364624023, 1.4732815027236938, 1.6088640689849854, 1.7444465160369873, 1.8800289630889893, 2.0156116485595703, 2.1511940956115723, 2.286776542663574, 2.422358989715576, 2.557941436767578, 2.693524122238159, 2.829106569290161, 2.964689016342163, 3.100271701812744, 3.235854148864746, 3.371436595916748, 3.50701904296875, 3.642601490020752, 3.778184175491333, 3.913766622543335, 4.049349308013916, 4.184931755065918, 4.32051420211792, 4.456096649169922, 4.591679096221924, 4.727261543273926, 4.862843990325928, 4.99842643737793, 5.13400936126709, 5.269591808319092, 5.405174255371094, 5.540756702423096]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 13.0, 20.0, 17.0, 13.0, 25.0, 29.0, 22.0, 38.0, 30.0, 33.0, 45.0, 49.0, 51.0, 50.0, 48.0, 61.0, 61.0, 54.0, 49.0, 41.0, 31.0, 35.0, 26.0, 22.0, 24.0, 20.0, 17.0, 8.0, 11.0, 4.0, 7.0, 6.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5769604444503784, -1.5185120105743408, -1.4600635766983032, -1.4016151428222656, -1.343166708946228, -1.2847182750701904, -1.2262698411941528, -1.1678214073181152, -1.1093729734420776, -1.05092453956604, -0.9924761056900024, -0.9340276718139648, -0.8755792379379272, -0.8171308040618896, -0.758682370185852, -0.7002339363098145, -0.6417855024337769, -0.5833370685577393, -0.5248886346817017, -0.46644020080566406, -0.40799176692962646, -0.34954333305358887, -0.29109489917755127, -0.23264646530151367, -0.17419803142547607, -0.11574959754943848, -0.05730116367340088, 0.0011472702026367188, 0.059595704078674316, 0.11804413795471191, 0.1764925718307495, 0.2349410057067871, 0.29338955879211426, 0.35183799266815186, 0.41028642654418945, 0.46873486042022705, 0.5271832942962646, 0.5856317281723022, 0.6440801620483398, 0.7025285959243774, 0.760977029800415, 0.8194254636764526, 0.8778738975524902, 0.9363223314285278, 0.9947707653045654, 1.053219199180603, 1.1116676330566406, 1.1701160669326782, 1.2285645008087158, 1.2870129346847534, 1.345461368560791, 1.4039098024368286, 1.4623582363128662, 1.5208066701889038, 1.5792551040649414, 1.637703537940979, 1.6961519718170166, 1.7546004056930542, 1.8130488395690918, 1.8714972734451294, 1.929945707321167, 1.9883941411972046, 2.046842575073242, 2.1052908897399902, 2.1637394428253174]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 8.0, 5.0, 2.0, 7.0, 11.0, 5.0, 15.0, 24.0, 23.0, 39.0, 52.0, 68.0, 104.0, 146.0, 253.0, 365.0, 625.0, 935.0, 1710.0, 3165.0, 5882.0, 11843.0, 25741.0, 62853.0, 182617.0, 659197.0, 1785870.0, 1024822.0, 273529.0, 87398.0, 34447.0, 15435.0, 7676.0, 3869.0, 2192.0, 1252.0, 801.0, 443.0, 281.0, 186.0, 136.0, 76.0, 60.0, 33.0, 21.0, 31.0, 12.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1337890625, -0.13003826141357422, -0.12628746032714844, -0.12253665924072266, -0.11878585815429688, -0.1150350570678711, -0.11128425598144531, -0.10753345489501953, -0.10378265380859375, -0.10003185272216797, -0.09628105163574219, -0.0925302505493164, -0.08877944946289062, -0.08502864837646484, -0.08127784729003906, -0.07752704620361328, -0.0737762451171875, -0.07002544403076172, -0.06627464294433594, -0.06252384185791016, -0.058773040771484375, -0.055022239685058594, -0.05127143859863281, -0.04752063751220703, -0.04376983642578125, -0.04001903533935547, -0.03626823425292969, -0.032517433166503906, -0.028766632080078125, -0.025015830993652344, -0.021265029907226562, -0.01751422882080078, -0.013763427734375, -0.010012626647949219, -0.0062618255615234375, -0.0025110244750976562, 0.001239776611328125, 0.004990577697753906, 0.008741378784179688, 0.012492179870605469, 0.01624298095703125, 0.01999378204345703, 0.023744583129882812, 0.027495384216308594, 0.031246185302734375, 0.034996986389160156, 0.03874778747558594, 0.04249858856201172, 0.0462493896484375, 0.05000019073486328, 0.05375099182128906, 0.057501792907714844, 0.061252593994140625, 0.0650033950805664, 0.06875419616699219, 0.07250499725341797, 0.07625579833984375, 0.08000659942626953, 0.08375740051269531, 0.0875082015991211, 0.09125900268554688, 0.09500980377197266, 0.09876060485839844, 0.10251140594482422, 0.10626220703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 11.0, 17.0, 17.0, 28.0, 36.0, 39.0, 42.0, 54.0, 62.0, 68.0, 57.0, 70.0, 68.0, 55.0, 70.0, 52.0, 50.0, 44.0, 40.0, 29.0, 17.0, 25.0, 17.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1878662109375, -0.18338871002197266, -0.1789112091064453, -0.17443370819091797, -0.16995620727539062, -0.16547870635986328, -0.16100120544433594, -0.1565237045288086, -0.15204620361328125, -0.1475687026977539, -0.14309120178222656, -0.13861370086669922, -0.13413619995117188, -0.12965869903564453, -0.1251811981201172, -0.12070369720458984, -0.1162261962890625, -0.11174869537353516, -0.10727119445800781, -0.10279369354248047, -0.09831619262695312, -0.09383869171142578, -0.08936119079589844, -0.0848836898803711, -0.08040618896484375, -0.0759286880493164, -0.07145118713378906, -0.06697368621826172, -0.062496185302734375, -0.05801868438720703, -0.05354118347167969, -0.049063682556152344, -0.044586181640625, -0.040108680725097656, -0.03563117980957031, -0.03115367889404297, -0.026676177978515625, -0.02219867706298828, -0.017721176147460938, -0.013243675231933594, -0.00876617431640625, -0.004288673400878906, 0.0001888275146484375, 0.004666328430175781, 0.009143829345703125, 0.013621330261230469, 0.018098831176757812, 0.022576332092285156, 0.0270538330078125, 0.031531333923339844, 0.03600883483886719, 0.04048633575439453, 0.044963836669921875, 0.04944133758544922, 0.05391883850097656, 0.058396339416503906, 0.06287384033203125, 0.0673513412475586, 0.07182884216308594, 0.07630634307861328, 0.08078384399414062, 0.08526134490966797, 0.08973884582519531, 0.09421634674072266, 0.09869384765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 23.0, 34.0, 55.0, 93.0, 192.0, 376.0, 796.0, 2085.0, 5852.0, 21323.0, 105633.0, 1117408.0, 2663998.0, 222047.0, 38343.0, 9975.0, 3284.0, 1401.0, 643.0, 317.0, 157.0, 103.0, 54.0, 23.0, 21.0, 15.0, 9.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.3075218200683594, -0.29766082763671875, -0.2877998352050781, -0.2779388427734375, -0.2680778503417969, -0.25821685791015625, -0.24835586547851562, -0.238494873046875, -0.22863388061523438, -0.21877288818359375, -0.20891189575195312, -0.1990509033203125, -0.18918991088867188, -0.17932891845703125, -0.16946792602539062, -0.15960693359375, -0.14974594116210938, -0.13988494873046875, -0.13002395629882812, -0.1201629638671875, -0.11030197143554688, -0.10044097900390625, -0.09057998657226562, -0.080718994140625, -0.07085800170898438, -0.06099700927734375, -0.051136016845703125, -0.0412750244140625, -0.031414031982421875, -0.02155303955078125, -0.011692047119140625, -0.0018310546875, 0.008029937744140625, 0.01789093017578125, 0.027751922607421875, 0.0376129150390625, 0.047473907470703125, 0.05733489990234375, 0.06719589233398438, 0.077056884765625, 0.08691787719726562, 0.09677886962890625, 0.10663986206054688, 0.1165008544921875, 0.12636184692382812, 0.13622283935546875, 0.14608383178710938, 0.15594482421875, 0.16580581665039062, 0.17566680908203125, 0.18552780151367188, 0.1953887939453125, 0.20524978637695312, 0.21511077880859375, 0.22497177124023438, 0.234832763671875, 0.24469375610351562, 0.25455474853515625, 0.2644157409667969, 0.2742767333984375, 0.2841377258300781, 0.29399871826171875, 0.3038597106933594, 0.313720703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 11.0, 6.0, 14.0, 16.0, 20.0, 20.0, 35.0, 41.0, 55.0, 71.0, 91.0, 138.0, 185.0, 266.0, 331.0, 438.0, 491.0, 478.0, 356.0, 254.0, 154.0, 146.0, 100.0, 72.0, 56.0, 44.0, 36.0, 21.0, 21.0, 18.0, 14.0, 10.0, 9.0, 18.0, 3.0, 14.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.231201171875, -0.22312545776367188, -0.21504974365234375, -0.20697402954101562, -0.1988983154296875, -0.19082260131835938, -0.18274688720703125, -0.17467117309570312, -0.166595458984375, -0.15851974487304688, -0.15044403076171875, -0.14236831665039062, -0.1342926025390625, -0.12621688842773438, -0.11814117431640625, -0.11006546020507812, -0.10198974609375, -0.09391403198242188, -0.08583831787109375, -0.07776260375976562, -0.0696868896484375, -0.061611175537109375, -0.05353546142578125, -0.045459747314453125, -0.037384033203125, -0.029308319091796875, -0.02123260498046875, -0.013156890869140625, -0.0050811767578125, 0.002994537353515625, 0.01107025146484375, 0.019145965576171875, 0.0272216796875, 0.035297393798828125, 0.04337310791015625, 0.051448822021484375, 0.0595245361328125, 0.06760025024414062, 0.07567596435546875, 0.08375167846679688, 0.091827392578125, 0.09990310668945312, 0.10797882080078125, 0.11605453491210938, 0.1241302490234375, 0.13220596313476562, 0.14028167724609375, 0.14835739135742188, 0.15643310546875, 0.16450881958007812, 0.17258453369140625, 0.18066024780273438, 0.1887359619140625, 0.19681167602539062, 0.20488739013671875, 0.21296310424804688, 0.221038818359375, 0.22911453247070312, 0.23719024658203125, 0.24526596069335938, 0.2533416748046875, 0.2614173889160156, 0.26949310302734375, 0.2775688171386719, 0.28564453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 13.0, 29.0, 100.0, 253.0, 358.0, 159.0, 48.0, 16.0, 10.0, 4.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.392030715942383, -8.187795639038086, -7.983559608459473, -7.779324054718018, -7.5750885009765625, -7.370852947235107, -7.166617393493652, -6.962381839752197, -6.758146286010742, -6.553910732269287, -6.349675178527832, -6.145439624786377, -5.941204071044922, -5.736968517303467, -5.532732963562012, -5.328497409820557, -5.124261856079102, -4.9200263023376465, -4.715790748596191, -4.511555194854736, -4.307319641113281, -4.103084087371826, -3.898848533630371, -3.694612979888916, -3.490377426147461, -3.286141872406006, -3.081906318664551, -2.8776707649230957, -2.6734352111816406, -2.4691996574401855, -2.2649641036987305, -2.0607285499572754, -1.8564934730529785, -1.6522579193115234, -1.4480223655700684, -1.2437868118286133, -1.0395512580871582, -0.8353157043457031, -0.631080150604248, -0.42684459686279297, -0.2226090431213379, -0.018373489379882812, 0.18586206436157227, 0.39009761810302734, 0.5943331718444824, 0.7985687255859375, 1.0028042793273926, 1.2070398330688477, 1.4112753868103027, 1.6155109405517578, 1.819746494293213, 2.023982048034668, 2.228217601776123, 2.432453155517578, 2.636688709259033, 2.8409242630004883, 3.0451598167419434, 3.2493953704833984, 3.4536309242248535, 3.6578664779663086, 3.8621020317077637, 4.066337585449219, 4.270573139190674, 4.474808692932129, 4.679044246673584]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 1.0, 6.0, 9.0, 8.0, 14.0, 15.0, 10.0, 18.0, 20.0, 22.0, 27.0, 38.0, 35.0, 40.0, 43.0, 36.0, 43.0, 50.0, 40.0, 42.0, 44.0, 37.0, 47.0, 31.0, 37.0, 38.0, 30.0, 31.0, 32.0, 22.0, 20.0, 18.0, 20.0, 12.0, 16.0, 10.0, 3.0, 9.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1628868579864502, -1.1204020977020264, -1.077917456626892, -1.0354326963424683, -0.9929479956626892, -0.9504632949829102, -0.9079785346984863, -0.8654938340187073, -0.8230091333389282, -0.7805244326591492, -0.7380396723747253, -0.6955549716949463, -0.6530702710151672, -0.6105855703353882, -0.5681008100509644, -0.5256161093711853, -0.4831313490867615, -0.44064661860466003, -0.398161917924881, -0.35567718744277954, -0.3131924867630005, -0.27070775628089905, -0.2282230257987976, -0.18573832511901855, -0.14325359463691711, -0.10076887905597687, -0.058284156024456024, -0.01579943299293518, 0.026685282588005066, 0.06916999816894531, 0.11165472865104675, 0.1541394293308258, 0.19662415981292725, 0.2391088753938675, 0.28159359097480774, 0.3240783214569092, 0.36656302213668823, 0.4090477526187897, 0.4515324831008911, 0.49401718378067017, 0.5365018844604492, 0.5789865851402283, 0.6214713454246521, 0.6639560461044312, 0.7064407467842102, 0.7489254474639893, 0.7914102077484131, 0.8338949084281921, 0.876379668712616, 0.918864369392395, 0.9613491296768188, 1.0038337707519531, 1.046318531036377, 1.0888032913208008, 1.1312880516052246, 1.1737726926803589, 1.2162574529647827, 1.2587422132492065, 1.3012268543243408, 1.3437116146087646, 1.3861963748931885, 1.4286810159683228, 1.4711657762527466, 1.5136504173278809, 1.5561351776123047]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 9.0, 18.0, 20.0, 35.0, 58.0, 86.0, 102.0, 162.0, 294.0, 447.0, 795.0, 1255.0, 2303.0, 4278.0, 7832.0, 15813.0, 32746.0, 69091.0, 162592.0, 346912.0, 226870.0, 92236.0, 41725.0, 20201.0, 10382.0, 5301.0, 2839.0, 1696.0, 970.0, 541.0, 343.0, 234.0, 109.0, 71.0, 62.0, 47.0, 22.0, 13.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2041015625, -0.19765853881835938, -0.19121551513671875, -0.18477249145507812, -0.1783294677734375, -0.17188644409179688, -0.16544342041015625, -0.15900039672851562, -0.152557373046875, -0.14611434936523438, -0.13967132568359375, -0.13322830200195312, -0.1267852783203125, -0.12034225463867188, -0.11389923095703125, -0.10745620727539062, -0.10101318359375, -0.09457015991210938, -0.08812713623046875, -0.08168411254882812, -0.0752410888671875, -0.06879806518554688, -0.06235504150390625, -0.055912017822265625, -0.049468994140625, -0.043025970458984375, -0.03658294677734375, -0.030139923095703125, -0.0236968994140625, -0.017253875732421875, -0.01081085205078125, -0.004367828369140625, 0.0020751953125, 0.008518218994140625, 0.01496124267578125, 0.021404266357421875, 0.0278472900390625, 0.034290313720703125, 0.04073333740234375, 0.047176361083984375, 0.053619384765625, 0.060062408447265625, 0.06650543212890625, 0.07294845581054688, 0.0793914794921875, 0.08583450317382812, 0.09227752685546875, 0.09872055053710938, 0.10516357421875, 0.11160659790039062, 0.11804962158203125, 0.12449264526367188, 0.1309356689453125, 0.13737869262695312, 0.14382171630859375, 0.15026473999023438, 0.156707763671875, 0.16315078735351562, 0.16959381103515625, 0.17603683471679688, 0.1824798583984375, 0.18892288208007812, 0.19536590576171875, 0.20180892944335938, 0.208251953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 9.0, 12.0, 14.0, 16.0, 17.0, 21.0, 17.0, 22.0, 28.0, 32.0, 31.0, 33.0, 45.0, 40.0, 55.0, 40.0, 52.0, 40.0, 39.0, 35.0, 38.0, 41.0, 40.0, 48.0, 28.0, 30.0, 39.0, 17.0, 23.0, 19.0, 8.0, 12.0, 14.0, 9.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.10635948181152344, -0.10316085815429688, -0.09996223449707031, -0.09676361083984375, -0.09356498718261719, -0.09036636352539062, -0.08716773986816406, -0.0839691162109375, -0.08077049255371094, -0.07757186889648438, -0.07437324523925781, -0.07117462158203125, -0.06797599792480469, -0.06477737426757812, -0.06157875061035156, -0.058380126953125, -0.05518150329589844, -0.051982879638671875, -0.04878425598144531, -0.04558563232421875, -0.04238700866699219, -0.039188385009765625, -0.03598976135253906, -0.0327911376953125, -0.029592514038085938, -0.026393890380859375, -0.023195266723632812, -0.01999664306640625, -0.016798019409179688, -0.013599395751953125, -0.010400772094726562, -0.0072021484375, -0.0040035247802734375, -0.000804901123046875, 0.0023937225341796875, 0.00559234619140625, 0.008790969848632812, 0.011989593505859375, 0.015188217163085938, 0.0183868408203125, 0.021585464477539062, 0.024784088134765625, 0.027982711791992188, 0.03118133544921875, 0.03437995910644531, 0.037578582763671875, 0.04077720642089844, 0.043975830078125, 0.04717445373535156, 0.050373077392578125, 0.05357170104980469, 0.05677032470703125, 0.05996894836425781, 0.06316757202148438, 0.06636619567871094, 0.0695648193359375, 0.07276344299316406, 0.07596206665039062, 0.07916069030761719, 0.08235931396484375, 0.08555793762207031, 0.08875656127929688, 0.09195518493652344, 0.09515380859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 7.0, 4.0, 11.0, 13.0, 15.0, 26.0, 37.0, 51.0, 87.0, 130.0, 201.0, 266.0, 408.0, 728.0, 1212.0, 2478.0, 6136.0, 24253.0, 201141.0, 736550.0, 56349.0, 10658.0, 3672.0, 1686.0, 950.0, 522.0, 311.0, 218.0, 150.0, 86.0, 53.0, 50.0, 29.0, 17.0, 17.0, 10.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6083984375, -0.590087890625, -0.57177734375, -0.553466796875, -0.53515625, -0.516845703125, -0.49853515625, -0.480224609375, -0.4619140625, -0.443603515625, -0.42529296875, -0.406982421875, -0.388671875, -0.370361328125, -0.35205078125, -0.333740234375, -0.3154296875, -0.297119140625, -0.27880859375, -0.260498046875, -0.2421875, -0.223876953125, -0.20556640625, -0.187255859375, -0.1689453125, -0.150634765625, -0.13232421875, -0.114013671875, -0.095703125, -0.077392578125, -0.05908203125, -0.040771484375, -0.0224609375, -0.004150390625, 0.01416015625, 0.032470703125, 0.05078125, 0.069091796875, 0.08740234375, 0.105712890625, 0.1240234375, 0.142333984375, 0.16064453125, 0.178955078125, 0.197265625, 0.215576171875, 0.23388671875, 0.252197265625, 0.2705078125, 0.288818359375, 0.30712890625, 0.325439453125, 0.34375, 0.362060546875, 0.38037109375, 0.398681640625, 0.4169921875, 0.435302734375, 0.45361328125, 0.471923828125, 0.490234375, 0.508544921875, 0.52685546875, 0.545166015625, 0.5634765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 6.0, 5.0, 10.0, 18.0, 16.0, 19.0, 18.0, 29.0, 28.0, 37.0, 42.0, 42.0, 60.0, 50.0, 48.0, 47.0, 53.0, 43.0, 67.0, 58.0, 56.0, 38.0, 29.0, 34.0, 31.0, 20.0, 17.0, 12.0, 14.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5222854614257812, -0.5040435791015625, -0.48580169677734375, -0.467559814453125, -0.44931793212890625, -0.4310760498046875, -0.41283416748046875, -0.39459228515625, -0.37635040283203125, -0.3581085205078125, -0.33986663818359375, -0.321624755859375, -0.30338287353515625, -0.2851409912109375, -0.26689910888671875, -0.2486572265625, -0.23041534423828125, -0.2121734619140625, -0.19393157958984375, -0.175689697265625, -0.15744781494140625, -0.1392059326171875, -0.12096405029296875, -0.10272216796875, -0.08448028564453125, -0.0662384033203125, -0.04799652099609375, -0.029754638671875, -0.01151275634765625, 0.0067291259765625, 0.02497100830078125, 0.043212890625, 0.06145477294921875, 0.0796966552734375, 0.09793853759765625, 0.116180419921875, 0.13442230224609375, 0.1526641845703125, 0.17090606689453125, 0.18914794921875, 0.20738983154296875, 0.2256317138671875, 0.24387359619140625, 0.262115478515625, 0.28035736083984375, 0.2985992431640625, 0.31684112548828125, 0.3350830078125, 0.35332489013671875, 0.3715667724609375, 0.38980865478515625, 0.408050537109375, 0.42629241943359375, 0.4445343017578125, 0.46277618408203125, 0.48101806640625, 0.49925994873046875, 0.5175018310546875, 0.5357437133789062, 0.553985595703125, 0.5722274780273438, 0.5904693603515625, 0.6087112426757812, 0.626953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 6.0, 9.0, 19.0, 20.0, 30.0, 50.0, 92.0, 104.0, 235.0, 312.0, 596.0, 1101.0, 2209.0, 5225.0, 14661.0, 48318.0, 196828.0, 600233.0, 126519.0, 33682.0, 10377.0, 3972.0, 1713.0, 908.0, 466.0, 291.0, 188.0, 109.0, 69.0, 58.0, 47.0, 28.0, 28.0, 10.0, 8.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1326904296875, -0.12845802307128906, -0.12422561645507812, -0.11999320983886719, -0.11576080322265625, -0.11152839660644531, -0.10729598999023438, -0.10306358337402344, -0.0988311767578125, -0.09459877014160156, -0.09036636352539062, -0.08613395690917969, -0.08190155029296875, -0.07766914367675781, -0.07343673706054688, -0.06920433044433594, -0.064971923828125, -0.06073951721191406, -0.056507110595703125, -0.05227470397949219, -0.04804229736328125, -0.04380989074707031, -0.039577484130859375, -0.03534507751464844, -0.0311126708984375, -0.026880264282226562, -0.022647857666015625, -0.018415451049804688, -0.01418304443359375, -0.009950637817382812, -0.005718231201171875, -0.0014858245849609375, 0.00274658203125, 0.0069789886474609375, 0.011211395263671875, 0.015443801879882812, 0.01967620849609375, 0.023908615112304688, 0.028141021728515625, 0.03237342834472656, 0.0366058349609375, 0.04083824157714844, 0.045070648193359375, 0.04930305480957031, 0.05353546142578125, 0.05776786804199219, 0.062000274658203125, 0.06623268127441406, 0.070465087890625, 0.07469749450683594, 0.07892990112304688, 0.08316230773925781, 0.08739471435546875, 0.09162712097167969, 0.09585952758789062, 0.10009193420410156, 0.1043243408203125, 0.10855674743652344, 0.11278915405273438, 0.11702156066894531, 0.12125396728515625, 0.1254863739013672, 0.12971878051757812, 0.13395118713378906, 0.13818359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 8.0, 11.0, 9.0, 5.0, 14.0, 15.0, 22.0, 20.0, 27.0, 29.0, 44.0, 53.0, 60.0, 71.0, 65.0, 73.0, 63.0, 65.0, 51.0, 42.0, 41.0, 33.0, 27.0, 24.0, 15.0, 17.0, 17.0, 14.0, 11.0, 6.0, 5.0, 8.0, 4.0, 9.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.155801773071289e-05, -4.990771412849426e-05, -4.8257410526275635e-05, -4.660710692405701e-05, -4.495680332183838e-05, -4.330649971961975e-05, -4.165619611740112e-05, -4.0005892515182495e-05, -3.835558891296387e-05, -3.670528531074524e-05, -3.505498170852661e-05, -3.3404678106307983e-05, -3.1754374504089355e-05, -3.0104070901870728e-05, -2.84537672996521e-05, -2.680346369743347e-05, -2.5153160095214844e-05, -2.3502856492996216e-05, -2.1852552890777588e-05, -2.020224928855896e-05, -1.8551945686340332e-05, -1.6901642084121704e-05, -1.5251338481903076e-05, -1.3601034879684448e-05, -1.195073127746582e-05, -1.0300427675247192e-05, -8.650124073028564e-06, -6.9998204708099365e-06, -5.349516868591309e-06, -3.6992132663726807e-06, -2.0489096641540527e-06, -3.986060619354248e-07, 1.2516975402832031e-06, 2.902001142501831e-06, 4.552304744720459e-06, 6.202608346939087e-06, 7.852911949157715e-06, 9.503215551376343e-06, 1.115351915359497e-05, 1.2803822755813599e-05, 1.4454126358032227e-05, 1.6104429960250854e-05, 1.7754733562469482e-05, 1.940503716468811e-05, 2.1055340766906738e-05, 2.2705644369125366e-05, 2.4355947971343994e-05, 2.6006251573562622e-05, 2.765655517578125e-05, 2.9306858777999878e-05, 3.0957162380218506e-05, 3.2607465982437134e-05, 3.425776958465576e-05, 3.590807318687439e-05, 3.755837678909302e-05, 3.9208680391311646e-05, 4.0858983993530273e-05, 4.25092875957489e-05, 4.415959119796753e-05, 4.580989480018616e-05, 4.7460198402404785e-05, 4.911050200462341e-05, 5.076080560684204e-05, 5.241110920906067e-05, 5.40614128112793e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 13.0, 20.0, 35.0, 54.0, 74.0, 125.0, 225.0, 337.0, 621.0, 1177.0, 2425.0, 5690.0, 19470.0, 119657.0, 716388.0, 147900.0, 22736.0, 6194.0, 2570.0, 1200.0, 645.0, 367.0, 195.0, 150.0, 96.0, 41.0, 39.0, 27.0, 15.0, 15.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.175048828125, -0.16950035095214844, -0.16395187377929688, -0.1584033966064453, -0.15285491943359375, -0.1473064422607422, -0.14175796508789062, -0.13620948791503906, -0.1306610107421875, -0.12511253356933594, -0.11956405639648438, -0.11401557922363281, -0.10846710205078125, -0.10291862487792969, -0.09737014770507812, -0.09182167053222656, -0.086273193359375, -0.08072471618652344, -0.07517623901367188, -0.06962776184082031, -0.06407928466796875, -0.05853080749511719, -0.052982330322265625, -0.04743385314941406, -0.0418853759765625, -0.03633689880371094, -0.030788421630859375, -0.025239944458007812, -0.01969146728515625, -0.014142990112304688, -0.008594512939453125, -0.0030460357666015625, 0.00250244140625, 0.008050918579101562, 0.013599395751953125, 0.019147872924804688, 0.02469635009765625, 0.030244827270507812, 0.035793304443359375, 0.04134178161621094, 0.0468902587890625, 0.05243873596191406, 0.057987213134765625, 0.06353569030761719, 0.06908416748046875, 0.07463264465332031, 0.08018112182617188, 0.08572959899902344, 0.091278076171875, 0.09682655334472656, 0.10237503051757812, 0.10792350769042969, 0.11347198486328125, 0.11902046203613281, 0.12456893920898438, 0.13011741638183594, 0.1356658935546875, 0.14121437072753906, 0.14676284790039062, 0.1523113250732422, 0.15785980224609375, 0.1634082794189453, 0.16895675659179688, 0.17450523376464844, 0.1800537109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 14.0, 13.0, 20.0, 20.0, 37.0, 41.0, 37.0, 37.0, 41.0, 66.0, 58.0, 64.0, 48.0, 56.0, 58.0, 73.0, 41.0, 42.0, 37.0, 26.0, 23.0, 26.0, 14.0, 19.0, 9.0, 8.0, 13.0, 10.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10552978515625, -0.1015329360961914, -0.09753608703613281, -0.09353923797607422, -0.08954238891601562, -0.08554553985595703, -0.08154869079589844, -0.07755184173583984, -0.07355499267578125, -0.06955814361572266, -0.06556129455566406, -0.06156444549560547, -0.057567596435546875, -0.05357074737548828, -0.04957389831542969, -0.045577049255371094, -0.0415802001953125, -0.037583351135253906, -0.03358650207519531, -0.02958965301513672, -0.025592803955078125, -0.02159595489501953, -0.017599105834960938, -0.013602256774902344, -0.00960540771484375, -0.005608558654785156, -0.0016117095947265625, 0.0023851394653320312, 0.006381988525390625, 0.010378837585449219, 0.014375686645507812, 0.018372535705566406, 0.022369384765625, 0.026366233825683594, 0.030363082885742188, 0.03435993194580078, 0.038356781005859375, 0.04235363006591797, 0.04635047912597656, 0.050347328186035156, 0.05434417724609375, 0.058341026306152344, 0.06233787536621094, 0.06633472442626953, 0.07033157348632812, 0.07432842254638672, 0.07832527160644531, 0.0823221206665039, 0.0863189697265625, 0.0903158187866211, 0.09431266784667969, 0.09830951690673828, 0.10230636596679688, 0.10630321502685547, 0.11030006408691406, 0.11429691314697266, 0.11829376220703125, 0.12229061126708984, 0.12628746032714844, 0.13028430938720703, 0.13428115844726562, 0.13827800750732422, 0.1422748565673828, 0.1462717056274414, 0.1502685546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 14.0, 35.0, 129.0, 331.0, 286.0, 131.0, 45.0, 14.0, 5.0, 5.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.505383491516113, -8.30266284942627, -8.099943161010742, -7.897222995758057, -7.694502830505371, -7.4917826652526855, -7.2890625, -7.086341857910156, -6.883622169494629, -6.680902004241943, -6.478181838989258, -6.275461673736572, -6.072741508483887, -5.870021343231201, -5.667301177978516, -5.464580535888672, -5.261860370635986, -5.059140205383301, -4.856420040130615, -4.65369987487793, -4.450979709625244, -4.248259544372559, -4.045538902282715, -3.8428189754486084, -3.640098810195923, -3.4373786449432373, -3.2346584796905518, -3.031938076019287, -2.8292179107666016, -2.626497745513916, -2.4237775802612305, -2.221057415008545, -2.0183377265930176, -1.815617561340332, -1.6128973960876465, -1.4101771116256714, -1.2074569463729858, -1.0047367811203003, -0.8020164966583252, -0.5992963314056396, -0.3965761661529541, -0.19385597109794617, 0.008864223957061768, 0.2115844488143921, 0.41430461406707764, 0.6170247793197632, 0.8197450637817383, 1.0224652290344238, 1.2251853942871094, 1.427905559539795, 1.6306257247924805, 1.8333460092544556, 2.0360660552978516, 2.238786220550537, 2.4415066242218018, 2.6442267894744873, 2.846946954727173, 3.0496671199798584, 3.252387285232544, 3.4551076889038086, 3.657827854156494, 3.8605480194091797, 4.063268184661865, 4.265988349914551, 4.468708515167236]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 5.0, 11.0, 11.0, 14.0, 15.0, 13.0, 21.0, 15.0, 22.0, 25.0, 26.0, 38.0, 46.0, 41.0, 45.0, 54.0, 61.0, 83.0, 76.0, 52.0, 40.0, 46.0, 33.0, 41.0, 31.0, 29.0, 20.0, 18.0, 17.0, 8.0, 15.0, 9.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3481132984161377, -2.279743194580078, -2.2113728523254395, -2.143002510070801, -2.074632406234741, -2.0062623023986816, -1.937891960144043, -1.8695217370986938, -1.8011515140533447, -1.7327812910079956, -1.6644110679626465, -1.5960408449172974, -1.5276706218719482, -1.4593003988265991, -1.39093017578125, -1.3225599527359009, -1.2541897296905518, -1.1858195066452026, -1.1174492835998535, -1.0490790605545044, -0.9807088375091553, -0.9123386144638062, -0.843968391418457, -0.7755981683731079, -0.7072279453277588, -0.6388577222824097, -0.5704874992370605, -0.5021172761917114, -0.4337470531463623, -0.3653768301010132, -0.29700660705566406, -0.22863638401031494, -0.16026592254638672, -0.0918956995010376, -0.023525476455688477, 0.044844746589660645, 0.11321496963500977, 0.1815851926803589, 0.249955415725708, 0.31832563877105713, 0.38669586181640625, 0.45506608486175537, 0.5234363079071045, 0.5918065309524536, 0.6601767539978027, 0.7285469770431519, 0.796917200088501, 0.8652874231338501, 0.9336576461791992, 1.0020278692245483, 1.0703980922698975, 1.1387683153152466, 1.2071385383605957, 1.2755087614059448, 1.343878984451294, 1.412249207496643, 1.4806194305419922, 1.5489896535873413, 1.6173598766326904, 1.6857300996780396, 1.7541003227233887, 1.8224705457687378, 1.890840768814087, 1.959210991859436, 2.027581214904785]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 10.0, 20.0, 27.0, 37.0, 71.0, 98.0, 181.0, 306.0, 622.0, 1258.0, 2763.0, 6842.0, 19419.0, 68575.0, 361072.0, 2166388.0, 1313465.0, 187781.0, 42647.0, 13385.0, 4985.0, 2133.0, 993.0, 500.0, 277.0, 172.0, 82.0, 56.0, 32.0, 24.0, 16.0, 12.0, 10.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17930221557617188, -0.17366790771484375, -0.16803359985351562, -0.1623992919921875, -0.15676498413085938, -0.15113067626953125, -0.14549636840820312, -0.139862060546875, -0.13422775268554688, -0.12859344482421875, -0.12295913696289062, -0.1173248291015625, -0.11169052124023438, -0.10605621337890625, -0.10042190551757812, -0.09478759765625, -0.08915328979492188, -0.08351898193359375, -0.07788467407226562, -0.0722503662109375, -0.06661605834960938, -0.06098175048828125, -0.055347442626953125, -0.049713134765625, -0.044078826904296875, -0.03844451904296875, -0.032810211181640625, -0.0271759033203125, -0.021541595458984375, -0.01590728759765625, -0.010272979736328125, -0.004638671875, 0.000995635986328125, 0.00662994384765625, 0.012264251708984375, 0.0178985595703125, 0.023532867431640625, 0.02916717529296875, 0.034801483154296875, 0.040435791015625, 0.046070098876953125, 0.05170440673828125, 0.057338714599609375, 0.0629730224609375, 0.06860733032226562, 0.07424163818359375, 0.07987594604492188, 0.08551025390625, 0.09114456176757812, 0.09677886962890625, 0.10241317749023438, 0.1080474853515625, 0.11368179321289062, 0.11931610107421875, 0.12495040893554688, 0.130584716796875, 0.13621902465820312, 0.14185333251953125, 0.14748764038085938, 0.1531219482421875, 0.15875625610351562, 0.16439056396484375, 0.17002487182617188, 0.1756591796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 11.0, 4.0, 8.0, 12.0, 11.0, 15.0, 23.0, 27.0, 24.0, 41.0, 38.0, 34.0, 43.0, 48.0, 50.0, 51.0, 54.0, 44.0, 55.0, 57.0, 68.0, 38.0, 52.0, 34.0, 27.0, 36.0, 25.0, 9.0, 17.0, 14.0, 9.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1497802734375, -0.14585590362548828, -0.14193153381347656, -0.13800716400146484, -0.13408279418945312, -0.1301584243774414, -0.1262340545654297, -0.12230968475341797, -0.11838531494140625, -0.11446094512939453, -0.11053657531738281, -0.1066122055053711, -0.10268783569335938, -0.09876346588134766, -0.09483909606933594, -0.09091472625732422, -0.0869903564453125, -0.08306598663330078, -0.07914161682128906, -0.07521724700927734, -0.07129287719726562, -0.0673685073852539, -0.06344413757324219, -0.05951976776123047, -0.05559539794921875, -0.05167102813720703, -0.04774665832519531, -0.043822288513183594, -0.039897918701171875, -0.035973548889160156, -0.03204917907714844, -0.02812480926513672, -0.024200439453125, -0.02027606964111328, -0.016351699829101562, -0.012427330017089844, -0.008502960205078125, -0.004578590393066406, -0.0006542205810546875, 0.0032701492309570312, 0.00719451904296875, 0.011118888854980469, 0.015043258666992188, 0.018967628479003906, 0.022891998291015625, 0.026816368103027344, 0.030740737915039062, 0.03466510772705078, 0.0385894775390625, 0.04251384735107422, 0.04643821716308594, 0.050362586975097656, 0.054286956787109375, 0.058211326599121094, 0.06213569641113281, 0.06606006622314453, 0.06998443603515625, 0.07390880584716797, 0.07783317565917969, 0.0817575454711914, 0.08568191528320312, 0.08960628509521484, 0.09353065490722656, 0.09745502471923828, 0.10137939453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 15.0, 11.0, 17.0, 26.0, 25.0, 53.0, 77.0, 116.0, 148.0, 264.0, 429.0, 716.0, 1432.0, 3168.0, 7208.0, 19921.0, 67401.0, 344770.0, 2585449.0, 976330.0, 133291.0, 33479.0, 11266.0, 4320.0, 1914.0, 1029.0, 488.0, 342.0, 191.0, 115.0, 67.0, 40.0, 49.0, 21.0, 29.0, 7.0, 16.0, 7.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2403564453125, -0.2322711944580078, -0.22418594360351562, -0.21610069274902344, -0.20801544189453125, -0.19993019104003906, -0.19184494018554688, -0.1837596893310547, -0.1756744384765625, -0.1675891876220703, -0.15950393676757812, -0.15141868591308594, -0.14333343505859375, -0.13524818420410156, -0.12716293334960938, -0.11907768249511719, -0.110992431640625, -0.10290718078613281, -0.09482192993164062, -0.08673667907714844, -0.07865142822265625, -0.07056617736816406, -0.062480926513671875, -0.05439567565917969, -0.0463104248046875, -0.03822517395019531, -0.030139923095703125, -0.022054672241210938, -0.01396942138671875, -0.0058841705322265625, 0.002201080322265625, 0.010286331176757812, 0.01837158203125, 0.026456832885742188, 0.034542083740234375, 0.04262733459472656, 0.05071258544921875, 0.05879783630371094, 0.06688308715820312, 0.07496833801269531, 0.0830535888671875, 0.09113883972167969, 0.09922409057617188, 0.10730934143066406, 0.11539459228515625, 0.12347984313964844, 0.13156509399414062, 0.1396503448486328, 0.147735595703125, 0.1558208465576172, 0.16390609741210938, 0.17199134826660156, 0.18007659912109375, 0.18816184997558594, 0.19624710083007812, 0.2043323516845703, 0.2124176025390625, 0.2205028533935547, 0.22858810424804688, 0.23667335510253906, 0.24475860595703125, 0.25284385681152344, 0.2609291076660156, 0.2690143585205078, 0.277099609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 7.0, 5.0, 9.0, 3.0, 15.0, 20.0, 19.0, 31.0, 43.0, 58.0, 73.0, 116.0, 166.0, 250.0, 340.0, 517.0, 584.0, 549.0, 382.0, 273.0, 177.0, 119.0, 84.0, 50.0, 50.0, 29.0, 24.0, 23.0, 10.0, 10.0, 7.0, 3.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36279296875, -0.3525733947753906, -0.34235382080078125, -0.3321342468261719, -0.3219146728515625, -0.3116950988769531, -0.30147552490234375, -0.2912559509277344, -0.281036376953125, -0.2708168029785156, -0.26059722900390625, -0.2503776550292969, -0.2401580810546875, -0.22993850708007812, -0.21971893310546875, -0.20949935913085938, -0.19927978515625, -0.18906021118164062, -0.17884063720703125, -0.16862106323242188, -0.1584014892578125, -0.14818191528320312, -0.13796234130859375, -0.12774276733398438, -0.117523193359375, -0.10730361938476562, -0.09708404541015625, -0.08686447143554688, -0.0766448974609375, -0.06642532348632812, -0.05620574951171875, -0.045986175537109375, -0.0357666015625, -0.025547027587890625, -0.01532745361328125, -0.005107879638671875, 0.0051116943359375, 0.015331268310546875, 0.02555084228515625, 0.035770416259765625, 0.045989990234375, 0.056209564208984375, 0.06642913818359375, 0.07664871215820312, 0.0868682861328125, 0.09708786010742188, 0.10730743408203125, 0.11752700805664062, 0.12774658203125, 0.13796615600585938, 0.14818572998046875, 0.15840530395507812, 0.1686248779296875, 0.17884445190429688, 0.18906402587890625, 0.19928359985351562, 0.209503173828125, 0.21972274780273438, 0.22994232177734375, 0.24016189575195312, 0.2503814697265625, 0.2606010437011719, 0.27082061767578125, 0.2810401916503906, 0.291259765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 13.0, 20.0, 86.0, 276.0, 320.0, 188.0, 57.0, 13.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.473925590515137, -9.255084037780762, -9.036242485046387, -8.817400932312012, -8.598559379577637, -8.379717826843262, -8.16087532043457, -7.9420342445373535, -7.7231926918029785, -7.5043511390686035, -7.2855095863342285, -7.066667556762695, -6.84782600402832, -6.628984451293945, -6.41014289855957, -6.191301345825195, -5.97245979309082, -5.753618240356445, -5.53477668762207, -5.315935134887695, -5.097093105316162, -4.878251552581787, -4.659409999847412, -4.440568447113037, -4.221726417541504, -4.002884864807129, -3.784043073654175, -3.5652015209198, -3.346359968185425, -3.1275181770324707, -2.9086766242980957, -2.6898350715637207, -2.4709935188293457, -2.2521519660949707, -2.0333101749420166, -1.8144686222076416, -1.5956270694732666, -1.376785397529602, -1.1579437255859375, -0.9391021728515625, -0.720260500907898, -0.5014188885688782, -0.282577246427536, -0.06373560428619385, 0.15510600805282593, 0.3739476203918457, 0.5927892923355103, 0.8116308450698853, 1.0304725170135498, 1.2493141889572144, 1.4681557416915894, 1.686997413635254, 1.905838966369629, 2.124680519104004, 2.343522310256958, 2.562363862991333, 2.781205654144287, 3.000047206878662, 3.218888998031616, 3.437730550765991, 3.656572103500366, 3.8754138946533203, 4.094255447387695, 4.31309700012207, 4.531938552856445]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 7.0, 9.0, 2.0, 11.0, 8.0, 19.0, 18.0, 23.0, 25.0, 28.0, 25.0, 40.0, 43.0, 38.0, 45.0, 39.0, 40.0, 43.0, 54.0, 54.0, 49.0, 51.0, 41.0, 44.0, 33.0, 33.0, 30.0, 23.0, 30.0, 21.0, 16.0, 11.0, 15.0, 7.0, 9.0, 7.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7584247589111328, -1.7045485973358154, -1.6506723165512085, -1.5967961549758911, -1.5429198741912842, -1.4890437126159668, -1.4351675510406494, -1.3812912702560425, -1.3274149894714355, -1.2735388278961182, -1.2196625471115112, -1.1657863855361938, -1.111910104751587, -1.0580339431762695, -1.0041577816009521, -0.9502815008163452, -0.8964053392410278, -0.8425291180610657, -0.7886528968811035, -0.7347767353057861, -0.6809004545211792, -0.6270242929458618, -0.5731480717658997, -0.5192718505859375, -0.46539562940597534, -0.4115194082260132, -0.357643187046051, -0.30376699566841125, -0.2498907744884491, -0.19601455330848694, -0.14213836193084717, -0.08826214075088501, -0.03438591957092285, 0.01949029415845871, 0.07336650788784027, 0.12724271416664124, 0.1811189353466034, 0.23499515652656555, 0.2888713479042053, 0.3427475690841675, 0.39662379026412964, 0.4505000114440918, 0.504376232624054, 0.5582524538040161, 0.6121286153793335, 0.6660048961639404, 0.7198810577392578, 0.77375727891922, 0.8276335000991821, 0.8815097212791443, 0.9353859424591064, 0.9892621040344238, 1.0431383848190308, 1.0970145463943481, 1.150890827178955, 1.2047669887542725, 1.2586431503295898, 1.3125193119049072, 1.3663955926895142, 1.4202717542648315, 1.4741480350494385, 1.5280241966247559, 1.5819003582000732, 1.6357766389846802, 1.689652919769287]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 13.0, 16.0, 17.0, 25.0, 52.0, 70.0, 98.0, 178.0, 278.0, 446.0, 714.0, 1167.0, 2028.0, 3697.0, 6842.0, 13964.0, 31560.0, 87727.0, 328798.0, 392624.0, 108090.0, 36748.0, 15802.0, 7745.0, 4171.0, 2322.0, 1267.0, 773.0, 496.0, 308.0, 180.0, 136.0, 72.0, 46.0, 32.0, 13.0, 16.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2666015625, -0.259002685546875, -0.25140380859375, -0.243804931640625, -0.2362060546875, -0.228607177734375, -0.22100830078125, -0.213409423828125, -0.205810546875, -0.198211669921875, -0.19061279296875, -0.183013916015625, -0.1754150390625, -0.167816162109375, -0.16021728515625, -0.152618408203125, -0.14501953125, -0.137420654296875, -0.12982177734375, -0.122222900390625, -0.1146240234375, -0.107025146484375, -0.09942626953125, -0.091827392578125, -0.084228515625, -0.076629638671875, -0.06903076171875, -0.061431884765625, -0.0538330078125, -0.046234130859375, -0.03863525390625, -0.031036376953125, -0.0234375, -0.015838623046875, -0.00823974609375, -0.000640869140625, 0.0069580078125, 0.014556884765625, 0.02215576171875, 0.029754638671875, 0.037353515625, 0.044952392578125, 0.05255126953125, 0.060150146484375, 0.0677490234375, 0.075347900390625, 0.08294677734375, 0.090545654296875, 0.09814453125, 0.105743408203125, 0.11334228515625, 0.120941162109375, 0.1285400390625, 0.136138916015625, 0.14373779296875, 0.151336669921875, 0.158935546875, 0.166534423828125, 0.17413330078125, 0.181732177734375, 0.1893310546875, 0.196929931640625, 0.20452880859375, 0.212127685546875, 0.2197265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 13.0, 12.0, 7.0, 12.0, 13.0, 18.0, 18.0, 20.0, 36.0, 31.0, 37.0, 28.0, 36.0, 52.0, 54.0, 46.0, 46.0, 41.0, 41.0, 47.0, 45.0, 44.0, 36.0, 30.0, 40.0, 30.0, 31.0, 30.0, 24.0, 20.0, 15.0, 6.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.131591796875, -0.12789249420166016, -0.12419319152832031, -0.12049388885498047, -0.11679458618164062, -0.11309528350830078, -0.10939598083496094, -0.1056966781616211, -0.10199737548828125, -0.0982980728149414, -0.09459877014160156, -0.09089946746826172, -0.08720016479492188, -0.08350086212158203, -0.07980155944824219, -0.07610225677490234, -0.0724029541015625, -0.06870365142822266, -0.06500434875488281, -0.06130504608154297, -0.057605743408203125, -0.05390644073486328, -0.05020713806152344, -0.046507835388183594, -0.04280853271484375, -0.039109230041503906, -0.03540992736816406, -0.03171062469482422, -0.028011322021484375, -0.02431201934814453, -0.020612716674804688, -0.016913414001464844, -0.013214111328125, -0.009514808654785156, -0.0058155059814453125, -0.0021162033081054688, 0.001583099365234375, 0.005282402038574219, 0.008981704711914062, 0.012681007385253906, 0.01638031005859375, 0.020079612731933594, 0.023778915405273438, 0.02747821807861328, 0.031177520751953125, 0.03487682342529297, 0.03857612609863281, 0.042275428771972656, 0.0459747314453125, 0.049674034118652344, 0.05337333679199219, 0.05707263946533203, 0.060771942138671875, 0.06447124481201172, 0.06817054748535156, 0.0718698501586914, 0.07556915283203125, 0.0792684555053711, 0.08296775817871094, 0.08666706085205078, 0.09036636352539062, 0.09406566619873047, 0.09776496887207031, 0.10146427154541016, 0.10516357421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 4.0, 10.0, 9.0, 14.0, 25.0, 36.0, 48.0, 63.0, 87.0, 112.0, 172.0, 308.0, 535.0, 853.0, 1669.0, 4409.0, 14917.0, 88223.0, 808526.0, 103413.0, 16345.0, 4643.0, 1767.0, 860.0, 509.0, 307.0, 221.0, 143.0, 85.0, 64.0, 44.0, 36.0, 37.0, 22.0, 12.0, 5.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55517578125, -0.5386199951171875, -0.522064208984375, -0.5055084228515625, -0.48895263671875, -0.4723968505859375, -0.455841064453125, -0.4392852783203125, -0.4227294921875, -0.4061737060546875, -0.389617919921875, -0.3730621337890625, -0.35650634765625, -0.3399505615234375, -0.323394775390625, -0.3068389892578125, -0.290283203125, -0.2737274169921875, -0.257171630859375, -0.2406158447265625, -0.22406005859375, -0.2075042724609375, -0.190948486328125, -0.1743927001953125, -0.1578369140625, -0.1412811279296875, -0.124725341796875, -0.1081695556640625, -0.09161376953125, -0.0750579833984375, -0.058502197265625, -0.0419464111328125, -0.025390625, -0.0088348388671875, 0.007720947265625, 0.0242767333984375, 0.04083251953125, 0.0573883056640625, 0.073944091796875, 0.0904998779296875, 0.1070556640625, 0.1236114501953125, 0.140167236328125, 0.1567230224609375, 0.17327880859375, 0.1898345947265625, 0.206390380859375, 0.2229461669921875, 0.239501953125, 0.2560577392578125, 0.272613525390625, 0.2891693115234375, 0.30572509765625, 0.3222808837890625, 0.338836669921875, 0.3553924560546875, 0.3719482421875, 0.3885040283203125, 0.405059814453125, 0.4216156005859375, 0.43817138671875, 0.4547271728515625, 0.471282958984375, 0.4878387451171875, 0.50439453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 7.0, 11.0, 7.0, 14.0, 14.0, 16.0, 15.0, 26.0, 22.0, 26.0, 38.0, 38.0, 42.0, 42.0, 45.0, 55.0, 42.0, 45.0, 49.0, 43.0, 38.0, 49.0, 44.0, 34.0, 29.0, 25.0, 29.0, 24.0, 23.0, 18.0, 7.0, 15.0, 3.0, 12.0, 7.0, 4.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.50537109375, -0.4907646179199219, -0.47615814208984375, -0.4615516662597656, -0.4469451904296875, -0.4323387145996094, -0.41773223876953125, -0.4031257629394531, -0.388519287109375, -0.3739128112792969, -0.35930633544921875, -0.3446998596191406, -0.3300933837890625, -0.3154869079589844, -0.30088043212890625, -0.2862739562988281, -0.27166748046875, -0.2570610046386719, -0.24245452880859375, -0.22784805297851562, -0.2132415771484375, -0.19863510131835938, -0.18402862548828125, -0.16942214965820312, -0.154815673828125, -0.14020919799804688, -0.12560272216796875, -0.11099624633789062, -0.0963897705078125, -0.08178329467773438, -0.06717681884765625, -0.052570343017578125, -0.0379638671875, -0.023357391357421875, -0.00875091552734375, 0.005855560302734375, 0.0204620361328125, 0.035068511962890625, 0.04967498779296875, 0.06428146362304688, 0.078887939453125, 0.09349441528320312, 0.10810089111328125, 0.12270736694335938, 0.1373138427734375, 0.15192031860351562, 0.16652679443359375, 0.18113327026367188, 0.19573974609375, 0.21034622192382812, 0.22495269775390625, 0.23955917358398438, 0.2541656494140625, 0.2687721252441406, 0.28337860107421875, 0.2979850769042969, 0.312591552734375, 0.3271980285644531, 0.34180450439453125, 0.3564109802246094, 0.3710174560546875, 0.3856239318847656, 0.40023040771484375, 0.4148368835449219, 0.429443359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 2.0, 3.0, 2.0, 10.0, 7.0, 6.0, 17.0, 22.0, 34.0, 62.0, 87.0, 138.0, 248.0, 391.0, 680.0, 1188.0, 2440.0, 5728.0, 15442.0, 56370.0, 288585.0, 562250.0, 80696.0, 20724.0, 7268.0, 2925.0, 1356.0, 750.0, 409.0, 239.0, 161.0, 104.0, 46.0, 31.0, 33.0, 31.0, 16.0, 15.0, 5.0, 6.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1475830078125, -0.1429882049560547, -0.13839340209960938, -0.13379859924316406, -0.12920379638671875, -0.12460899353027344, -0.12001419067382812, -0.11541938781738281, -0.1108245849609375, -0.10622978210449219, -0.10163497924804688, -0.09704017639160156, -0.09244537353515625, -0.08785057067871094, -0.08325576782226562, -0.07866096496582031, -0.074066162109375, -0.06947135925292969, -0.06487655639648438, -0.06028175354003906, -0.05568695068359375, -0.05109214782714844, -0.046497344970703125, -0.04190254211425781, -0.0373077392578125, -0.03271293640136719, -0.028118133544921875, -0.023523330688476562, -0.01892852783203125, -0.014333724975585938, -0.009738922119140625, -0.0051441192626953125, -0.00054931640625, 0.0040454864501953125, 0.008640289306640625, 0.013235092163085938, 0.01782989501953125, 0.022424697875976562, 0.027019500732421875, 0.03161430358886719, 0.0362091064453125, 0.04080390930175781, 0.045398712158203125, 0.04999351501464844, 0.05458831787109375, 0.05918312072753906, 0.06377792358398438, 0.06837272644042969, 0.072967529296875, 0.07756233215332031, 0.08215713500976562, 0.08675193786621094, 0.09134674072265625, 0.09594154357910156, 0.10053634643554688, 0.10513114929199219, 0.1097259521484375, 0.11432075500488281, 0.11891555786132812, 0.12351036071777344, 0.12810516357421875, 0.13269996643066406, 0.13729476928710938, 0.1418895721435547, 0.146484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 6.0, 12.0, 11.0, 16.0, 26.0, 26.0, 26.0, 34.0, 32.0, 64.0, 57.0, 105.0, 84.0, 90.0, 76.0, 72.0, 52.0, 34.0, 38.0, 25.0, 23.0, 15.0, 16.0, 13.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.358457565307617e-05, -5.1723793148994446e-05, -4.986301064491272e-05, -4.8002228140830994e-05, -4.614144563674927e-05, -4.428066313266754e-05, -4.2419880628585815e-05, -4.055909812450409e-05, -3.869831562042236e-05, -3.683753311634064e-05, -3.497675061225891e-05, -3.3115968108177185e-05, -3.125518560409546e-05, -2.9394403100013733e-05, -2.7533620595932007e-05, -2.567283809185028e-05, -2.3812055587768555e-05, -2.195127308368683e-05, -2.0090490579605103e-05, -1.8229708075523376e-05, -1.636892557144165e-05, -1.4508143067359924e-05, -1.2647360563278198e-05, -1.0786578059196472e-05, -8.925795555114746e-06, -7.06501305103302e-06, -5.204230546951294e-06, -3.343448042869568e-06, -1.4826655387878418e-06, 3.781169652938843e-07, 2.2388994693756104e-06, 4.0996819734573364e-06, 5.9604644775390625e-06, 7.821246981620789e-06, 9.682029485702515e-06, 1.154281198978424e-05, 1.3403594493865967e-05, 1.5264376997947693e-05, 1.712515950202942e-05, 1.8985942006111145e-05, 2.084672451019287e-05, 2.2707507014274597e-05, 2.4568289518356323e-05, 2.642907202243805e-05, 2.8289854526519775e-05, 3.01506370306015e-05, 3.201141953468323e-05, 3.3872202038764954e-05, 3.573298454284668e-05, 3.7593767046928406e-05, 3.945454955101013e-05, 4.131533205509186e-05, 4.3176114559173584e-05, 4.503689706325531e-05, 4.6897679567337036e-05, 4.875846207141876e-05, 5.061924457550049e-05, 5.2480027079582214e-05, 5.434080958366394e-05, 5.6201592087745667e-05, 5.806237459182739e-05, 5.992315709590912e-05, 6.178393959999084e-05, 6.364472210407257e-05, 6.55055046081543e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 16.0, 17.0, 22.0, 42.0, 41.0, 61.0, 60.0, 84.0, 133.0, 187.0, 313.0, 467.0, 786.0, 1330.0, 2435.0, 5431.0, 14079.0, 48888.0, 226883.0, 598864.0, 105635.0, 25937.0, 8553.0, 3586.0, 1808.0, 1012.0, 608.0, 375.0, 269.0, 168.0, 111.0, 87.0, 73.0, 43.0, 35.0, 20.0, 15.0, 14.0, 9.0, 13.0, 4.0, 5.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12408256530761719, -0.12011337280273438, -0.11614418029785156, -0.11217498779296875, -0.10820579528808594, -0.10423660278320312, -0.10026741027832031, -0.0962982177734375, -0.09232902526855469, -0.08835983276367188, -0.08439064025878906, -0.08042144775390625, -0.07645225524902344, -0.07248306274414062, -0.06851387023925781, -0.064544677734375, -0.06057548522949219, -0.056606292724609375, -0.05263710021972656, -0.04866790771484375, -0.04469871520996094, -0.040729522705078125, -0.03676033020019531, -0.0327911376953125, -0.028821945190429688, -0.024852752685546875, -0.020883560180664062, -0.01691436767578125, -0.012945175170898438, -0.008975982666015625, -0.0050067901611328125, -0.00103759765625, 0.0029315948486328125, 0.006900787353515625, 0.010869979858398438, 0.01483917236328125, 0.018808364868164062, 0.022777557373046875, 0.026746749877929688, 0.0307159423828125, 0.03468513488769531, 0.038654327392578125, 0.04262351989746094, 0.04659271240234375, 0.05056190490722656, 0.054531097412109375, 0.05850028991699219, 0.062469482421875, 0.06643867492675781, 0.07040786743164062, 0.07437705993652344, 0.07834625244140625, 0.08231544494628906, 0.08628463745117188, 0.09025382995605469, 0.0942230224609375, 0.09819221496582031, 0.10216140747070312, 0.10613059997558594, 0.11009979248046875, 0.11406898498535156, 0.11803817749023438, 0.12200736999511719, 0.1259765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 8.0, 4.0, 9.0, 6.0, 13.0, 22.0, 25.0, 15.0, 31.0, 45.0, 59.0, 46.0, 62.0, 69.0, 67.0, 71.0, 72.0, 65.0, 51.0, 47.0, 47.0, 30.0, 25.0, 28.0, 20.0, 11.0, 7.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.1200723648071289, -0.11642646789550781, -0.11278057098388672, -0.10913467407226562, -0.10548877716064453, -0.10184288024902344, -0.09819698333740234, -0.09455108642578125, -0.09090518951416016, -0.08725929260253906, -0.08361339569091797, -0.07996749877929688, -0.07632160186767578, -0.07267570495605469, -0.0690298080444336, -0.0653839111328125, -0.061738014221191406, -0.05809211730957031, -0.05444622039794922, -0.050800323486328125, -0.04715442657470703, -0.04350852966308594, -0.039862632751464844, -0.03621673583984375, -0.032570838928222656, -0.028924942016601562, -0.02527904510498047, -0.021633148193359375, -0.01798725128173828, -0.014341354370117188, -0.010695457458496094, -0.007049560546875, -0.0034036636352539062, 0.0002422332763671875, 0.0038881301879882812, 0.007534027099609375, 0.011179924011230469, 0.014825820922851562, 0.018471717834472656, 0.02211761474609375, 0.025763511657714844, 0.029409408569335938, 0.03305530548095703, 0.036701202392578125, 0.04034709930419922, 0.04399299621582031, 0.047638893127441406, 0.0512847900390625, 0.054930686950683594, 0.05857658386230469, 0.06222248077392578, 0.06586837768554688, 0.06951427459716797, 0.07316017150878906, 0.07680606842041016, 0.08045196533203125, 0.08409786224365234, 0.08774375915527344, 0.09138965606689453, 0.09503555297851562, 0.09868144989013672, 0.10232734680175781, 0.1059732437133789, 0.109619140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 18.0, 41.0, 104.0, 269.0, 332.0, 134.0, 42.0, 20.0, 9.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.369033813476562, -8.191421508789062, -8.013809204101562, -7.836196422576904, -7.658584117889404, -7.480971813201904, -7.303359031677246, -7.125746726989746, -6.948134422302246, -6.770522117614746, -6.592909812927246, -6.415297031402588, -6.237684726715088, -6.060072422027588, -5.88245964050293, -5.70484733581543, -5.52723503112793, -5.34962272644043, -5.17201042175293, -4.9943976402282715, -4.8167853355407715, -4.6391730308532715, -4.461560249328613, -4.283947944641113, -4.106335639953613, -3.9287233352661133, -3.751110792160034, -3.573498249053955, -3.395885944366455, -3.218273639678955, -3.040661096572876, -2.863048553466797, -2.685436725616455, -2.507824420928955, -2.330211877822876, -2.152599334716797, -1.9749870300292969, -1.7973746061325073, -1.6197621822357178, -1.4421497583389282, -1.2645373344421387, -1.0869249105453491, -0.9093124866485596, -0.73170006275177, -0.5540876388549805, -0.3764752149581909, -0.19886279106140137, -0.021250367164611816, 0.15636205673217773, 0.3339744806289673, 0.5115869045257568, 0.6891993284225464, 0.8668117523193359, 1.0444241762161255, 1.222036600112915, 1.3996490240097046, 1.5772614479064941, 1.7548738718032837, 1.9324862957000732, 2.1100988388061523, 2.2877111434936523, 2.4653234481811523, 2.6429359912872314, 2.8205485343933105, 2.9981608390808105]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 14.0, 15.0, 17.0, 18.0, 27.0, 30.0, 33.0, 33.0, 35.0, 43.0, 68.0, 84.0, 78.0, 82.0, 70.0, 52.0, 48.0, 33.0, 50.0, 30.0, 14.0, 21.0, 24.0, 21.0, 14.0, 7.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4731509685516357, -2.3982748985290527, -2.3233985900878906, -2.2485225200653076, -2.1736464500427246, -2.0987701416015625, -2.0238940715789795, -1.9490180015563965, -1.874141812324524, -1.7992656230926514, -1.7243895530700684, -1.6495133638381958, -1.5746371746063232, -1.4997611045837402, -1.4248849153518677, -1.3500087261199951, -1.275132656097412, -1.2002564668655396, -1.1253803968429565, -1.050504207611084, -0.9756280779838562, -0.9007519483566284, -0.8258757591247559, -0.7509996294975281, -0.6761234998703003, -0.6012473702430725, -0.5263712406158447, -0.45149505138397217, -0.3766189217567444, -0.3017427921295166, -0.22686663269996643, -0.15199047327041626, -0.07711410522460938, -0.002237960696220398, 0.07263818383216858, 0.14751432836055756, 0.22239047288894653, 0.2972666025161743, 0.3721427619457245, 0.44701892137527466, 0.5218950510025024, 0.5967711806297302, 0.671647310256958, 0.7465234994888306, 0.8213996291160583, 0.8962757587432861, 0.9711519479751587, 1.0460281372070312, 1.1209042072296143, 1.1957803964614868, 1.2706564664840698, 1.3455326557159424, 1.4204087257385254, 1.495284914970398, 1.5701611042022705, 1.6450371742248535, 1.719913363456726, 1.7947895526885986, 1.8696656227111816, 1.9445418119430542, 2.0194180011749268, 2.0942940711975098, 2.1691701412200928, 2.244046449661255, 2.318922519683838]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 10.0, 33.0, 31.0, 49.0, 77.0, 109.0, 191.0, 281.0, 573.0, 1061.0, 2460.0, 5292.0, 13562.0, 40813.0, 179739.0, 1252908.0, 2221355.0, 373127.0, 68679.0, 19827.0, 7492.0, 3203.0, 1526.0, 773.0, 440.0, 237.0, 137.0, 77.0, 52.0, 33.0, 28.0, 20.0, 19.0, 10.0, 8.0, 8.0, 9.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1661376953125, -0.1609783172607422, -0.15581893920898438, -0.15065956115722656, -0.14550018310546875, -0.14034080505371094, -0.13518142700195312, -0.1300220489501953, -0.1248626708984375, -0.11970329284667969, -0.11454391479492188, -0.10938453674316406, -0.10422515869140625, -0.09906578063964844, -0.09390640258789062, -0.08874702453613281, -0.083587646484375, -0.07842826843261719, -0.07326889038085938, -0.06810951232910156, -0.06295013427734375, -0.05779075622558594, -0.052631378173828125, -0.04747200012207031, -0.0423126220703125, -0.03715324401855469, -0.031993865966796875, -0.026834487915039062, -0.02167510986328125, -0.016515731811523438, -0.011356353759765625, -0.0061969757080078125, -0.00103759765625, 0.0041217803955078125, 0.009281158447265625, 0.014440536499023438, 0.01959991455078125, 0.024759292602539062, 0.029918670654296875, 0.03507804870605469, 0.0402374267578125, 0.04539680480957031, 0.050556182861328125, 0.05571556091308594, 0.06087493896484375, 0.06603431701660156, 0.07119369506835938, 0.07635307312011719, 0.081512451171875, 0.08667182922363281, 0.09183120727539062, 0.09699058532714844, 0.10214996337890625, 0.10730934143066406, 0.11246871948242188, 0.11762809753417969, 0.1227874755859375, 0.1279468536376953, 0.13310623168945312, 0.13826560974121094, 0.14342498779296875, 0.14858436584472656, 0.15374374389648438, 0.1589031219482422, 0.1640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 10.0, 14.0, 10.0, 10.0, 16.0, 12.0, 20.0, 18.0, 23.0, 27.0, 25.0, 31.0, 34.0, 34.0, 49.0, 47.0, 43.0, 41.0, 25.0, 45.0, 43.0, 35.0, 47.0, 32.0, 34.0, 43.0, 35.0, 34.0, 23.0, 27.0, 24.0, 12.0, 8.0, 8.0, 11.0, 9.0, 8.0, 7.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.091064453125, -0.0878896713256836, -0.08471488952636719, -0.08154010772705078, -0.07836532592773438, -0.07519054412841797, -0.07201576232910156, -0.06884098052978516, -0.06566619873046875, -0.062491416931152344, -0.05931663513183594, -0.05614185333251953, -0.052967071533203125, -0.04979228973388672, -0.04661750793457031, -0.043442726135253906, -0.0402679443359375, -0.037093162536621094, -0.03391838073730469, -0.03074359893798828, -0.027568817138671875, -0.02439403533935547, -0.021219253540039062, -0.018044471740722656, -0.01486968994140625, -0.011694908142089844, -0.008520126342773438, -0.005345344543457031, -0.002170562744140625, 0.0010042190551757812, 0.0041790008544921875, 0.007353782653808594, 0.010528564453125, 0.013703346252441406, 0.016878128051757812, 0.02005290985107422, 0.023227691650390625, 0.02640247344970703, 0.029577255249023438, 0.032752037048339844, 0.03592681884765625, 0.039101600646972656, 0.04227638244628906, 0.04545116424560547, 0.048625946044921875, 0.05180072784423828, 0.05497550964355469, 0.058150291442871094, 0.0613250732421875, 0.0644998550415039, 0.06767463684082031, 0.07084941864013672, 0.07402420043945312, 0.07719898223876953, 0.08037376403808594, 0.08354854583740234, 0.08672332763671875, 0.08989810943603516, 0.09307289123535156, 0.09624767303466797, 0.09942245483398438, 0.10259723663330078, 0.10577201843261719, 0.1089468002319336, 0.11212158203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 15.0, 19.0, 28.0, 59.0, 151.0, 384.0, 1319.0, 6478.0, 59933.0, 3209393.0, 882666.0, 28467.0, 3847.0, 934.0, 305.0, 130.0, 61.0, 27.0, 23.0, 14.0, 5.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.71484375, -0.6977615356445312, -0.6806793212890625, -0.6635971069335938, -0.646514892578125, -0.6294326782226562, -0.6123504638671875, -0.5952682495117188, -0.57818603515625, -0.5611038208007812, -0.5440216064453125, -0.5269393920898438, -0.509857177734375, -0.49277496337890625, -0.4756927490234375, -0.45861053466796875, -0.4415283203125, -0.42444610595703125, -0.4073638916015625, -0.39028167724609375, -0.373199462890625, -0.35611724853515625, -0.3390350341796875, -0.32195281982421875, -0.30487060546875, -0.28778839111328125, -0.2707061767578125, -0.25362396240234375, -0.236541748046875, -0.21945953369140625, -0.2023773193359375, -0.18529510498046875, -0.168212890625, -0.15113067626953125, -0.1340484619140625, -0.11696624755859375, -0.099884033203125, -0.08280181884765625, -0.0657196044921875, -0.04863739013671875, -0.03155517578125, -0.01447296142578125, 0.0026092529296875, 0.01969146728515625, 0.036773681640625, 0.05385589599609375, 0.0709381103515625, 0.08802032470703125, 0.1051025390625, 0.12218475341796875, 0.1392669677734375, 0.15634918212890625, 0.173431396484375, 0.19051361083984375, 0.2075958251953125, 0.22467803955078125, 0.24176025390625, 0.25884246826171875, 0.2759246826171875, 0.29300689697265625, 0.310089111328125, 0.32717132568359375, 0.3442535400390625, 0.36133575439453125, 0.37841796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 10.0, 15.0, 17.0, 30.0, 41.0, 95.0, 116.0, 244.0, 472.0, 851.0, 900.0, 566.0, 288.0, 163.0, 94.0, 52.0, 40.0, 19.0, 16.0, 18.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376953125, -0.36353302001953125, -0.3501129150390625, -0.33669281005859375, -0.323272705078125, -0.30985260009765625, -0.2964324951171875, -0.28301239013671875, -0.26959228515625, -0.25617218017578125, -0.2427520751953125, -0.22933197021484375, -0.215911865234375, -0.20249176025390625, -0.1890716552734375, -0.17565155029296875, -0.1622314453125, -0.14881134033203125, -0.1353912353515625, -0.12197113037109375, -0.108551025390625, -0.09513092041015625, -0.0817108154296875, -0.06829071044921875, -0.05487060546875, -0.04145050048828125, -0.0280303955078125, -0.01461029052734375, -0.001190185546875, 0.01222991943359375, 0.0256500244140625, 0.03907012939453125, 0.052490234375, 0.06591033935546875, 0.0793304443359375, 0.09275054931640625, 0.106170654296875, 0.11959075927734375, 0.1330108642578125, 0.14643096923828125, 0.15985107421875, 0.17327117919921875, 0.1866912841796875, 0.20011138916015625, 0.213531494140625, 0.22695159912109375, 0.2403717041015625, 0.25379180908203125, 0.2672119140625, 0.28063201904296875, 0.2940521240234375, 0.30747222900390625, 0.320892333984375, 0.33431243896484375, 0.3477325439453125, 0.36115264892578125, 0.37457275390625, 0.38799285888671875, 0.4014129638671875, 0.41483306884765625, 0.428253173828125, 0.44167327880859375, 0.4550933837890625, 0.46851348876953125, 0.48193359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 9.0, 4.0, 11.0, 42.0, 88.0, 240.0, 266.0, 184.0, 81.0, 36.0, 15.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.497735977172852, -5.35775089263916, -5.217765808105469, -5.0777812004089355, -4.937796115875244, -4.797811031341553, -4.657825946807861, -4.51784086227417, -4.377856254577637, -4.237871170043945, -4.097886085510254, -3.9579012393951416, -3.8179163932800293, -3.677931308746338, -3.5379462242126465, -3.397961139678955, -3.2579760551452637, -3.1179909706115723, -2.97800612449646, -2.8380210399627686, -2.6980361938476562, -2.558051109313965, -2.4180660247802734, -2.278080940246582, -2.1380960941314697, -1.9981111288070679, -1.858126163482666, -1.7181410789489746, -1.5781561136245728, -1.438171148300171, -1.2981860637664795, -1.1582010984420776, -1.0182161331176758, -0.8782311677932739, -0.7382461428642273, -0.5982611179351807, -0.4582761526107788, -0.31829118728637695, -0.17830616235733032, -0.03832113742828369, 0.10166382789611816, 0.2416488230228424, 0.38163381814956665, 0.5216188430786133, 0.6616038084030151, 0.801588773727417, 0.9415737986564636, 1.0815588235855103, 1.221543788909912, 1.361528754234314, 1.5015137195587158, 1.6414988040924072, 1.781483769416809, 1.921468734741211, 2.0614538192749023, 2.2014389038085938, 2.341423749923706, 2.4814088344573975, 2.6213936805725098, 2.761378765106201, 2.9013638496398926, 3.041348695755005, 3.1813337802886963, 3.3213186264038086, 3.4613037109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 17.0, 14.0, 23.0, 27.0, 36.0, 36.0, 41.0, 49.0, 45.0, 68.0, 62.0, 72.0, 72.0, 58.0, 50.0, 60.0, 52.0, 35.0, 38.0, 30.0, 25.0, 18.0, 13.0, 13.0, 8.0, 8.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.732755184173584, -1.6779906749725342, -1.6232261657714844, -1.5684616565704346, -1.5136971473693848, -1.458932638168335, -1.4041681289672852, -1.349403738975525, -1.294639229774475, -1.2398747205734253, -1.1851102113723755, -1.1303457021713257, -1.0755811929702759, -1.0208168029785156, -0.966052234172821, -0.911287784576416, -0.8565232157707214, -0.8017587065696716, -0.7469941973686218, -0.6922297477722168, -0.637465238571167, -0.5827007293701172, -0.5279362201690674, -0.47317174077033997, -0.41840723156929016, -0.36364272236824036, -0.30887824296951294, -0.25411373376846313, -0.19934923946857452, -0.1445847451686859, -0.08982023596763611, -0.03505575656890869, 0.019708752632141113, 0.07447324693202972, 0.12923774123191833, 0.18400225043296814, 0.23876674473285675, 0.29353123903274536, 0.34829574823379517, 0.4030602276325226, 0.4578247368335724, 0.5125892162322998, 0.5673537254333496, 0.6221182346343994, 0.6768827438354492, 0.731647253036499, 0.7864117622375488, 0.8411762118339539, 0.8959407210350037, 0.9507052302360535, 1.0054696798324585, 1.0602341890335083, 1.114998698234558, 1.169763207435608, 1.2245277166366577, 1.2792922258377075, 1.3340567350387573, 1.3888212442398071, 1.443585753440857, 1.4983502626419067, 1.5531147718429565, 1.6078791618347168, 1.6626436710357666, 1.7174081802368164, 1.7721726894378662]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 12.0, 18.0, 16.0, 27.0, 26.0, 46.0, 72.0, 87.0, 112.0, 154.0, 271.0, 404.0, 555.0, 913.0, 1471.0, 2527.0, 4439.0, 8414.0, 18729.0, 49721.0, 158918.0, 377455.0, 275115.0, 91186.0, 30715.0, 12538.0, 6007.0, 3307.0, 1863.0, 1179.0, 749.0, 494.0, 307.0, 209.0, 142.0, 99.0, 62.0, 57.0, 41.0, 31.0, 18.0, 12.0, 7.0, 7.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.165283203125, -0.16023826599121094, -0.15519332885742188, -0.1501483917236328, -0.14510345458984375, -0.1400585174560547, -0.13501358032226562, -0.12996864318847656, -0.1249237060546875, -0.11987876892089844, -0.11483383178710938, -0.10978889465332031, -0.10474395751953125, -0.09969902038574219, -0.09465408325195312, -0.08960914611816406, -0.084564208984375, -0.07951927185058594, -0.07447433471679688, -0.06942939758300781, -0.06438446044921875, -0.05933952331542969, -0.054294586181640625, -0.04924964904785156, -0.0442047119140625, -0.03915977478027344, -0.034114837646484375, -0.029069900512695312, -0.02402496337890625, -0.018980026245117188, -0.013935089111328125, -0.008890151977539062, -0.00384521484375, 0.0011997222900390625, 0.006244659423828125, 0.011289596557617188, 0.01633453369140625, 0.021379470825195312, 0.026424407958984375, 0.03146934509277344, 0.0365142822265625, 0.04155921936035156, 0.046604156494140625, 0.05164909362792969, 0.05669403076171875, 0.06173896789550781, 0.06678390502929688, 0.07182884216308594, 0.076873779296875, 0.08191871643066406, 0.08696365356445312, 0.09200859069824219, 0.09705352783203125, 0.10209846496582031, 0.10714340209960938, 0.11218833923339844, 0.1172332763671875, 0.12227821350097656, 0.12732315063476562, 0.1323680877685547, 0.13741302490234375, 0.1424579620361328, 0.14750289916992188, 0.15254783630371094, 0.1575927734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 11.0, 8.0, 12.0, 18.0, 7.0, 20.0, 23.0, 25.0, 16.0, 23.0, 31.0, 39.0, 35.0, 38.0, 37.0, 45.0, 47.0, 37.0, 42.0, 44.0, 39.0, 51.0, 39.0, 42.0, 38.0, 35.0, 27.0, 25.0, 22.0, 22.0, 16.0, 14.0, 9.0, 12.0, 11.0, 9.0, 3.0, 7.0, 9.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11248779296875, -0.10889911651611328, -0.10531044006347656, -0.10172176361083984, -0.09813308715820312, -0.0945444107055664, -0.09095573425292969, -0.08736705780029297, -0.08377838134765625, -0.08018970489501953, -0.07660102844238281, -0.0730123519897461, -0.06942367553710938, -0.06583499908447266, -0.06224632263183594, -0.05865764617919922, -0.0550689697265625, -0.05148029327392578, -0.04789161682128906, -0.044302940368652344, -0.040714263916015625, -0.037125587463378906, -0.03353691101074219, -0.02994823455810547, -0.02635955810546875, -0.02277088165283203, -0.019182205200195312, -0.015593528747558594, -0.012004852294921875, -0.008416175842285156, -0.0048274993896484375, -0.0012388229370117188, 0.002349853515625, 0.005938529968261719, 0.009527206420898438, 0.013115882873535156, 0.016704559326171875, 0.020293235778808594, 0.023881912231445312, 0.02747058868408203, 0.03105926513671875, 0.03464794158935547, 0.03823661804199219, 0.041825294494628906, 0.045413970947265625, 0.049002647399902344, 0.05259132385253906, 0.05618000030517578, 0.0597686767578125, 0.06335735321044922, 0.06694602966308594, 0.07053470611572266, 0.07412338256835938, 0.0777120590209961, 0.08130073547363281, 0.08488941192626953, 0.08847808837890625, 0.09206676483154297, 0.09565544128417969, 0.0992441177368164, 0.10283279418945312, 0.10642147064208984, 0.11001014709472656, 0.11359882354736328, 0.1171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 14.0, 23.0, 35.0, 40.0, 54.0, 106.0, 153.0, 305.0, 749.0, 1972.0, 6954.0, 46463.0, 780002.0, 190601.0, 15388.0, 3467.0, 1159.0, 476.0, 217.0, 127.0, 69.0, 54.0, 28.0, 25.0, 10.0, 10.0, 8.0, 7.0, 6.0, 2.0, 5.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3890533447265625, -0.375518798828125, -0.3619842529296875, -0.34844970703125, -0.3349151611328125, -0.321380615234375, -0.3078460693359375, -0.2943115234375, -0.2807769775390625, -0.267242431640625, -0.2537078857421875, -0.24017333984375, -0.2266387939453125, -0.213104248046875, -0.1995697021484375, -0.18603515625, -0.1725006103515625, -0.158966064453125, -0.1454315185546875, -0.13189697265625, -0.1183624267578125, -0.104827880859375, -0.0912933349609375, -0.0777587890625, -0.0642242431640625, -0.050689697265625, -0.0371551513671875, -0.02362060546875, -0.0100860595703125, 0.003448486328125, 0.0169830322265625, 0.030517578125, 0.0440521240234375, 0.057586669921875, 0.0711212158203125, 0.08465576171875, 0.0981903076171875, 0.111724853515625, 0.1252593994140625, 0.1387939453125, 0.1523284912109375, 0.165863037109375, 0.1793975830078125, 0.19293212890625, 0.2064666748046875, 0.220001220703125, 0.2335357666015625, 0.2470703125, 0.2606048583984375, 0.274139404296875, 0.2876739501953125, 0.30120849609375, 0.3147430419921875, 0.328277587890625, 0.3418121337890625, 0.3553466796875, 0.3688812255859375, 0.382415771484375, 0.3959503173828125, 0.40948486328125, 0.4230194091796875, 0.436553955078125, 0.4500885009765625, 0.463623046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 8.0, 2.0, 2.0, 10.0, 10.0, 10.0, 25.0, 16.0, 27.0, 23.0, 44.0, 31.0, 49.0, 65.0, 67.0, 64.0, 63.0, 84.0, 78.0, 57.0, 46.0, 60.0, 35.0, 24.0, 28.0, 20.0, 15.0, 14.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5228958129882812, -0.5037994384765625, -0.48470306396484375, -0.465606689453125, -0.44651031494140625, -0.4274139404296875, -0.40831756591796875, -0.38922119140625, -0.37012481689453125, -0.3510284423828125, -0.33193206787109375, -0.312835693359375, -0.29373931884765625, -0.2746429443359375, -0.25554656982421875, -0.2364501953125, -0.21735382080078125, -0.1982574462890625, -0.17916107177734375, -0.160064697265625, -0.14096832275390625, -0.1218719482421875, -0.10277557373046875, -0.08367919921875, -0.06458282470703125, -0.0454864501953125, -0.02639007568359375, -0.007293701171875, 0.01180267333984375, 0.0308990478515625, 0.04999542236328125, 0.069091796875, 0.08818817138671875, 0.1072845458984375, 0.12638092041015625, 0.145477294921875, 0.16457366943359375, 0.1836700439453125, 0.20276641845703125, 0.22186279296875, 0.24095916748046875, 0.2600555419921875, 0.27915191650390625, 0.298248291015625, 0.31734466552734375, 0.3364410400390625, 0.35553741455078125, 0.3746337890625, 0.39373016357421875, 0.4128265380859375, 0.43192291259765625, 0.451019287109375, 0.47011566162109375, 0.4892120361328125, 0.5083084106445312, 0.52740478515625, 0.5465011596679688, 0.5655975341796875, 0.5846939086914062, 0.603790283203125, 0.6228866577148438, 0.6419830322265625, 0.6610794067382812, 0.68017578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 3.0, 3.0, 4.0, 9.0, 14.0, 20.0, 35.0, 42.0, 91.0, 171.0, 379.0, 755.0, 1933.0, 5547.0, 19890.0, 104822.0, 698566.0, 174689.0, 29481.0, 7749.0, 2449.0, 941.0, 443.0, 204.0, 123.0, 71.0, 40.0, 31.0, 11.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1837158203125, -0.17908000946044922, -0.17444419860839844, -0.16980838775634766, -0.16517257690429688, -0.1605367660522461, -0.1559009552001953, -0.15126514434814453, -0.14662933349609375, -0.14199352264404297, -0.1373577117919922, -0.1327219009399414, -0.12808609008789062, -0.12345027923583984, -0.11881446838378906, -0.11417865753173828, -0.1095428466796875, -0.10490703582763672, -0.10027122497558594, -0.09563541412353516, -0.09099960327148438, -0.0863637924194336, -0.08172798156738281, -0.07709217071533203, -0.07245635986328125, -0.06782054901123047, -0.06318473815917969, -0.058548927307128906, -0.053913116455078125, -0.049277305603027344, -0.04464149475097656, -0.04000568389892578, -0.035369873046875, -0.03073406219482422, -0.026098251342773438, -0.021462440490722656, -0.016826629638671875, -0.012190818786621094, -0.0075550079345703125, -0.0029191970825195312, 0.00171661376953125, 0.006352424621582031, 0.010988235473632812, 0.015624046325683594, 0.020259857177734375, 0.024895668029785156, 0.029531478881835938, 0.03416728973388672, 0.0388031005859375, 0.04343891143798828, 0.04807472229003906, 0.052710533142089844, 0.057346343994140625, 0.061982154846191406, 0.06661796569824219, 0.07125377655029297, 0.07588958740234375, 0.08052539825439453, 0.08516120910644531, 0.0897970199584961, 0.09443283081054688, 0.09906864166259766, 0.10370445251464844, 0.10834026336669922, 0.11297607421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 7.0, 7.0, 5.0, 7.0, 9.0, 10.0, 15.0, 16.0, 25.0, 32.0, 43.0, 45.0, 56.0, 62.0, 70.0, 83.0, 66.0, 69.0, 68.0, 68.0, 56.0, 35.0, 27.0, 23.0, 25.0, 14.0, 8.0, 6.0, 6.0, 7.0, 2.0, 2.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.4868717193603516e-05, -3.3629126846790314e-05, -3.238953649997711e-05, -3.114994615316391e-05, -2.9910355806350708e-05, -2.8670765459537506e-05, -2.7431175112724304e-05, -2.6191584765911102e-05, -2.49519944190979e-05, -2.37124040722847e-05, -2.2472813725471497e-05, -2.1233223378658295e-05, -1.9993633031845093e-05, -1.875404268503189e-05, -1.751445233821869e-05, -1.6274861991405487e-05, -1.5035271644592285e-05, -1.3795681297779083e-05, -1.2556090950965881e-05, -1.131650060415268e-05, -1.0076910257339478e-05, -8.837319910526276e-06, -7.597729563713074e-06, -6.358139216899872e-06, -5.11854887008667e-06, -3.878958523273468e-06, -2.639368176460266e-06, -1.3997778296470642e-06, -1.601874828338623e-07, 1.0794028639793396e-06, 2.3189932107925415e-06, 3.5585835576057434e-06, 4.798173904418945e-06, 6.037764251232147e-06, 7.277354598045349e-06, 8.516944944858551e-06, 9.756535291671753e-06, 1.0996125638484955e-05, 1.2235715985298157e-05, 1.3475306332111359e-05, 1.471489667892456e-05, 1.5954487025737762e-05, 1.7194077372550964e-05, 1.8433667719364166e-05, 1.9673258066177368e-05, 2.091284841299057e-05, 2.2152438759803772e-05, 2.3392029106616974e-05, 2.4631619453430176e-05, 2.5871209800243378e-05, 2.711080014705658e-05, 2.835039049386978e-05, 2.9589980840682983e-05, 3.0829571187496185e-05, 3.206916153430939e-05, 3.330875188112259e-05, 3.454834222793579e-05, 3.578793257474899e-05, 3.7027522921562195e-05, 3.82671132683754e-05, 3.95067036151886e-05, 4.07462939620018e-05, 4.1985884308815e-05, 4.3225474655628204e-05, 4.4465065002441406e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 4.0, 16.0, 16.0, 15.0, 33.0, 51.0, 62.0, 153.0, 274.0, 585.0, 1293.0, 3791.0, 14833.0, 92487.0, 725559.0, 176661.0, 24051.0, 5397.0, 1751.0, 744.0, 315.0, 183.0, 102.0, 64.0, 36.0, 27.0, 14.0, 13.0, 7.0, 4.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13134765625, -0.12601852416992188, -0.12068939208984375, -0.11536026000976562, -0.1100311279296875, -0.10470199584960938, -0.09937286376953125, -0.09404373168945312, -0.088714599609375, -0.08338546752929688, -0.07805633544921875, -0.07272720336914062, -0.0673980712890625, -0.062068939208984375, -0.05673980712890625, -0.051410675048828125, -0.04608154296875, -0.040752410888671875, -0.03542327880859375, -0.030094146728515625, -0.0247650146484375, -0.019435882568359375, -0.01410675048828125, -0.008777618408203125, -0.003448486328125, 0.001880645751953125, 0.00720977783203125, 0.012538909912109375, 0.0178680419921875, 0.023197174072265625, 0.02852630615234375, 0.033855438232421875, 0.0391845703125, 0.044513702392578125, 0.04984283447265625, 0.055171966552734375, 0.0605010986328125, 0.06583023071289062, 0.07115936279296875, 0.07648849487304688, 0.081817626953125, 0.08714675903320312, 0.09247589111328125, 0.09780502319335938, 0.1031341552734375, 0.10846328735351562, 0.11379241943359375, 0.11912155151367188, 0.12445068359375, 0.12977981567382812, 0.13510894775390625, 0.14043807983398438, 0.1457672119140625, 0.15109634399414062, 0.15642547607421875, 0.16175460815429688, 0.167083740234375, 0.17241287231445312, 0.17774200439453125, 0.18307113647460938, 0.1884002685546875, 0.19372940063476562, 0.19905853271484375, 0.20438766479492188, 0.209716796875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 9.0, 3.0, 19.0, 13.0, 13.0, 35.0, 46.0, 48.0, 71.0, 81.0, 88.0, 95.0, 91.0, 112.0, 70.0, 48.0, 39.0, 34.0, 21.0, 24.0, 10.0, 6.0, 4.0, 5.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.123291015625, -0.11867713928222656, -0.11406326293945312, -0.10944938659667969, -0.10483551025390625, -0.10022163391113281, -0.09560775756835938, -0.09099388122558594, -0.0863800048828125, -0.08176612854003906, -0.07715225219726562, -0.07253837585449219, -0.06792449951171875, -0.06331062316894531, -0.058696746826171875, -0.05408287048339844, -0.049468994140625, -0.04485511779785156, -0.040241241455078125, -0.03562736511230469, -0.03101348876953125, -0.026399612426757812, -0.021785736083984375, -0.017171859741210938, -0.0125579833984375, -0.007944107055664062, -0.003330230712890625, 0.0012836456298828125, 0.00589752197265625, 0.010511398315429688, 0.015125274658203125, 0.019739151000976562, 0.02435302734375, 0.028966903686523438, 0.033580780029296875, 0.03819465637207031, 0.04280853271484375, 0.04742240905761719, 0.052036285400390625, 0.05665016174316406, 0.0612640380859375, 0.06587791442871094, 0.07049179077148438, 0.07510566711425781, 0.07971954345703125, 0.08433341979980469, 0.08894729614257812, 0.09356117248535156, 0.098175048828125, 0.10278892517089844, 0.10740280151367188, 0.11201667785644531, 0.11663055419921875, 0.12124443054199219, 0.12585830688476562, 0.13047218322753906, 0.1350860595703125, 0.13969993591308594, 0.14431381225585938, 0.1489276885986328, 0.15354156494140625, 0.1581554412841797, 0.16276931762695312, 0.16738319396972656, 0.1719970703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 8.0, 24.0, 55.0, 93.0, 169.0, 288.0, 137.0, 90.0, 50.0, 26.0, 16.0, 7.0, 12.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021078586578369, -1.9377696514129639, -1.8544608354568481, -1.7711519002914429, -1.6878430843353271, -1.6045341491699219, -1.5212252140045166, -1.4379163980484009, -1.3546075820922852, -1.2712986469268799, -1.1879898309707642, -1.1046808958053589, -1.0213720798492432, -0.9380631446838379, -0.8547542691230774, -0.7714453935623169, -0.6881364583969116, -0.6048275828361511, -0.5215187072753906, -0.43820980191230774, -0.35490092635154724, -0.27159205079078674, -0.18828314542770386, -0.10497426986694336, -0.02166539430618286, 0.061643488705158234, 0.14495237171649933, 0.22826126217842102, 0.3115701377391815, 0.394879013299942, 0.4781879186630249, 0.5614967942237854, 0.6448056697845459, 0.7281145453453064, 0.8114234209060669, 0.8947323560714722, 0.9780411720275879, 1.0613501071929932, 1.1446590423583984, 1.2279678583145142, 1.3112766742706299, 1.3945856094360352, 1.4778944253921509, 1.5612033605575562, 1.6445121765136719, 1.7278211116790771, 1.8111300468444824, 1.8944388628005981, 1.9777477979660034, 2.061056613922119, 2.1443655490875244, 2.2276744842529297, 2.310983419418335, 2.394292116165161, 2.4776010513305664, 2.5609099864959717, 2.644218921661377, 2.7275278568267822, 2.8108367919921875, 2.8941454887390137, 2.977454423904419, 3.060763359069824, 3.1440722942352295, 3.2273812294006348, 3.310689926147461]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 6.0, 5.0, 4.0, 6.0, 10.0, 8.0, 9.0, 18.0, 25.0, 21.0, 20.0, 30.0, 34.0, 34.0, 55.0, 44.0, 79.0, 84.0, 100.0, 71.0, 64.0, 30.0, 42.0, 40.0, 28.0, 22.0, 28.0, 21.0, 12.0, 12.0, 10.0, 9.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.5481157302856445, -2.479661226272583, -2.4112067222595215, -2.34275221824646, -2.2742977142333984, -2.205843448638916, -2.1373889446258545, -2.068934440612793, -2.0004799365997314, -1.93202543258667, -1.8635709285736084, -1.7951165437698364, -1.726662039756775, -1.6582075357437134, -1.5897531509399414, -1.5212986469268799, -1.4528441429138184, -1.3843896389007568, -1.3159351348876953, -1.2474807500839233, -1.1790262460708618, -1.1105717420578003, -1.0421173572540283, -0.9736628532409668, -0.9052083492279053, -0.8367538452148438, -0.768299400806427, -0.6998449563980103, -0.6313904523849487, -0.5629359483718872, -0.49448150396347046, -0.4260270297527313, -0.3575727939605713, -0.28911831974983215, -0.22066384553909302, -0.15220937132835388, -0.08375489711761475, -0.01530042290687561, 0.053154051303863525, 0.12160852551460266, 0.1900629997253418, 0.25851747393608093, 0.32697194814682007, 0.3954264223575592, 0.46388089656829834, 0.5323354005813599, 0.6007898449897766, 0.6692442893981934, 0.7376987934112549, 0.8061532974243164, 0.8746077418327332, 0.9430621862411499, 1.0115166902542114, 1.079971194267273, 1.148425579071045, 1.2168800830841064, 1.285334587097168, 1.3537890911102295, 1.422243595123291, 1.490697979927063, 1.5591524839401245, 1.627606987953186, 1.696061372756958, 1.7645158767700195, 1.832970380783081]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 13.0, 8.0, 13.0, 21.0, 18.0, 34.0, 47.0, 73.0, 93.0, 138.0, 304.0, 478.0, 825.0, 1603.0, 3170.0, 7134.0, 19490.0, 73770.0, 418065.0, 2278868.0, 1160617.0, 172508.0, 35938.0, 11567.0, 4588.0, 2200.0, 1112.0, 585.0, 345.0, 229.0, 124.0, 86.0, 50.0, 51.0, 34.0, 21.0, 23.0, 13.0, 6.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1309814453125, -0.12608718872070312, -0.12119293212890625, -0.11629867553710938, -0.1114044189453125, -0.10651016235351562, -0.10161590576171875, -0.09672164916992188, -0.091827392578125, -0.08693313598632812, -0.08203887939453125, -0.07714462280273438, -0.0722503662109375, -0.06735610961914062, -0.06246185302734375, -0.057567596435546875, -0.05267333984375, -0.047779083251953125, -0.04288482666015625, -0.037990570068359375, -0.0330963134765625, -0.028202056884765625, -0.02330780029296875, -0.018413543701171875, -0.013519287109375, -0.008625030517578125, -0.00373077392578125, 0.001163482666015625, 0.0060577392578125, 0.010951995849609375, 0.01584625244140625, 0.020740509033203125, 0.025634765625, 0.030529022216796875, 0.03542327880859375, 0.040317535400390625, 0.0452117919921875, 0.050106048583984375, 0.05500030517578125, 0.059894561767578125, 0.064788818359375, 0.06968307495117188, 0.07457733154296875, 0.07947158813476562, 0.0843658447265625, 0.08926010131835938, 0.09415435791015625, 0.09904861450195312, 0.10394287109375, 0.10883712768554688, 0.11373138427734375, 0.11862564086914062, 0.1235198974609375, 0.12841415405273438, 0.13330841064453125, 0.13820266723632812, 0.143096923828125, 0.14799118041992188, 0.15288543701171875, 0.15777969360351562, 0.1626739501953125, 0.16756820678710938, 0.17246246337890625, 0.17735671997070312, 0.1822509765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 8.0, 10.0, 7.0, 7.0, 11.0, 13.0, 20.0, 13.0, 23.0, 25.0, 18.0, 19.0, 28.0, 34.0, 30.0, 38.0, 41.0, 37.0, 52.0, 45.0, 36.0, 32.0, 38.0, 41.0, 50.0, 42.0, 31.0, 30.0, 23.0, 20.0, 26.0, 16.0, 33.0, 16.0, 15.0, 9.0, 6.0, 9.0, 12.0, 9.0, 4.0, 1.0, 4.0, 5.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1064453125, -0.10318946838378906, -0.09993362426757812, -0.09667778015136719, -0.09342193603515625, -0.09016609191894531, -0.08691024780273438, -0.08365440368652344, -0.0803985595703125, -0.07714271545410156, -0.07388687133789062, -0.07063102722167969, -0.06737518310546875, -0.06411933898925781, -0.060863494873046875, -0.05760765075683594, -0.054351806640625, -0.05109596252441406, -0.047840118408203125, -0.04458427429199219, -0.04132843017578125, -0.03807258605957031, -0.034816741943359375, -0.03156089782714844, -0.0283050537109375, -0.025049209594726562, -0.021793365478515625, -0.018537521362304688, -0.01528167724609375, -0.012025833129882812, -0.008769989013671875, -0.0055141448974609375, -0.00225830078125, 0.0009975433349609375, 0.004253387451171875, 0.0075092315673828125, 0.01076507568359375, 0.014020919799804688, 0.017276763916015625, 0.020532608032226562, 0.0237884521484375, 0.027044296264648438, 0.030300140380859375, 0.03355598449707031, 0.03681182861328125, 0.04006767272949219, 0.043323516845703125, 0.04657936096191406, 0.049835205078125, 0.05309104919433594, 0.056346893310546875, 0.05960273742675781, 0.06285858154296875, 0.06611442565917969, 0.06937026977539062, 0.07262611389160156, 0.0758819580078125, 0.07913780212402344, 0.08239364624023438, 0.08564949035644531, 0.08890533447265625, 0.09216117858886719, 0.09541702270507812, 0.09867286682128906, 0.1019287109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 7.0, 12.0, 13.0, 42.0, 48.0, 71.0, 121.0, 257.0, 590.0, 1647.0, 5637.0, 29773.0, 356561.0, 3566164.0, 204520.0, 21795.0, 4554.0, 1376.0, 507.0, 221.0, 119.0, 76.0, 44.0, 33.0, 21.0, 21.0, 4.0, 12.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.3968162536621094, -0.38494110107421875, -0.3730659484863281, -0.3611907958984375, -0.3493156433105469, -0.33744049072265625, -0.3255653381347656, -0.313690185546875, -0.3018150329589844, -0.28993988037109375, -0.2780647277832031, -0.2661895751953125, -0.2543144226074219, -0.24243927001953125, -0.23056411743164062, -0.21868896484375, -0.20681381225585938, -0.19493865966796875, -0.18306350708007812, -0.1711883544921875, -0.15931320190429688, -0.14743804931640625, -0.13556289672851562, -0.123687744140625, -0.11181259155273438, -0.09993743896484375, -0.08806228637695312, -0.0761871337890625, -0.06431198120117188, -0.05243682861328125, -0.040561676025390625, -0.0286865234375, -0.016811370849609375, -0.00493621826171875, 0.006938934326171875, 0.0188140869140625, 0.030689239501953125, 0.04256439208984375, 0.054439544677734375, 0.066314697265625, 0.07818984985351562, 0.09006500244140625, 0.10194015502929688, 0.1138153076171875, 0.12569046020507812, 0.13756561279296875, 0.14944076538085938, 0.16131591796875, 0.17319107055664062, 0.18506622314453125, 0.19694137573242188, 0.2088165283203125, 0.22069168090820312, 0.23256683349609375, 0.24444198608398438, 0.256317138671875, 0.2681922912597656, 0.28006744384765625, 0.2919425964355469, 0.3038177490234375, 0.3156929016113281, 0.32756805419921875, 0.3394432067871094, 0.351318359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 11.0, 16.0, 21.0, 26.0, 33.0, 53.0, 67.0, 139.0, 196.0, 340.0, 554.0, 789.0, 684.0, 401.0, 264.0, 159.0, 88.0, 62.0, 34.0, 33.0, 24.0, 21.0, 18.0, 8.0, 3.0, 2.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29840087890625, -0.2886962890625, -0.27899169921875, -0.269287109375, -0.25958251953125, -0.2498779296875, -0.24017333984375, -0.23046875, -0.22076416015625, -0.2110595703125, -0.20135498046875, -0.191650390625, -0.18194580078125, -0.1722412109375, -0.16253662109375, -0.15283203125, -0.14312744140625, -0.1334228515625, -0.12371826171875, -0.114013671875, -0.10430908203125, -0.0946044921875, -0.08489990234375, -0.0751953125, -0.06549072265625, -0.0557861328125, -0.04608154296875, -0.036376953125, -0.02667236328125, -0.0169677734375, -0.00726318359375, 0.00244140625, 0.01214599609375, 0.0218505859375, 0.03155517578125, 0.041259765625, 0.05096435546875, 0.0606689453125, 0.07037353515625, 0.080078125, 0.08978271484375, 0.0994873046875, 0.10919189453125, 0.118896484375, 0.12860107421875, 0.1383056640625, 0.14801025390625, 0.15771484375, 0.16741943359375, 0.1771240234375, 0.18682861328125, 0.196533203125, 0.20623779296875, 0.2159423828125, 0.22564697265625, 0.2353515625, 0.24505615234375, 0.2547607421875, 0.26446533203125, 0.274169921875, 0.28387451171875, 0.2935791015625, 0.30328369140625, 0.31298828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 10.0, 18.0, 34.0, 107.0, 206.0, 225.0, 197.0, 118.0, 44.0, 15.0, 6.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9273905754089355, -3.8071742057800293, -3.686957597732544, -3.5667412281036377, -3.4465246200561523, -3.326308250427246, -3.2060916423797607, -3.0858752727508545, -2.965658664703369, -2.845442295074463, -2.7252256870269775, -2.6050093173980713, -2.484792709350586, -2.3645763397216797, -2.2443597316741943, -2.124143362045288, -2.0039267539978027, -1.883710265159607, -1.7634937763214111, -1.6432772874832153, -1.5230607986450195, -1.4028444290161133, -1.282627820968628, -1.1624114513397217, -1.0421950817108154, -0.9219785928726196, -0.8017621040344238, -0.681545615196228, -0.5613291263580322, -0.4411126971244812, -0.3208962082862854, -0.2006797194480896, -0.08046317100524902, 0.03975331038236618, 0.15996979176998138, 0.280186265707016, 0.4004027545452118, 0.5206192135810852, 0.640835702419281, 0.7610521912574768, 0.8812686800956726, 1.0014851093292236, 1.1217015981674194, 1.2419180870056152, 1.362134575843811, 1.4823510646820068, 1.6025675535202026, 1.7227840423583984, 1.8430005311965942, 1.96321702003479, 2.0834333896636963, 2.2036499977111816, 2.323866367340088, 2.4440829753875732, 2.5642993450164795, 2.684515953063965, 2.804732322692871, 2.9249486923217773, 3.0451653003692627, 3.165381669998169, 3.2855982780456543, 3.4058146476745605, 3.526031255722046, 3.646247625350952, 3.7664642333984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 12.0, 10.0, 9.0, 15.0, 11.0, 16.0, 23.0, 29.0, 21.0, 24.0, 29.0, 42.0, 38.0, 48.0, 35.0, 54.0, 41.0, 47.0, 40.0, 33.0, 39.0, 43.0, 44.0, 48.0, 31.0, 37.0, 25.0, 24.0, 21.0, 19.0, 14.0, 16.0, 7.0, 12.0, 11.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.117948293685913, -1.0799614191055298, -1.0419745445251465, -1.0039876699447632, -0.9660007953643799, -0.9280139207839966, -0.8900269865989685, -0.8520401120185852, -0.8140532374382019, -0.7760663628578186, -0.7380794882774353, -0.700092613697052, -0.6621056795120239, -0.6241188049316406, -0.5861319303512573, -0.548145055770874, -0.5101581811904907, -0.4721713066101074, -0.4341844320297241, -0.39619752764701843, -0.35821065306663513, -0.32022377848625183, -0.28223687410354614, -0.24424999952316284, -0.20626312494277954, -0.16827625036239624, -0.13028936088085175, -0.09230247884988785, -0.05431559681892395, -0.01632872223854065, 0.021658167243003845, 0.05964505672454834, 0.09763193130493164, 0.13561880588531494, 0.17360569536685944, 0.21159258484840393, 0.24957945942878723, 0.28756633400917053, 0.3255532383918762, 0.3635401129722595, 0.4015269875526428, 0.4395138621330261, 0.4775007367134094, 0.5154876112937927, 0.5534745454788208, 0.5914614200592041, 0.6294482946395874, 0.6674351692199707, 0.705422043800354, 0.7434089183807373, 0.7813957929611206, 0.8193826675415039, 0.8573695421218872, 0.8953564167022705, 0.9333433508872986, 0.9713302254676819, 1.00931715965271, 1.0473040342330933, 1.0852909088134766, 1.1232777833938599, 1.1612646579742432, 1.1992515325546265, 1.2372384071350098, 1.2752254009246826, 1.3132121562957764]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 14.0, 21.0, 34.0, 61.0, 64.0, 103.0, 161.0, 226.0, 369.0, 600.0, 1063.0, 2035.0, 4293.0, 10553.0, 32026.0, 134745.0, 494091.0, 278270.0, 59961.0, 17188.0, 6313.0, 2830.0, 1417.0, 751.0, 464.0, 267.0, 195.0, 140.0, 71.0, 61.0, 39.0, 32.0, 20.0, 14.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2095947265625, -0.2029895782470703, -0.19638442993164062, -0.18977928161621094, -0.18317413330078125, -0.17656898498535156, -0.16996383666992188, -0.1633586883544922, -0.1567535400390625, -0.1501483917236328, -0.14354324340820312, -0.13693809509277344, -0.13033294677734375, -0.12372779846191406, -0.11712265014648438, -0.11051750183105469, -0.103912353515625, -0.09730720520019531, -0.09070205688476562, -0.08409690856933594, -0.07749176025390625, -0.07088661193847656, -0.06428146362304688, -0.05767631530761719, -0.0510711669921875, -0.04446601867675781, -0.037860870361328125, -0.03125572204589844, -0.02465057373046875, -0.018045425415039062, -0.011440277099609375, -0.0048351287841796875, 0.00177001953125, 0.008375167846679688, 0.014980316162109375, 0.021585464477539062, 0.02819061279296875, 0.03479576110839844, 0.041400909423828125, 0.04800605773925781, 0.0546112060546875, 0.06121635437011719, 0.06782150268554688, 0.07442665100097656, 0.08103179931640625, 0.08763694763183594, 0.09424209594726562, 0.10084724426269531, 0.107452392578125, 0.11405754089355469, 0.12066268920898438, 0.12726783752441406, 0.13387298583984375, 0.14047813415527344, 0.14708328247070312, 0.1536884307861328, 0.1602935791015625, 0.1668987274169922, 0.17350387573242188, 0.18010902404785156, 0.18671417236328125, 0.19331932067871094, 0.19992446899414062, 0.2065296173095703, 0.213134765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 4.0, 5.0, 8.0, 11.0, 12.0, 18.0, 16.0, 25.0, 20.0, 24.0, 30.0, 34.0, 36.0, 39.0, 28.0, 40.0, 43.0, 59.0, 36.0, 55.0, 49.0, 40.0, 37.0, 52.0, 40.0, 30.0, 27.0, 17.0, 27.0, 20.0, 17.0, 12.0, 15.0, 18.0, 11.0, 12.0, 5.0, 4.0, 6.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11529541015625, -0.11155891418457031, -0.10782241821289062, -0.10408592224121094, -0.10034942626953125, -0.09661293029785156, -0.09287643432617188, -0.08913993835449219, -0.0854034423828125, -0.08166694641113281, -0.07793045043945312, -0.07419395446777344, -0.07045745849609375, -0.06672096252441406, -0.06298446655273438, -0.05924797058105469, -0.055511474609375, -0.05177497863769531, -0.048038482666015625, -0.04430198669433594, -0.04056549072265625, -0.03682899475097656, -0.033092498779296875, -0.029356002807617188, -0.0256195068359375, -0.021883010864257812, -0.018146514892578125, -0.014410018920898438, -0.01067352294921875, -0.0069370269775390625, -0.003200531005859375, 0.0005359649658203125, 0.0042724609375, 0.008008956909179688, 0.011745452880859375, 0.015481948852539062, 0.01921844482421875, 0.022954940795898438, 0.026691436767578125, 0.030427932739257812, 0.0341644287109375, 0.03790092468261719, 0.041637420654296875, 0.04537391662597656, 0.04911041259765625, 0.05284690856933594, 0.056583404541015625, 0.06031990051269531, 0.064056396484375, 0.06779289245605469, 0.07152938842773438, 0.07526588439941406, 0.07900238037109375, 0.08273887634277344, 0.08647537231445312, 0.09021186828613281, 0.0939483642578125, 0.09768486022949219, 0.10142135620117188, 0.10515785217285156, 0.10889434814453125, 0.11263084411621094, 0.11636734008789062, 0.12010383605957031, 0.12384033203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 2.0, 6.0, 6.0, 10.0, 7.0, 11.0, 17.0, 26.0, 34.0, 43.0, 50.0, 64.0, 99.0, 123.0, 190.0, 279.0, 493.0, 940.0, 1938.0, 4956.0, 18751.0, 133671.0, 762224.0, 100904.0, 15310.0, 4301.0, 1734.0, 858.0, 473.0, 299.0, 216.0, 127.0, 94.0, 57.0, 55.0, 56.0, 35.0, 21.0, 16.0, 16.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.334716796875, -0.3252716064453125, -0.315826416015625, -0.3063812255859375, -0.29693603515625, -0.2874908447265625, -0.278045654296875, -0.2686004638671875, -0.2591552734375, -0.2497100830078125, -0.240264892578125, -0.2308197021484375, -0.22137451171875, -0.2119293212890625, -0.202484130859375, -0.1930389404296875, -0.18359375, -0.1741485595703125, -0.164703369140625, -0.1552581787109375, -0.14581298828125, -0.1363677978515625, -0.126922607421875, -0.1174774169921875, -0.1080322265625, -0.0985870361328125, -0.089141845703125, -0.0796966552734375, -0.07025146484375, -0.0608062744140625, -0.051361083984375, -0.0419158935546875, -0.032470703125, -0.0230255126953125, -0.013580322265625, -0.0041351318359375, 0.00531005859375, 0.0147552490234375, 0.024200439453125, 0.0336456298828125, 0.0430908203125, 0.0525360107421875, 0.061981201171875, 0.0714263916015625, 0.08087158203125, 0.0903167724609375, 0.099761962890625, 0.1092071533203125, 0.11865234375, 0.1280975341796875, 0.137542724609375, 0.1469879150390625, 0.15643310546875, 0.1658782958984375, 0.175323486328125, 0.1847686767578125, 0.1942138671875, 0.2036590576171875, 0.213104248046875, 0.2225494384765625, 0.23199462890625, 0.2414398193359375, 0.250885009765625, 0.2603302001953125, 0.269775390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 3.0, 8.0, 11.0, 12.0, 8.0, 17.0, 24.0, 35.0, 32.0, 63.0, 55.0, 66.0, 65.0, 59.0, 71.0, 61.0, 68.0, 62.0, 59.0, 42.0, 30.0, 26.0, 26.0, 20.0, 11.0, 14.0, 19.0, 8.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59765625, -0.5797653198242188, -0.5618743896484375, -0.5439834594726562, -0.526092529296875, -0.5082015991210938, -0.4903106689453125, -0.47241973876953125, -0.45452880859375, -0.43663787841796875, -0.4187469482421875, -0.40085601806640625, -0.382965087890625, -0.36507415771484375, -0.3471832275390625, -0.32929229736328125, -0.3114013671875, -0.29351043701171875, -0.2756195068359375, -0.25772857666015625, -0.239837646484375, -0.22194671630859375, -0.2040557861328125, -0.18616485595703125, -0.16827392578125, -0.15038299560546875, -0.1324920654296875, -0.11460113525390625, -0.096710205078125, -0.07881927490234375, -0.0609283447265625, -0.04303741455078125, -0.025146484375, -0.00725555419921875, 0.0106353759765625, 0.02852630615234375, 0.046417236328125, 0.06430816650390625, 0.0821990966796875, 0.10009002685546875, 0.11798095703125, 0.13587188720703125, 0.1537628173828125, 0.17165374755859375, 0.189544677734375, 0.20743560791015625, 0.2253265380859375, 0.24321746826171875, 0.2611083984375, 0.27899932861328125, 0.2968902587890625, 0.31478118896484375, 0.332672119140625, 0.35056304931640625, 0.3684539794921875, 0.38634490966796875, 0.40423583984375, 0.42212677001953125, 0.4400177001953125, 0.45790863037109375, 0.475799560546875, 0.49369049072265625, 0.5115814208984375, 0.5294723510742188, 0.54736328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 12.0, 16.0, 16.0, 11.0, 18.0, 27.0, 28.0, 45.0, 50.0, 113.0, 121.0, 197.0, 280.0, 485.0, 777.0, 1349.0, 2467.0, 4758.0, 9456.0, 21701.0, 57711.0, 201066.0, 573704.0, 108826.0, 35663.0, 14656.0, 6955.0, 3481.0, 1766.0, 1023.0, 618.0, 385.0, 247.0, 153.0, 104.0, 77.0, 47.0, 41.0, 26.0, 18.0, 21.0, 13.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.0733642578125, -0.0710906982421875, -0.068817138671875, -0.0665435791015625, -0.06427001953125, -0.0619964599609375, -0.059722900390625, -0.0574493408203125, -0.05517578125, -0.0529022216796875, -0.050628662109375, -0.0483551025390625, -0.04608154296875, -0.0438079833984375, -0.041534423828125, -0.0392608642578125, -0.0369873046875, -0.0347137451171875, -0.032440185546875, -0.0301666259765625, -0.02789306640625, -0.0256195068359375, -0.023345947265625, -0.0210723876953125, -0.018798828125, -0.0165252685546875, -0.014251708984375, -0.0119781494140625, -0.00970458984375, -0.0074310302734375, -0.005157470703125, -0.0028839111328125, -0.0006103515625, 0.0016632080078125, 0.003936767578125, 0.0062103271484375, 0.00848388671875, 0.0107574462890625, 0.013031005859375, 0.0153045654296875, 0.017578125, 0.0198516845703125, 0.022125244140625, 0.0243988037109375, 0.02667236328125, 0.0289459228515625, 0.031219482421875, 0.0334930419921875, 0.0357666015625, 0.0380401611328125, 0.040313720703125, 0.0425872802734375, 0.04486083984375, 0.0471343994140625, 0.049407958984375, 0.0516815185546875, 0.053955078125, 0.0562286376953125, 0.058502197265625, 0.0607757568359375, 0.06304931640625, 0.0653228759765625, 0.067596435546875, 0.0698699951171875, 0.0721435546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 9.0, 3.0, 7.0, 10.0, 14.0, 12.0, 23.0, 21.0, 29.0, 44.0, 55.0, 45.0, 70.0, 72.0, 77.0, 72.0, 70.0, 68.0, 54.0, 41.0, 46.0, 26.0, 17.0, 21.0, 12.0, 8.0, 9.0, 7.0, 7.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0], "bins": [-3.7550926208496094e-05, -3.6495737731456757e-05, -3.544054925441742e-05, -3.438536077737808e-05, -3.3330172300338745e-05, -3.227498382329941e-05, -3.121979534626007e-05, -3.0164606869220734e-05, -2.9109418392181396e-05, -2.805422991514206e-05, -2.6999041438102722e-05, -2.5943852961063385e-05, -2.4888664484024048e-05, -2.383347600698471e-05, -2.2778287529945374e-05, -2.1723099052906036e-05, -2.06679105758667e-05, -1.9612722098827362e-05, -1.8557533621788025e-05, -1.7502345144748688e-05, -1.644715666770935e-05, -1.5391968190670013e-05, -1.4336779713630676e-05, -1.3281591236591339e-05, -1.2226402759552002e-05, -1.1171214282512665e-05, -1.0116025805473328e-05, -9.06083732843399e-06, -8.005648851394653e-06, -6.950460374355316e-06, -5.895271897315979e-06, -4.840083420276642e-06, -3.7848949432373047e-06, -2.7297064661979675e-06, -1.6745179891586304e-06, -6.193295121192932e-07, 4.3585896492004395e-07, 1.491047441959381e-06, 2.5462359189987183e-06, 3.6014243960380554e-06, 4.656612873077393e-06, 5.71180135011673e-06, 6.766989827156067e-06, 7.822178304195404e-06, 8.877366781234741e-06, 9.932555258274078e-06, 1.0987743735313416e-05, 1.2042932212352753e-05, 1.309812068939209e-05, 1.4153309166431427e-05, 1.5208497643470764e-05, 1.62636861205101e-05, 1.731887459754944e-05, 1.8374063074588776e-05, 1.9429251551628113e-05, 2.048444002866745e-05, 2.1539628505706787e-05, 2.2594816982746124e-05, 2.365000545978546e-05, 2.47051939368248e-05, 2.5760382413864136e-05, 2.6815570890903473e-05, 2.787075936794281e-05, 2.8925947844982147e-05, 2.9981136322021484e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 9.0, 7.0, 11.0, 30.0, 23.0, 41.0, 63.0, 119.0, 187.0, 313.0, 594.0, 1202.0, 2590.0, 7228.0, 23952.0, 123938.0, 734041.0, 118745.0, 23332.0, 7019.0, 2600.0, 1122.0, 556.0, 300.0, 174.0, 116.0, 78.0, 59.0, 29.0, 22.0, 13.0, 10.0, 8.0, 7.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12335205078125, -0.11955547332763672, -0.11575889587402344, -0.11196231842041016, -0.10816574096679688, -0.1043691635131836, -0.10057258605957031, -0.09677600860595703, -0.09297943115234375, -0.08918285369873047, -0.08538627624511719, -0.0815896987915039, -0.07779312133789062, -0.07399654388427734, -0.07019996643066406, -0.06640338897705078, -0.0626068115234375, -0.05881023406982422, -0.05501365661621094, -0.051217079162597656, -0.047420501708984375, -0.043623924255371094, -0.03982734680175781, -0.03603076934814453, -0.03223419189453125, -0.02843761444091797, -0.024641036987304688, -0.020844459533691406, -0.017047882080078125, -0.013251304626464844, -0.009454727172851562, -0.005658149719238281, -0.001861572265625, 0.0019350051879882812, 0.0057315826416015625, 0.009528160095214844, 0.013324737548828125, 0.017121315002441406, 0.020917892456054688, 0.02471446990966797, 0.02851104736328125, 0.03230762481689453, 0.03610420227050781, 0.039900779724121094, 0.043697357177734375, 0.047493934631347656, 0.05129051208496094, 0.05508708953857422, 0.0588836669921875, 0.06268024444580078, 0.06647682189941406, 0.07027339935302734, 0.07406997680664062, 0.0778665542602539, 0.08166313171386719, 0.08545970916748047, 0.08925628662109375, 0.09305286407470703, 0.09684944152832031, 0.1006460189819336, 0.10444259643554688, 0.10823917388916016, 0.11203575134277344, 0.11583232879638672, 0.11962890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 4.0, 8.0, 8.0, 14.0, 29.0, 42.0, 39.0, 80.0, 110.0, 106.0, 109.0, 112.0, 84.0, 63.0, 53.0, 38.0, 29.0, 13.0, 23.0, 14.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.17626953125, -0.1721038818359375, -0.167938232421875, -0.1637725830078125, -0.15960693359375, -0.1554412841796875, -0.151275634765625, -0.1471099853515625, -0.1429443359375, -0.1387786865234375, -0.134613037109375, -0.1304473876953125, -0.12628173828125, -0.1221160888671875, -0.117950439453125, -0.1137847900390625, -0.109619140625, -0.1054534912109375, -0.101287841796875, -0.0971221923828125, -0.09295654296875, -0.0887908935546875, -0.084625244140625, -0.0804595947265625, -0.0762939453125, -0.0721282958984375, -0.067962646484375, -0.0637969970703125, -0.05963134765625, -0.0554656982421875, -0.051300048828125, -0.0471343994140625, -0.04296875, -0.0388031005859375, -0.034637451171875, -0.0304718017578125, -0.02630615234375, -0.0221405029296875, -0.017974853515625, -0.0138092041015625, -0.0096435546875, -0.0054779052734375, -0.001312255859375, 0.0028533935546875, 0.00701904296875, 0.0111846923828125, 0.015350341796875, 0.0195159912109375, 0.023681640625, 0.0278472900390625, 0.032012939453125, 0.0361785888671875, 0.04034423828125, 0.0445098876953125, 0.048675537109375, 0.0528411865234375, 0.0570068359375, 0.0611724853515625, 0.065338134765625, 0.0695037841796875, 0.07366943359375, 0.0778350830078125, 0.082000732421875, 0.0861663818359375, 0.09033203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 15.0, 4.0, 18.0, 31.0, 77.0, 107.0, 232.0, 246.0, 106.0, 58.0, 34.0, 16.0, 16.0, 9.0, 5.0, 7.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.111006021499634, -3.0370190143585205, -2.963031768798828, -2.889044761657715, -2.8150575160980225, -2.741070508956909, -2.667083263397217, -2.5930962562561035, -2.519109010696411, -2.445122003555298, -2.3711347579956055, -2.297147750854492, -2.2231605052948, -2.1491734981536865, -2.075186252593994, -2.001199245452881, -1.927212119102478, -1.8532249927520752, -1.7792378664016724, -1.7052507400512695, -1.6312636137008667, -1.5572764873504639, -1.4832894802093506, -1.4093022346496582, -1.335315227508545, -1.261328101158142, -1.1873409748077393, -1.1133538484573364, -1.0393667221069336, -0.9653795957565308, -0.8913925290107727, -0.8174054026603699, -0.7434182167053223, -0.6694310903549194, -0.5954439640045166, -0.5214568376541138, -0.4474697411060333, -0.3734826147556305, -0.29949551820755005, -0.22550839185714722, -0.15152126550674438, -0.07753414660692215, -0.0035470277070999146, 0.07044008374214172, 0.14442721009254456, 0.2184143364429474, 0.29240143299102783, 0.36638855934143066, 0.4403756856918335, 0.5143628120422363, 0.5883499383926392, 0.662337064743042, 0.7363241910934448, 0.8103113174438477, 0.8842983841896057, 0.9582855105400085, 1.0322725772857666, 1.1062597036361694, 1.1802468299865723, 1.254233956336975, 1.328221082687378, 1.4022082090377808, 1.4761953353881836, 1.5501823425292969, 1.6241695880889893]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 11.0, 15.0, 10.0, 8.0, 13.0, 6.0, 16.0, 24.0, 30.0, 29.0, 23.0, 29.0, 20.0, 42.0, 41.0, 54.0, 75.0, 70.0, 81.0, 57.0, 41.0, 37.0, 26.0, 28.0, 23.0, 32.0, 19.0, 11.0, 14.0, 21.0, 10.0, 6.0, 9.0, 12.0, 7.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.3790278434753418, -1.3324027061462402, -1.2857776880264282, -1.2391525506973267, -1.192527413368225, -1.1459022760391235, -1.0992772579193115, -1.05265212059021, -1.0060269832611084, -0.9594019055366516, -0.91277676820755, -0.8661516904830933, -0.8195265531539917, -0.7729014754295349, -0.7262763977050781, -0.6796512603759766, -0.6330261826515198, -0.586401104927063, -0.5397759675979614, -0.49315088987350464, -0.4465257525444031, -0.3999006748199463, -0.3532755672931671, -0.30665045976638794, -0.26002535223960876, -0.2134002447128296, -0.16677513718605042, -0.12015004456043243, -0.07352493703365326, -0.026899829506874084, 0.019725263118743896, 0.06635037064552307, 0.11297547817230225, 0.15960058569908142, 0.2062256932258606, 0.2528507709503174, 0.29947590827941895, 0.34610098600387573, 0.3927260935306549, 0.4393512010574341, 0.48597630858421326, 0.5326014161109924, 0.5792264938354492, 0.6258516311645508, 0.6724767088890076, 0.7191018462181091, 0.7657269239425659, 0.8123520612716675, 0.8589771389961243, 0.905602216720581, 0.9522273540496826, 0.9988524317741394, 1.0454775094985962, 1.0921026468276978, 1.1387277841567993, 1.1853528022766113, 1.231977939605713, 1.2786030769348145, 1.3252280950546265, 1.371853232383728, 1.4184783697128296, 1.4651035070419312, 1.5117285251617432, 1.5583536624908447, 1.6049787998199463]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 9.0, 8.0, 10.0, 11.0, 17.0, 18.0, 36.0, 63.0, 99.0, 123.0, 266.0, 499.0, 865.0, 1824.0, 3897.0, 10196.0, 33266.0, 153906.0, 981703.0, 2357448.0, 527707.0, 87842.0, 21315.0, 7126.0, 3006.0, 1304.0, 700.0, 379.0, 235.0, 143.0, 80.0, 62.0, 30.0, 34.0, 15.0, 8.0, 6.0, 8.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1868896484375, -0.18160057067871094, -0.17631149291992188, -0.1710224151611328, -0.16573333740234375, -0.1604442596435547, -0.15515518188476562, -0.14986610412597656, -0.1445770263671875, -0.13928794860839844, -0.13399887084960938, -0.1287097930908203, -0.12342071533203125, -0.11813163757324219, -0.11284255981445312, -0.10755348205566406, -0.102264404296875, -0.09697532653808594, -0.09168624877929688, -0.08639717102050781, -0.08110809326171875, -0.07581901550292969, -0.07052993774414062, -0.06524085998535156, -0.0599517822265625, -0.05466270446777344, -0.049373626708984375, -0.04408454895019531, -0.03879547119140625, -0.03350639343261719, -0.028217315673828125, -0.022928237915039062, -0.01763916015625, -0.012350082397460938, -0.007061004638671875, -0.0017719268798828125, 0.00351715087890625, 0.008806228637695312, 0.014095306396484375, 0.019384384155273438, 0.0246734619140625, 0.029962539672851562, 0.035251617431640625, 0.04054069519042969, 0.04582977294921875, 0.05111885070800781, 0.056407928466796875, 0.06169700622558594, 0.066986083984375, 0.07227516174316406, 0.07756423950195312, 0.08285331726074219, 0.08814239501953125, 0.09343147277832031, 0.09872055053710938, 0.10400962829589844, 0.1092987060546875, 0.11458778381347656, 0.11987686157226562, 0.1251659393310547, 0.13045501708984375, 0.1357440948486328, 0.14103317260742188, 0.14632225036621094, 0.151611328125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 9.0, 9.0, 14.0, 7.0, 14.0, 15.0, 23.0, 19.0, 22.0, 32.0, 28.0, 35.0, 30.0, 28.0, 33.0, 32.0, 33.0, 38.0, 33.0, 47.0, 39.0, 30.0, 39.0, 42.0, 33.0, 36.0, 30.0, 29.0, 28.0, 20.0, 20.0, 21.0, 18.0, 11.0, 19.0, 10.0, 16.0, 6.0, 9.0, 7.0, 4.0, 7.0, 10.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09674072265625, -0.09358024597167969, -0.09041976928710938, -0.08725929260253906, -0.08409881591796875, -0.08093833923339844, -0.07777786254882812, -0.07461738586425781, -0.0714569091796875, -0.06829643249511719, -0.06513595581054688, -0.06197547912597656, -0.05881500244140625, -0.05565452575683594, -0.052494049072265625, -0.04933357238769531, -0.046173095703125, -0.04301261901855469, -0.039852142333984375, -0.03669166564941406, -0.03353118896484375, -0.030370712280273438, -0.027210235595703125, -0.024049758911132812, -0.0208892822265625, -0.017728805541992188, -0.014568328857421875, -0.011407852172851562, -0.00824737548828125, -0.0050868988037109375, -0.001926422119140625, 0.0012340545654296875, 0.00439453125, 0.0075550079345703125, 0.010715484619140625, 0.013875961303710938, 0.01703643798828125, 0.020196914672851562, 0.023357391357421875, 0.026517868041992188, 0.0296783447265625, 0.03283882141113281, 0.035999298095703125, 0.03915977478027344, 0.04232025146484375, 0.04548072814941406, 0.048641204833984375, 0.05180168151855469, 0.054962158203125, 0.05812263488769531, 0.061283111572265625, 0.06444358825683594, 0.06760406494140625, 0.07076454162597656, 0.07392501831054688, 0.07708549499511719, 0.0802459716796875, 0.08340644836425781, 0.08656692504882812, 0.08972740173339844, 0.09288787841796875, 0.09604835510253906, 0.09920883178710938, 0.10236930847167969, 0.10552978515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 2.0, 11.0, 14.0, 16.0, 22.0, 46.0, 57.0, 80.0, 164.0, 290.0, 722.0, 2207.0, 9794.0, 76444.0, 2255857.0, 1771199.0, 64800.0, 8844.0, 2189.0, 758.0, 331.0, 161.0, 83.0, 51.0, 37.0, 31.0, 13.0, 9.0, 13.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.363037109375, -0.3516807556152344, -0.34032440185546875, -0.3289680480957031, -0.3176116943359375, -0.3062553405761719, -0.29489898681640625, -0.2835426330566406, -0.272186279296875, -0.2608299255371094, -0.24947357177734375, -0.23811721801757812, -0.2267608642578125, -0.21540451049804688, -0.20404815673828125, -0.19269180297851562, -0.18133544921875, -0.16997909545898438, -0.15862274169921875, -0.14726638793945312, -0.1359100341796875, -0.12455368041992188, -0.11319732666015625, -0.10184097290039062, -0.090484619140625, -0.07912826538085938, -0.06777191162109375, -0.056415557861328125, -0.0450592041015625, -0.033702850341796875, -0.02234649658203125, -0.010990142822265625, 0.0003662109375, 0.011722564697265625, 0.02307891845703125, 0.034435272216796875, 0.0457916259765625, 0.057147979736328125, 0.06850433349609375, 0.07986068725585938, 0.091217041015625, 0.10257339477539062, 0.11392974853515625, 0.12528610229492188, 0.1366424560546875, 0.14799880981445312, 0.15935516357421875, 0.17071151733398438, 0.18206787109375, 0.19342422485351562, 0.20478057861328125, 0.21613693237304688, 0.2274932861328125, 0.23884963989257812, 0.25020599365234375, 0.2615623474121094, 0.272918701171875, 0.2842750549316406, 0.29563140869140625, 0.3069877624511719, 0.3183441162109375, 0.3297004699707031, 0.34105682373046875, 0.3524131774902344, 0.36376953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 17.0, 33.0, 33.0, 41.0, 60.0, 74.0, 121.0, 155.0, 250.0, 398.0, 580.0, 630.0, 552.0, 353.0, 239.0, 148.0, 99.0, 77.0, 56.0, 42.0, 23.0, 11.0, 13.0, 12.0, 8.0, 9.0, 2.0, 6.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2025146484375, -0.1938915252685547, -0.18526840209960938, -0.17664527893066406, -0.16802215576171875, -0.15939903259277344, -0.15077590942382812, -0.1421527862548828, -0.1335296630859375, -0.12490653991699219, -0.11628341674804688, -0.10766029357910156, -0.09903717041015625, -0.09041404724121094, -0.08179092407226562, -0.07316780090332031, -0.064544677734375, -0.05592155456542969, -0.047298431396484375, -0.03867530822753906, -0.03005218505859375, -0.021429061889648438, -0.012805938720703125, -0.0041828155517578125, 0.0044403076171875, 0.013063430786132812, 0.021686553955078125, 0.030309677124023438, 0.03893280029296875, 0.04755592346191406, 0.056179046630859375, 0.06480216979980469, 0.07342529296875, 0.08204841613769531, 0.09067153930664062, 0.09929466247558594, 0.10791778564453125, 0.11654090881347656, 0.12516403198242188, 0.1337871551513672, 0.1424102783203125, 0.1510334014892578, 0.15965652465820312, 0.16827964782714844, 0.17690277099609375, 0.18552589416503906, 0.19414901733398438, 0.2027721405029297, 0.211395263671875, 0.2200183868408203, 0.22864151000976562, 0.23726463317871094, 0.24588775634765625, 0.25451087951660156, 0.2631340026855469, 0.2717571258544922, 0.2803802490234375, 0.2890033721923828, 0.2976264953613281, 0.30624961853027344, 0.31487274169921875, 0.32349586486816406, 0.3321189880371094, 0.3407421112060547, 0.349365234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 6.0, 8.0, 28.0, 38.0, 58.0, 88.0, 105.0, 154.0, 123.0, 127.0, 90.0, 59.0, 35.0, 25.0, 12.0, 7.0, 3.0, 4.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2555696964263916, -2.1898317337036133, -2.124093532562256, -2.0583555698394775, -1.9926173686981201, -1.9268792867660522, -1.8611412048339844, -1.795403242111206, -1.7296650409698486, -1.6639269590377808, -1.598188877105713, -1.532450795173645, -1.4667127132415771, -1.4009746313095093, -1.3352365493774414, -1.269498586654663, -1.2037605047225952, -1.1380224227905273, -1.0722843408584595, -1.0065462589263916, -0.9408081769943237, -0.8750700950622559, -0.8093320727348328, -0.7435939908027649, -0.677855908870697, -0.6121178269386292, -0.5463797450065613, -0.4806416928768158, -0.4149036109447479, -0.34916552901268005, -0.28342747688293457, -0.2176893949508667, -0.15195119380950928, -0.086213119328022, -0.02047504484653473, 0.04526302218437195, 0.11100110411643982, 0.1767391860485077, 0.24247723817825317, 0.30821532011032104, 0.3739534020423889, 0.4396914839744568, 0.5054295659065247, 0.5711675882339478, 0.6369056701660156, 0.7026437520980835, 0.7683818340301514, 0.8341199159622192, 0.8998579978942871, 0.965596079826355, 1.0313341617584229, 1.0970722436904907, 1.1628103256225586, 1.2285484075546265, 1.2942864894866943, 1.3600244522094727, 1.42576265335083, 1.491500735282898, 1.5572388172149658, 1.6229768991470337, 1.6887149810791016, 1.7544530630111694, 1.8201911449432373, 1.8859291076660156, 1.9516671895980835]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 8.0, 20.0, 13.0, 37.0, 26.0, 37.0, 43.0, 55.0, 63.0, 57.0, 67.0, 58.0, 87.0, 65.0, 52.0, 56.0, 43.0, 49.0, 38.0, 27.0, 23.0, 16.0, 16.0, 12.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3563575744628906, -1.3047322034835815, -1.253106713294983, -1.2014813423156738, -1.1498559713363647, -1.0982306003570557, -1.046605110168457, -0.994979739189148, -0.9433543086051941, -0.8917288780212402, -0.8401035070419312, -0.7884780764579773, -0.7368526458740234, -0.6852272748947144, -0.6336018443107605, -0.5819764137268066, -0.5303510427474976, -0.4787256419658661, -0.4271002411842346, -0.37547481060028076, -0.3238494098186493, -0.2722240090370178, -0.22059857845306396, -0.1689731776714325, -0.11734777688980103, -0.06572236865758896, -0.014096960425376892, 0.03752845525741577, 0.08915385603904724, 0.1407792568206787, 0.19240468740463257, 0.24403008818626404, 0.2956554889678955, 0.347280889749527, 0.39890629053115845, 0.4505317211151123, 0.5021570920944214, 0.5537825226783752, 0.6054079532623291, 0.6570333242416382, 0.708658754825592, 0.7602841854095459, 0.811909556388855, 0.8635349869728088, 0.9151604175567627, 0.9667857885360718, 1.0184111595153809, 1.0700366497039795, 1.1216620206832886, 1.1732873916625977, 1.2249128818511963, 1.2765382528305054, 1.3281636238098145, 1.379789113998413, 1.4314144849777222, 1.4830398559570312, 1.5346653461456299, 1.586290717124939, 1.6379162073135376, 1.6895415782928467, 1.7411669492721558, 1.7927923202514648, 1.8444178104400635, 1.8960431814193726, 1.9476685523986816]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 7.0, 6.0, 14.0, 14.0, 26.0, 32.0, 50.0, 55.0, 100.0, 121.0, 159.0, 295.0, 510.0, 714.0, 1224.0, 2232.0, 4188.0, 8322.0, 18460.0, 44435.0, 132203.0, 398092.0, 289317.0, 87478.0, 32535.0, 13706.0, 6495.0, 3249.0, 1676.0, 1019.0, 609.0, 389.0, 267.0, 173.0, 119.0, 75.0, 62.0, 38.0, 35.0, 18.0, 9.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14699935913085938, -0.14189910888671875, -0.13679885864257812, -0.1316986083984375, -0.12659835815429688, -0.12149810791015625, -0.11639785766601562, -0.111297607421875, -0.10619735717773438, -0.10109710693359375, -0.09599685668945312, -0.0908966064453125, -0.08579635620117188, -0.08069610595703125, -0.07559585571289062, -0.07049560546875, -0.06539535522460938, -0.06029510498046875, -0.055194854736328125, -0.0500946044921875, -0.044994354248046875, -0.03989410400390625, -0.034793853759765625, -0.029693603515625, -0.024593353271484375, -0.01949310302734375, -0.014392852783203125, -0.0092926025390625, -0.004192352294921875, 0.00090789794921875, 0.006008148193359375, 0.0111083984375, 0.016208648681640625, 0.02130889892578125, 0.026409149169921875, 0.0315093994140625, 0.036609649658203125, 0.04170989990234375, 0.046810150146484375, 0.051910400390625, 0.057010650634765625, 0.06211090087890625, 0.06721115112304688, 0.0723114013671875, 0.07741165161132812, 0.08251190185546875, 0.08761215209960938, 0.09271240234375, 0.09781265258789062, 0.10291290283203125, 0.10801315307617188, 0.1131134033203125, 0.11821365356445312, 0.12331390380859375, 0.12841415405273438, 0.133514404296875, 0.13861465454101562, 0.14371490478515625, 0.14881515502929688, 0.1539154052734375, 0.15901565551757812, 0.16411590576171875, 0.16921615600585938, 0.17431640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 7.0, 10.0, 20.0, 9.0, 15.0, 21.0, 22.0, 21.0, 25.0, 41.0, 41.0, 45.0, 37.0, 39.0, 45.0, 54.0, 47.0, 47.0, 53.0, 47.0, 34.0, 36.0, 32.0, 26.0, 32.0, 21.0, 26.0, 25.0, 15.0, 16.0, 15.0, 14.0, 11.0, 11.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.12103271484375, -0.1172018051147461, -0.11337089538574219, -0.10953998565673828, -0.10570907592773438, -0.10187816619873047, -0.09804725646972656, -0.09421634674072266, -0.09038543701171875, -0.08655452728271484, -0.08272361755371094, -0.07889270782470703, -0.07506179809570312, -0.07123088836669922, -0.06739997863769531, -0.0635690689086914, -0.0597381591796875, -0.055907249450683594, -0.05207633972167969, -0.04824542999267578, -0.044414520263671875, -0.04058361053466797, -0.03675270080566406, -0.032921791076660156, -0.02909088134765625, -0.025259971618652344, -0.021429061889648438, -0.01759815216064453, -0.013767242431640625, -0.009936332702636719, -0.0061054229736328125, -0.0022745132446289062, 0.001556396484375, 0.005387306213378906, 0.009218215942382812, 0.013049125671386719, 0.016880035400390625, 0.02071094512939453, 0.024541854858398438, 0.028372764587402344, 0.03220367431640625, 0.036034584045410156, 0.03986549377441406, 0.04369640350341797, 0.047527313232421875, 0.05135822296142578, 0.05518913269042969, 0.059020042419433594, 0.0628509521484375, 0.0666818618774414, 0.07051277160644531, 0.07434368133544922, 0.07817459106445312, 0.08200550079345703, 0.08583641052246094, 0.08966732025146484, 0.09349822998046875, 0.09732913970947266, 0.10116004943847656, 0.10499095916748047, 0.10882186889648438, 0.11265277862548828, 0.11648368835449219, 0.1203145980834961, 0.1241455078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 4.0, 4.0, 7.0, 17.0, 23.0, 45.0, 51.0, 83.0, 180.0, 290.0, 514.0, 1239.0, 3912.0, 23690.0, 757520.0, 241553.0, 14411.0, 2958.0, 959.0, 455.0, 237.0, 135.0, 89.0, 51.0, 44.0, 26.0, 17.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.3515815734863281, -0.33621978759765625, -0.3208580017089844, -0.3054962158203125, -0.2901344299316406, -0.27477264404296875, -0.2594108581542969, -0.244049072265625, -0.22868728637695312, -0.21332550048828125, -0.19796371459960938, -0.1826019287109375, -0.16724014282226562, -0.15187835693359375, -0.13651657104492188, -0.12115478515625, -0.10579299926757812, -0.09043121337890625, -0.07506942749023438, -0.0597076416015625, -0.044345855712890625, -0.02898406982421875, -0.013622283935546875, 0.001739501953125, 0.017101287841796875, 0.03246307373046875, 0.047824859619140625, 0.0631866455078125, 0.07854843139648438, 0.09391021728515625, 0.10927200317382812, 0.1246337890625, 0.13999557495117188, 0.15535736083984375, 0.17071914672851562, 0.1860809326171875, 0.20144271850585938, 0.21680450439453125, 0.23216629028320312, 0.247528076171875, 0.2628898620605469, 0.27825164794921875, 0.2936134338378906, 0.3089752197265625, 0.3243370056152344, 0.33969879150390625, 0.3550605773925781, 0.37042236328125, 0.3857841491699219, 0.40114593505859375, 0.4165077209472656, 0.4318695068359375, 0.4472312927246094, 0.46259307861328125, 0.4779548645019531, 0.493316650390625, 0.5086784362792969, 0.5240402221679688, 0.5394020080566406, 0.5547637939453125, 0.5701255798339844, 0.5854873657226562, 0.6008491516113281, 0.6162109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 15.0, 17.0, 27.0, 28.0, 22.0, 47.0, 45.0, 52.0, 50.0, 57.0, 79.0, 64.0, 68.0, 67.0, 65.0, 63.0, 42.0, 37.0, 24.0, 22.0, 19.0, 17.0, 7.0, 10.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4692726135253906, -0.45001983642578125, -0.4307670593261719, -0.4115142822265625, -0.3922615051269531, -0.37300872802734375, -0.3537559509277344, -0.334503173828125, -0.3152503967285156, -0.29599761962890625, -0.2767448425292969, -0.2574920654296875, -0.23823928833007812, -0.21898651123046875, -0.19973373413085938, -0.18048095703125, -0.16122817993164062, -0.14197540283203125, -0.12272262573242188, -0.1034698486328125, -0.08421707153320312, -0.06496429443359375, -0.045711517333984375, -0.026458740234375, -0.007205963134765625, 0.01204681396484375, 0.031299591064453125, 0.0505523681640625, 0.06980514526367188, 0.08905792236328125, 0.10831069946289062, 0.1275634765625, 0.14681625366210938, 0.16606903076171875, 0.18532180786132812, 0.2045745849609375, 0.22382736206054688, 0.24308013916015625, 0.2623329162597656, 0.281585693359375, 0.3008384704589844, 0.32009124755859375, 0.3393440246582031, 0.3585968017578125, 0.3778495788574219, 0.39710235595703125, 0.4163551330566406, 0.43560791015625, 0.4548606872558594, 0.47411346435546875, 0.4933662414550781, 0.5126190185546875, 0.5318717956542969, 0.5511245727539062, 0.5703773498535156, 0.589630126953125, 0.6088829040527344, 0.6281356811523438, 0.6473884582519531, 0.6666412353515625, 0.6858940124511719, 0.7051467895507812, 0.7243995666503906, 0.74365234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 3.0, 5.0, 15.0, 16.0, 22.0, 51.0, 69.0, 115.0, 147.0, 280.0, 534.0, 1097.0, 2373.0, 5997.0, 20126.0, 120246.0, 785243.0, 86480.0, 16494.0, 5191.0, 2049.0, 899.0, 467.0, 238.0, 140.0, 86.0, 67.0, 34.0, 23.0, 13.0, 9.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1204833984375, -0.1172637939453125, -0.114044189453125, -0.1108245849609375, -0.10760498046875, -0.1043853759765625, -0.101165771484375, -0.0979461669921875, -0.0947265625, -0.0915069580078125, -0.088287353515625, -0.0850677490234375, -0.08184814453125, -0.0786285400390625, -0.075408935546875, -0.0721893310546875, -0.0689697265625, -0.0657501220703125, -0.062530517578125, -0.0593109130859375, -0.05609130859375, -0.0528717041015625, -0.049652099609375, -0.0464324951171875, -0.043212890625, -0.0399932861328125, -0.036773681640625, -0.0335540771484375, -0.03033447265625, -0.0271148681640625, -0.023895263671875, -0.0206756591796875, -0.0174560546875, -0.0142364501953125, -0.011016845703125, -0.0077972412109375, -0.00457763671875, -0.0013580322265625, 0.001861572265625, 0.0050811767578125, 0.00830078125, 0.0115203857421875, 0.014739990234375, 0.0179595947265625, 0.02117919921875, 0.0243988037109375, 0.027618408203125, 0.0308380126953125, 0.0340576171875, 0.0372772216796875, 0.040496826171875, 0.0437164306640625, 0.04693603515625, 0.0501556396484375, 0.053375244140625, 0.0565948486328125, 0.059814453125, 0.0630340576171875, 0.066253662109375, 0.0694732666015625, 0.07269287109375, 0.0759124755859375, 0.079132080078125, 0.0823516845703125, 0.0855712890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 8.0, 4.0, 3.0, 3.0, 5.0, 11.0, 13.0, 14.0, 15.0, 24.0, 29.0, 59.0, 84.0, 95.0, 105.0, 97.0, 103.0, 84.0, 57.0, 41.0, 33.0, 27.0, 12.0, 17.0, 17.0, 8.0, 6.0, 11.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.225969314575195e-05, -4.0903687477111816e-05, -3.954768180847168e-05, -3.819167613983154e-05, -3.6835670471191406e-05, -3.547966480255127e-05, -3.412365913391113e-05, -3.2767653465270996e-05, -3.141164779663086e-05, -3.0055642127990723e-05, -2.8699636459350586e-05, -2.734363079071045e-05, -2.5987625122070312e-05, -2.4631619453430176e-05, -2.327561378479004e-05, -2.1919608116149902e-05, -2.0563602447509766e-05, -1.920759677886963e-05, -1.7851591110229492e-05, -1.6495585441589355e-05, -1.5139579772949219e-05, -1.3783574104309082e-05, -1.2427568435668945e-05, -1.1071562767028809e-05, -9.715557098388672e-06, -8.359551429748535e-06, -7.0035457611083984e-06, -5.647540092468262e-06, -4.291534423828125e-06, -2.9355287551879883e-06, -1.5795230865478516e-06, -2.2351741790771484e-07, 1.1324882507324219e-06, 2.4884939193725586e-06, 3.844499588012695e-06, 5.200505256652832e-06, 6.556510925292969e-06, 7.912516593933105e-06, 9.268522262573242e-06, 1.0624527931213379e-05, 1.1980533599853516e-05, 1.3336539268493652e-05, 1.4692544937133789e-05, 1.6048550605773926e-05, 1.7404556274414062e-05, 1.87605619430542e-05, 2.0116567611694336e-05, 2.1472573280334473e-05, 2.282857894897461e-05, 2.4184584617614746e-05, 2.5540590286254883e-05, 2.689659595489502e-05, 2.8252601623535156e-05, 2.9608607292175293e-05, 3.096461296081543e-05, 3.2320618629455566e-05, 3.36766242980957e-05, 3.503262996673584e-05, 3.6388635635375977e-05, 3.774464130401611e-05, 3.910064697265625e-05, 4.045665264129639e-05, 4.1812658309936523e-05, 4.316866397857666e-05, 4.45246696472168e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 10.0, 8.0, 11.0, 22.0, 24.0, 28.0, 44.0, 72.0, 108.0, 195.0, 325.0, 579.0, 1134.0, 2444.0, 5874.0, 19289.0, 83723.0, 697055.0, 185256.0, 35777.0, 9812.0, 3488.0, 1494.0, 703.0, 374.0, 256.0, 150.0, 89.0, 54.0, 36.0, 34.0, 21.0, 15.0, 6.0, 17.0, 4.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0810546875, -0.0782327651977539, -0.07541084289550781, -0.07258892059326172, -0.06976699829101562, -0.06694507598876953, -0.06412315368652344, -0.061301231384277344, -0.05847930908203125, -0.055657386779785156, -0.05283546447753906, -0.05001354217529297, -0.047191619873046875, -0.04436969757080078, -0.04154777526855469, -0.038725852966308594, -0.0359039306640625, -0.033082008361816406, -0.030260086059570312, -0.02743816375732422, -0.024616241455078125, -0.02179431915283203, -0.018972396850585938, -0.016150474548339844, -0.01332855224609375, -0.010506629943847656, -0.0076847076416015625, -0.004862785339355469, -0.002040863037109375, 0.0007810592651367188, 0.0036029815673828125, 0.006424903869628906, 0.009246826171875, 0.012068748474121094, 0.014890670776367188, 0.01771259307861328, 0.020534515380859375, 0.02335643768310547, 0.026178359985351562, 0.029000282287597656, 0.03182220458984375, 0.034644126892089844, 0.03746604919433594, 0.04028797149658203, 0.043109893798828125, 0.04593181610107422, 0.04875373840332031, 0.051575660705566406, 0.0543975830078125, 0.057219505310058594, 0.06004142761230469, 0.06286334991455078, 0.06568527221679688, 0.06850719451904297, 0.07132911682128906, 0.07415103912353516, 0.07697296142578125, 0.07979488372802734, 0.08261680603027344, 0.08543872833251953, 0.08826065063476562, 0.09108257293701172, 0.09390449523925781, 0.0967264175415039, 0.09954833984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 7.0, 5.0, 5.0, 7.0, 11.0, 14.0, 11.0, 15.0, 17.0, 29.0, 22.0, 36.0, 51.0, 55.0, 65.0, 99.0, 92.0, 94.0, 73.0, 57.0, 51.0, 38.0, 20.0, 29.0, 13.0, 16.0, 15.0, 14.0, 10.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0838623046875, -0.0811929702758789, -0.07852363586425781, -0.07585430145263672, -0.07318496704101562, -0.07051563262939453, -0.06784629821777344, -0.06517696380615234, -0.06250762939453125, -0.059838294982910156, -0.05716896057128906, -0.05449962615966797, -0.051830291748046875, -0.04916095733642578, -0.04649162292480469, -0.043822288513183594, -0.0411529541015625, -0.038483619689941406, -0.03581428527832031, -0.03314495086669922, -0.030475616455078125, -0.02780628204345703, -0.025136947631835938, -0.022467613220214844, -0.01979827880859375, -0.017128944396972656, -0.014459609985351562, -0.011790275573730469, -0.009120941162109375, -0.006451606750488281, -0.0037822723388671875, -0.0011129379272460938, 0.001556396484375, 0.004225730895996094, 0.0068950653076171875, 0.009564399719238281, 0.012233734130859375, 0.014903068542480469, 0.017572402954101562, 0.020241737365722656, 0.02291107177734375, 0.025580406188964844, 0.028249740600585938, 0.03091907501220703, 0.033588409423828125, 0.03625774383544922, 0.03892707824707031, 0.041596412658691406, 0.0442657470703125, 0.046935081481933594, 0.04960441589355469, 0.05227375030517578, 0.054943084716796875, 0.05761241912841797, 0.06028175354003906, 0.06295108795166016, 0.06562042236328125, 0.06828975677490234, 0.07095909118652344, 0.07362842559814453, 0.07629776000976562, 0.07896709442138672, 0.08163642883300781, 0.0843057632446289, 0.08697509765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 22.0, 29.0, 119.0, 339.0, 325.0, 94.0, 31.0, 16.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.468199729919434, -4.3328423500061035, -4.197485446929932, -4.062128067016602, -3.9267709255218506, -3.7914137840270996, -3.6560564041137695, -3.5206992626190186, -3.3853421211242676, -3.2499849796295166, -3.1146275997161865, -2.9792704582214355, -2.8439133167266846, -2.7085561752319336, -2.5731987953186035, -2.4378416538238525, -2.3024842739105225, -2.1671271324157715, -2.0317697525024414, -1.8964126110076904, -1.7610554695129395, -1.625698208808899, -1.4903409481048584, -1.3549838066101074, -1.219626545906067, -1.0842692852020264, -0.9489121437072754, -0.8135548830032349, -0.6781976819038391, -0.5428404808044434, -0.40748322010040283, -0.2721260190010071, -0.13676881790161133, -0.0014116019010543823, 0.13394561409950256, 0.2693028450012207, 0.40466004610061646, 0.5400172472000122, 0.6753745079040527, 0.8107317090034485, 0.9460889101028442, 1.0814461708068848, 1.2168033123016357, 1.3521605730056763, 1.4875178337097168, 1.6228749752044678, 1.7582322359085083, 1.8935894966125488, 2.0289466381073, 2.164303779602051, 2.299661159515381, 2.435018301010132, 2.570375442504883, 2.705732822418213, 2.841089963912964, 2.976447105407715, 3.111804485321045, 3.247161626815796, 3.382519006729126, 3.517876148223877, 3.653233289718628, 3.788590431213379, 3.923947811126709, 4.059305191040039, 4.194662094116211]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 7.0, 9.0, 11.0, 9.0, 15.0, 16.0, 15.0, 10.0, 13.0, 23.0, 13.0, 40.0, 32.0, 26.0, 46.0, 48.0, 77.0, 98.0, 91.0, 78.0, 48.0, 19.0, 32.0, 23.0, 27.0, 27.0, 24.0, 13.0, 16.0, 9.0, 16.0, 13.0, 8.0, 5.0, 7.0, 8.0, 2.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5876935720443726, -1.5325590372085571, -1.4774245023727417, -1.4222898483276367, -1.3671553134918213, -1.3120207786560059, -1.2568862438201904, -1.201751708984375, -1.1466171741485596, -1.0914826393127441, -1.0363481044769287, -0.9812135100364685, -0.9260789752006531, -0.8709443807601929, -0.8158098459243774, -0.760675311088562, -0.7055407166481018, -0.6504061818122864, -0.5952715873718262, -0.5401370525360107, -0.4850025177001953, -0.4298679530620575, -0.3747333884239197, -0.31959885358810425, -0.26446428894996643, -0.2093297392129898, -0.15419518947601318, -0.09906062483787537, -0.04392607510089874, 0.01120847463607788, 0.0663430392742157, 0.12147757411003113, 0.17661213874816895, 0.23174668848514557, 0.2868812382221222, 0.34201580286026, 0.39715033769607544, 0.45228490233421326, 0.5074194669723511, 0.5625540018081665, 0.6176885366439819, 0.6728230714797974, 0.7279576659202576, 0.783092200756073, 0.8382267355918884, 0.8933613300323486, 0.9484958648681641, 1.0036303997039795, 1.058764934539795, 1.1138994693756104, 1.1690340042114258, 1.2241685390472412, 1.2793031930923462, 1.3344377279281616, 1.389572262763977, 1.4447067975997925, 1.4998414516448975, 1.554975986480713, 1.6101105213165283, 1.6652450561523438, 1.7203797101974487, 1.7755142450332642, 1.8306487798690796, 1.885783314704895, 1.9409178495407104]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 4.0, 4.0, 12.0, 9.0, 22.0, 28.0, 38.0, 49.0, 111.0, 135.0, 228.0, 337.0, 578.0, 922.0, 1526.0, 2530.0, 4625.0, 8723.0, 17166.0, 38454.0, 95556.0, 267121.0, 755823.0, 1514931.0, 945798.0, 335102.0, 115847.0, 45779.0, 20246.0, 9859.0, 5173.0, 2876.0, 1678.0, 1076.0, 685.0, 427.0, 283.0, 163.0, 101.0, 77.0, 54.0, 42.0, 31.0, 20.0, 3.0, 6.0, 14.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1583251953125, -0.15346908569335938, -0.14861297607421875, -0.14375686645507812, -0.1389007568359375, -0.13404464721679688, -0.12918853759765625, -0.12433242797851562, -0.119476318359375, -0.11462020874023438, -0.10976409912109375, -0.10490798950195312, -0.1000518798828125, -0.09519577026367188, -0.09033966064453125, -0.08548355102539062, -0.08062744140625, -0.07577133178710938, -0.07091522216796875, -0.06605911254882812, -0.0612030029296875, -0.056346893310546875, -0.05149078369140625, -0.046634674072265625, -0.041778564453125, -0.036922454833984375, -0.03206634521484375, -0.027210235595703125, -0.0223541259765625, -0.017498016357421875, -0.01264190673828125, -0.007785797119140625, -0.0029296875, 0.001926422119140625, 0.00678253173828125, 0.011638641357421875, 0.0164947509765625, 0.021350860595703125, 0.02620697021484375, 0.031063079833984375, 0.035919189453125, 0.040775299072265625, 0.04563140869140625, 0.050487518310546875, 0.0553436279296875, 0.060199737548828125, 0.06505584716796875, 0.06991195678710938, 0.07476806640625, 0.07962417602539062, 0.08448028564453125, 0.08933639526367188, 0.0941925048828125, 0.09904861450195312, 0.10390472412109375, 0.10876083374023438, 0.113616943359375, 0.11847305297851562, 0.12332916259765625, 0.12818527221679688, 0.1330413818359375, 0.13789749145507812, 0.14275360107421875, 0.14760971069335938, 0.1524658203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 3.0, 4.0, 13.0, 11.0, 17.0, 16.0, 19.0, 17.0, 34.0, 21.0, 31.0, 33.0, 28.0, 32.0, 42.0, 44.0, 52.0, 49.0, 41.0, 46.0, 58.0, 41.0, 34.0, 32.0, 40.0, 30.0, 28.0, 31.0, 28.0, 14.0, 18.0, 19.0, 9.0, 11.0, 13.0, 8.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11981201171875, -0.11605548858642578, -0.11229896545410156, -0.10854244232177734, -0.10478591918945312, -0.1010293960571289, -0.09727287292480469, -0.09351634979248047, -0.08975982666015625, -0.08600330352783203, -0.08224678039550781, -0.0784902572631836, -0.07473373413085938, -0.07097721099853516, -0.06722068786621094, -0.06346416473388672, -0.0597076416015625, -0.05595111846923828, -0.05219459533691406, -0.048438072204589844, -0.044681549072265625, -0.040925025939941406, -0.03716850280761719, -0.03341197967529297, -0.02965545654296875, -0.02589893341064453, -0.022142410278320312, -0.018385887145996094, -0.014629364013671875, -0.010872840881347656, -0.0071163177490234375, -0.0033597946166992188, 0.000396728515625, 0.004153251647949219, 0.007909774780273438, 0.011666297912597656, 0.015422821044921875, 0.019179344177246094, 0.022935867309570312, 0.02669239044189453, 0.03044891357421875, 0.03420543670654297, 0.03796195983886719, 0.041718482971191406, 0.045475006103515625, 0.049231529235839844, 0.05298805236816406, 0.05674457550048828, 0.0605010986328125, 0.06425762176513672, 0.06801414489746094, 0.07177066802978516, 0.07552719116210938, 0.0792837142944336, 0.08304023742675781, 0.08679676055908203, 0.09055328369140625, 0.09430980682373047, 0.09806632995605469, 0.1018228530883789, 0.10557937622070312, 0.10933589935302734, 0.11309242248535156, 0.11684894561767578, 0.12060546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 8.0, 4.0, 10.0, 14.0, 12.0, 19.0, 44.0, 57.0, 88.0, 116.0, 199.0, 353.0, 661.0, 1634.0, 6828.0, 106835.0, 3953655.0, 113626.0, 6763.0, 1736.0, 696.0, 365.0, 194.0, 124.0, 68.0, 55.0, 33.0, 24.0, 17.0, 9.0, 7.0, 10.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.892578125, -0.8642501831054688, -0.8359222412109375, -0.8075942993164062, -0.779266357421875, -0.7509384155273438, -0.7226104736328125, -0.6942825317382812, -0.66595458984375, -0.6376266479492188, -0.6092987060546875, -0.5809707641601562, -0.552642822265625, -0.5243148803710938, -0.4959869384765625, -0.46765899658203125, -0.4393310546875, -0.41100311279296875, -0.3826751708984375, -0.35434722900390625, -0.326019287109375, -0.29769134521484375, -0.2693634033203125, -0.24103546142578125, -0.21270751953125, -0.18437957763671875, -0.1560516357421875, -0.12772369384765625, -0.099395751953125, -0.07106781005859375, -0.0427398681640625, -0.01441192626953125, 0.013916015625, 0.04224395751953125, 0.0705718994140625, 0.09889984130859375, 0.127227783203125, 0.15555572509765625, 0.1838836669921875, 0.21221160888671875, 0.24053955078125, 0.26886749267578125, 0.2971954345703125, 0.32552337646484375, 0.353851318359375, 0.38217926025390625, 0.4105072021484375, 0.43883514404296875, 0.4671630859375, 0.49549102783203125, 0.5238189697265625, 0.5521469116210938, 0.580474853515625, 0.6088027954101562, 0.6371307373046875, 0.6654586791992188, 0.69378662109375, 0.7221145629882812, 0.7504425048828125, 0.7787704467773438, 0.807098388671875, 0.8354263305664062, 0.8637542724609375, 0.8920822143554688, 0.92041015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 7.0, 11.0, 13.0, 16.0, 16.0, 33.0, 46.0, 62.0, 85.0, 110.0, 152.0, 230.0, 317.0, 441.0, 575.0, 588.0, 383.0, 289.0, 196.0, 152.0, 96.0, 77.0, 51.0, 25.0, 23.0, 20.0, 9.0, 11.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.3945655822753906, -0.38043975830078125, -0.3663139343261719, -0.3521881103515625, -0.3380622863769531, -0.32393646240234375, -0.3098106384277344, -0.295684814453125, -0.2815589904785156, -0.26743316650390625, -0.2533073425292969, -0.2391815185546875, -0.22505569458007812, -0.21092987060546875, -0.19680404663085938, -0.18267822265625, -0.16855239868164062, -0.15442657470703125, -0.14030075073242188, -0.1261749267578125, -0.11204910278320312, -0.09792327880859375, -0.08379745483398438, -0.069671630859375, -0.055545806884765625, -0.04141998291015625, -0.027294158935546875, -0.0131683349609375, 0.000957489013671875, 0.01508331298828125, 0.029209136962890625, 0.0433349609375, 0.057460784912109375, 0.07158660888671875, 0.08571243286132812, 0.0998382568359375, 0.11396408081054688, 0.12808990478515625, 0.14221572875976562, 0.156341552734375, 0.17046737670898438, 0.18459320068359375, 0.19871902465820312, 0.2128448486328125, 0.22697067260742188, 0.24109649658203125, 0.2552223205566406, 0.26934814453125, 0.2834739685058594, 0.29759979248046875, 0.3117256164550781, 0.3258514404296875, 0.3399772644042969, 0.35410308837890625, 0.3682289123535156, 0.382354736328125, 0.3964805603027344, 0.41060638427734375, 0.4247322082519531, 0.4388580322265625, 0.4529838562011719, 0.46710968017578125, 0.4812355041503906, 0.495361328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 9.0, 16.0, 26.0, 22.0, 52.0, 85.0, 139.0, 162.0, 157.0, 127.0, 85.0, 44.0, 27.0, 12.0, 4.0, 13.0, 5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5635986328125, -6.395124912261963, -6.226650714874268, -6.0581769943237305, -5.889702796936035, -5.721229076385498, -5.552755355834961, -5.384281158447266, -5.2158074378967285, -5.047333717346191, -4.878859519958496, -4.710385799407959, -4.541912078857422, -4.373437881469727, -4.2049641609191895, -4.036490440368652, -3.868016242980957, -3.699542284011841, -3.5310683250427246, -3.3625946044921875, -3.1941206455230713, -3.025646686553955, -2.857172966003418, -2.6886990070343018, -2.5202250480651855, -2.3517510890960693, -2.183277130126953, -2.014803409576416, -1.8463294506072998, -1.6778554916381836, -1.509381651878357, -1.3409078121185303, -1.172433853149414, -1.0039598941802979, -0.8354860544204712, -0.6670121550559998, -0.4985382556915283, -0.3300643563270569, -0.16159045696258545, 0.006883382797241211, 0.17535734176635742, 0.34383124113082886, 0.5123051404953003, 0.6807790398597717, 0.8492529392242432, 1.0177268981933594, 1.186200737953186, 1.3546745777130127, 1.523148536682129, 1.6916224956512451, 1.8600963354110718, 2.0285701751708984, 2.1970441341400146, 2.365518093109131, 2.533991813659668, 2.702465772628784, 2.8709397315979004, 3.0394136905670166, 3.207887649536133, 3.37636137008667, 3.544835329055786, 3.7133092880249023, 3.8817830085754395, 4.050256729125977, 4.218730926513672]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 2.0, 5.0, 5.0, 8.0, 5.0, 9.0, 15.0, 14.0, 10.0, 21.0, 23.0, 15.0, 27.0, 26.0, 29.0, 33.0, 36.0, 35.0, 23.0, 31.0, 54.0, 42.0, 40.0, 48.0, 45.0, 36.0, 33.0, 36.0, 27.0, 26.0, 23.0, 23.0, 23.0, 25.0, 14.0, 24.0, 15.0, 13.0, 16.0, 7.0, 10.0, 12.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.9179359674453735, -1.856309413909912, -1.7946829795837402, -1.7330564260482788, -1.6714298725128174, -1.6098034381866455, -1.548176884651184, -1.4865503311157227, -1.4249238967895508, -1.3632973432540894, -1.3016709089279175, -1.240044355392456, -1.1784179210662842, -1.1167913675308228, -1.0551648139953613, -0.9935383200645447, -0.931911826133728, -0.8702853322029114, -0.8086588382720947, -0.7470322847366333, -0.6854057908058167, -0.623779296875, -0.5621527433395386, -0.5005262494087219, -0.4388997554779053, -0.3772732615470886, -0.3156467378139496, -0.25402021408081055, -0.1923937201499939, -0.13076722621917725, -0.06914070248603821, -0.00751417875289917, 0.05411243438720703, 0.11573894321918488, 0.17736545205116272, 0.23899196088314056, 0.3006184697151184, 0.36224496364593506, 0.4238714873790741, 0.48549801111221313, 0.5471245050430298, 0.6087509989738464, 0.6703774929046631, 0.7320040464401245, 0.7936305403709412, 0.8552570343017578, 0.9168835878372192, 0.9785100817680359, 1.0401365756988525, 1.101763129234314, 1.1633895635604858, 1.2250161170959473, 1.2866425514221191, 1.3482691049575806, 1.409895658493042, 1.4715220928192139, 1.5331486463546753, 1.5947751998901367, 1.6564016342163086, 1.71802818775177, 1.7796547412872314, 1.8412811756134033, 1.9029077291488647, 1.9645342826843262, 2.026160717010498]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 11.0, 12.0, 9.0, 18.0, 27.0, 53.0, 77.0, 136.0, 232.0, 433.0, 716.0, 1474.0, 2799.0, 6116.0, 15735.0, 49248.0, 223800.0, 588728.0, 110668.0, 28949.0, 10368.0, 4352.0, 2042.0, 1126.0, 568.0, 329.0, 189.0, 112.0, 85.0, 49.0, 31.0, 15.0, 8.0, 13.0, 4.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.1764507293701172, -0.16918563842773438, -0.16192054748535156, -0.15465545654296875, -0.14739036560058594, -0.14012527465820312, -0.1328601837158203, -0.1255950927734375, -0.11833000183105469, -0.11106491088867188, -0.10379981994628906, -0.09653472900390625, -0.08926963806152344, -0.08200454711914062, -0.07473945617675781, -0.067474365234375, -0.06020927429199219, -0.052944183349609375, -0.04567909240722656, -0.03841400146484375, -0.031148910522460938, -0.023883819580078125, -0.016618728637695312, -0.0093536376953125, -0.0020885467529296875, 0.005176544189453125, 0.012441635131835938, 0.01970672607421875, 0.026971817016601562, 0.034236907958984375, 0.04150199890136719, 0.04876708984375, 0.05603218078613281, 0.06329727172851562, 0.07056236267089844, 0.07782745361328125, 0.08509254455566406, 0.09235763549804688, 0.09962272644042969, 0.1068878173828125, 0.11415290832519531, 0.12141799926757812, 0.12868309020996094, 0.13594818115234375, 0.14321327209472656, 0.15047836303710938, 0.1577434539794922, 0.165008544921875, 0.1722736358642578, 0.17953872680664062, 0.18680381774902344, 0.19406890869140625, 0.20133399963378906, 0.20859909057617188, 0.2158641815185547, 0.2231292724609375, 0.2303943634033203, 0.23765945434570312, 0.24492454528808594, 0.25218963623046875, 0.25945472717285156, 0.2667198181152344, 0.2739849090576172, 0.28125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 4.0, 6.0, 13.0, 13.0, 20.0, 20.0, 34.0, 38.0, 44.0, 61.0, 55.0, 61.0, 84.0, 71.0, 80.0, 57.0, 54.0, 57.0, 45.0, 49.0, 31.0, 27.0, 20.0, 16.0, 7.0, 15.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15665817260742188, -0.14827728271484375, -0.13989639282226562, -0.1315155029296875, -0.12313461303710938, -0.11475372314453125, -0.10637283325195312, -0.097991943359375, -0.08961105346679688, -0.08123016357421875, -0.07284927368164062, -0.0644683837890625, -0.056087493896484375, -0.04770660400390625, -0.039325714111328125, -0.03094482421875, -0.022563934326171875, -0.01418304443359375, -0.005802154541015625, 0.0025787353515625, 0.010959625244140625, 0.01934051513671875, 0.027721405029296875, 0.036102294921875, 0.044483184814453125, 0.05286407470703125, 0.061244964599609375, 0.0696258544921875, 0.07800674438476562, 0.08638763427734375, 0.09476852416992188, 0.1031494140625, 0.11153030395507812, 0.11991119384765625, 0.12829208374023438, 0.1366729736328125, 0.14505386352539062, 0.15343475341796875, 0.16181564331054688, 0.170196533203125, 0.17857742309570312, 0.18695831298828125, 0.19533920288085938, 0.2037200927734375, 0.21210098266601562, 0.22048187255859375, 0.22886276245117188, 0.23724365234375, 0.24562454223632812, 0.25400543212890625, 0.2623863220214844, 0.2707672119140625, 0.2791481018066406, 0.28752899169921875, 0.2959098815917969, 0.304290771484375, 0.3126716613769531, 0.32105255126953125, 0.3294334411621094, 0.3378143310546875, 0.3461952209472656, 0.35457611083984375, 0.3629570007324219, 0.371337890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 2.0, 14.0, 12.0, 42.0, 54.0, 75.0, 111.0, 235.0, 641.0, 2246.0, 14532.0, 804249.0, 212356.0, 10811.0, 1878.0, 678.0, 275.0, 134.0, 74.0, 38.0, 19.0, 23.0, 14.0, 9.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4615020751953125, -0.444976806640625, -0.4284515380859375, -0.41192626953125, -0.3954010009765625, -0.378875732421875, -0.3623504638671875, -0.3458251953125, -0.3292999267578125, -0.312774658203125, -0.2962493896484375, -0.27972412109375, -0.2631988525390625, -0.246673583984375, -0.2301483154296875, -0.213623046875, -0.1970977783203125, -0.180572509765625, -0.1640472412109375, -0.14752197265625, -0.1309967041015625, -0.114471435546875, -0.0979461669921875, -0.0814208984375, -0.0648956298828125, -0.048370361328125, -0.0318450927734375, -0.01531982421875, 0.0012054443359375, 0.017730712890625, 0.0342559814453125, 0.05078125, 0.0673065185546875, 0.083831787109375, 0.1003570556640625, 0.11688232421875, 0.1334075927734375, 0.149932861328125, 0.1664581298828125, 0.1829833984375, 0.1995086669921875, 0.216033935546875, 0.2325592041015625, 0.24908447265625, 0.2656097412109375, 0.282135009765625, 0.2986602783203125, 0.315185546875, 0.3317108154296875, 0.348236083984375, 0.3647613525390625, 0.38128662109375, 0.3978118896484375, 0.414337158203125, 0.4308624267578125, 0.4473876953125, 0.4639129638671875, 0.480438232421875, 0.4969635009765625, 0.51348876953125, 0.5300140380859375, 0.546539306640625, 0.5630645751953125, 0.57958984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 9.0, 2.0, 3.0, 3.0, 7.0, 10.0, 10.0, 8.0, 23.0, 16.0, 19.0, 23.0, 26.0, 34.0, 28.0, 33.0, 66.0, 67.0, 68.0, 91.0, 75.0, 62.0, 56.0, 43.0, 30.0, 34.0, 28.0, 21.0, 17.0, 16.0, 11.0, 10.0, 10.0, 10.0, 13.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6016921997070312, -0.5759429931640625, -0.5501937866210938, -0.524444580078125, -0.49869537353515625, -0.4729461669921875, -0.44719696044921875, -0.42144775390625, -0.39569854736328125, -0.3699493408203125, -0.34420013427734375, -0.318450927734375, -0.29270172119140625, -0.2669525146484375, -0.24120330810546875, -0.2154541015625, -0.18970489501953125, -0.1639556884765625, -0.13820648193359375, -0.112457275390625, -0.08670806884765625, -0.0609588623046875, -0.03520965576171875, -0.00946044921875, 0.01628875732421875, 0.0420379638671875, 0.06778717041015625, 0.093536376953125, 0.11928558349609375, 0.1450347900390625, 0.17078399658203125, 0.196533203125, 0.22228240966796875, 0.2480316162109375, 0.27378082275390625, 0.299530029296875, 0.32527923583984375, 0.3510284423828125, 0.37677764892578125, 0.40252685546875, 0.42827606201171875, 0.4540252685546875, 0.47977447509765625, 0.505523681640625, 0.5312728881835938, 0.5570220947265625, 0.5827713012695312, 0.6085205078125, 0.6342697143554688, 0.6600189208984375, 0.6857681274414062, 0.711517333984375, 0.7372665405273438, 0.7630157470703125, 0.7887649536132812, 0.81451416015625, 0.8402633666992188, 0.8660125732421875, 0.8917617797851562, 0.917510986328125, 0.9432601928710938, 0.9690093994140625, 0.9947586059570312, 1.0205078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 3.0, 12.0, 16.0, 27.0, 37.0, 70.0, 138.0, 261.0, 570.0, 1468.0, 5054.0, 25902.0, 759245.0, 228451.0, 20632.0, 4283.0, 1327.0, 538.0, 250.0, 110.0, 53.0, 35.0, 22.0, 16.0, 17.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09747314453125, -0.09476089477539062, -0.09204864501953125, -0.08933639526367188, -0.0866241455078125, -0.08391189575195312, -0.08119964599609375, -0.07848739624023438, -0.075775146484375, -0.07306289672851562, -0.07035064697265625, -0.06763839721679688, -0.0649261474609375, -0.062213897705078125, -0.05950164794921875, -0.056789398193359375, -0.0540771484375, -0.051364898681640625, -0.04865264892578125, -0.045940399169921875, -0.0432281494140625, -0.040515899658203125, -0.03780364990234375, -0.035091400146484375, -0.032379150390625, -0.029666900634765625, -0.02695465087890625, -0.024242401123046875, -0.0215301513671875, -0.018817901611328125, -0.01610565185546875, -0.013393402099609375, -0.01068115234375, -0.007968902587890625, -0.00525665283203125, -0.002544403076171875, 0.0001678466796875, 0.002880096435546875, 0.00559234619140625, 0.008304595947265625, 0.011016845703125, 0.013729095458984375, 0.01644134521484375, 0.019153594970703125, 0.0218658447265625, 0.024578094482421875, 0.02729034423828125, 0.030002593994140625, 0.03271484375, 0.035427093505859375, 0.03813934326171875, 0.040851593017578125, 0.0435638427734375, 0.046276092529296875, 0.04898834228515625, 0.051700592041015625, 0.054412841796875, 0.057125091552734375, 0.05983734130859375, 0.06254959106445312, 0.0652618408203125, 0.06797409057617188, 0.07068634033203125, 0.07339859008789062, 0.07611083984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 7.0, 3.0, 8.0, 7.0, 10.0, 15.0, 7.0, 16.0, 11.0, 20.0, 35.0, 20.0, 31.0, 41.0, 55.0, 72.0, 77.0, 69.0, 88.0, 80.0, 49.0, 52.0, 44.0, 27.0, 27.0, 22.0, 22.0, 11.0, 14.0, 8.0, 10.0, 5.0, 8.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.5212764739990234e-05, -2.436712384223938e-05, -2.3521482944488525e-05, -2.267584204673767e-05, -2.1830201148986816e-05, -2.0984560251235962e-05, -2.0138919353485107e-05, -1.9293278455734253e-05, -1.84476375579834e-05, -1.7601996660232544e-05, -1.675635576248169e-05, -1.5910714864730835e-05, -1.506507396697998e-05, -1.4219433069229126e-05, -1.3373792171478271e-05, -1.2528151273727417e-05, -1.1682510375976562e-05, -1.0836869478225708e-05, -9.991228580474854e-06, -9.145587682723999e-06, -8.299946784973145e-06, -7.45430588722229e-06, -6.6086649894714355e-06, -5.763024091720581e-06, -4.9173831939697266e-06, -4.071742296218872e-06, -3.2261013984680176e-06, -2.380460500717163e-06, -1.5348196029663086e-06, -6.891787052154541e-07, 1.564621925354004e-07, 1.0021030902862549e-06, 1.8477439880371094e-06, 2.693384885787964e-06, 3.5390257835388184e-06, 4.384666681289673e-06, 5.230307579040527e-06, 6.075948476791382e-06, 6.921589374542236e-06, 7.76723027229309e-06, 8.612871170043945e-06, 9.4585120677948e-06, 1.0304152965545654e-05, 1.1149793863296509e-05, 1.1995434761047363e-05, 1.2841075658798218e-05, 1.3686716556549072e-05, 1.4532357454299927e-05, 1.537799835205078e-05, 1.6223639249801636e-05, 1.706928014755249e-05, 1.7914921045303345e-05, 1.87605619430542e-05, 1.9606202840805054e-05, 2.0451843738555908e-05, 2.1297484636306763e-05, 2.2143125534057617e-05, 2.298876643180847e-05, 2.3834407329559326e-05, 2.468004822731018e-05, 2.5525689125061035e-05, 2.637133002281189e-05, 2.7216970920562744e-05, 2.80626118183136e-05, 2.8908252716064453e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 5.0, 8.0, 13.0, 14.0, 23.0, 38.0, 42.0, 97.0, 127.0, 213.0, 458.0, 730.0, 1563.0, 3663.0, 8922.0, 25886.0, 113294.0, 791761.0, 69819.0, 19138.0, 6948.0, 2877.0, 1382.0, 691.0, 317.0, 196.0, 115.0, 68.0, 46.0, 28.0, 17.0, 13.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05816650390625, -0.05618572235107422, -0.05420494079589844, -0.052224159240722656, -0.050243377685546875, -0.048262596130371094, -0.04628181457519531, -0.04430103302001953, -0.04232025146484375, -0.04033946990966797, -0.03835868835449219, -0.036377906799316406, -0.034397125244140625, -0.032416343688964844, -0.030435562133789062, -0.02845478057861328, -0.0264739990234375, -0.02449321746826172, -0.022512435913085938, -0.020531654357910156, -0.018550872802734375, -0.016570091247558594, -0.014589309692382812, -0.012608528137207031, -0.01062774658203125, -0.008646965026855469, -0.0066661834716796875, -0.004685401916503906, -0.002704620361328125, -0.0007238388061523438, 0.0012569427490234375, 0.0032377243041992188, 0.005218505859375, 0.007199287414550781, 0.009180068969726562, 0.011160850524902344, 0.013141632080078125, 0.015122413635253906, 0.017103195190429688, 0.01908397674560547, 0.02106475830078125, 0.02304553985595703, 0.025026321411132812, 0.027007102966308594, 0.028987884521484375, 0.030968666076660156, 0.03294944763183594, 0.03493022918701172, 0.0369110107421875, 0.03889179229736328, 0.04087257385253906, 0.042853355407714844, 0.044834136962890625, 0.046814918518066406, 0.04879570007324219, 0.05077648162841797, 0.05275726318359375, 0.05473804473876953, 0.05671882629394531, 0.058699607849121094, 0.060680389404296875, 0.06266117095947266, 0.06464195251464844, 0.06662273406982422, 0.068603515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 4.0, 7.0, 15.0, 12.0, 14.0, 15.0, 18.0, 20.0, 26.0, 51.0, 59.0, 77.0, 92.0, 100.0, 85.0, 87.0, 77.0, 58.0, 35.0, 24.0, 25.0, 22.0, 13.0, 11.0, 7.0, 4.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.088134765625, -0.08552742004394531, -0.08292007446289062, -0.08031272888183594, -0.07770538330078125, -0.07509803771972656, -0.07249069213867188, -0.06988334655761719, -0.0672760009765625, -0.06466865539550781, -0.062061309814453125, -0.05945396423339844, -0.05684661865234375, -0.05423927307128906, -0.051631927490234375, -0.04902458190917969, -0.046417236328125, -0.04380989074707031, -0.041202545166015625, -0.03859519958496094, -0.03598785400390625, -0.03338050842285156, -0.030773162841796875, -0.028165817260742188, -0.0255584716796875, -0.022951126098632812, -0.020343780517578125, -0.017736434936523438, -0.01512908935546875, -0.012521743774414062, -0.009914398193359375, -0.0073070526123046875, -0.00469970703125, -0.0020923614501953125, 0.000514984130859375, 0.0031223297119140625, 0.00572967529296875, 0.008337020874023438, 0.010944366455078125, 0.013551712036132812, 0.0161590576171875, 0.018766403198242188, 0.021373748779296875, 0.023981094360351562, 0.02658843994140625, 0.029195785522460938, 0.031803131103515625, 0.03441047668457031, 0.037017822265625, 0.03962516784667969, 0.042232513427734375, 0.04483985900878906, 0.04744720458984375, 0.05005455017089844, 0.052661895751953125, 0.05526924133300781, 0.0578765869140625, 0.06048393249511719, 0.06309127807617188, 0.06569862365722656, 0.06830596923828125, 0.07091331481933594, 0.07352066040039062, 0.07612800598144531, 0.0787353515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 6.0, 14.0, 27.0, 43.0, 78.0, 183.0, 356.0, 131.0, 69.0, 35.0, 17.0, 12.0, 12.0, 6.0, 5.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9888582229614258, -0.8926008343696594, -0.7963434457778931, -0.7000859975814819, -0.6038286685943604, -0.5075712203979492, -0.41131383180618286, -0.3150564432144165, -0.21879905462265015, -0.12254165858030319, -0.026284262537956238, 0.06997314095497131, 0.16623052954673767, 0.26248791813850403, 0.3587453365325928, 0.45500272512435913, 0.5512601137161255, 0.6475175023078918, 0.7437748908996582, 0.8400323390960693, 0.9362896680831909, 1.032547116279602, 1.1288044452667236, 1.2250618934631348, 1.321319341659546, 1.417576789855957, 1.5138341188430786, 1.6100915670394897, 1.7063488960266113, 1.8026063442230225, 1.8988637924194336, 1.9951211214065552, 2.0913784503936768, 2.187635898590088, 2.283893346786499, 2.380150556564331, 2.476408004760742, 2.5726654529571533, 2.6689229011535645, 2.7651801109313965, 2.8614375591278076, 2.9576950073242188, 3.05395245552063, 3.150209665298462, 3.246467113494873, 3.342724561691284, 3.4389820098876953, 3.5352392196655273, 3.6314969062805176, 3.7277543544769287, 3.82401180267334, 3.920269012451172, 4.016526699066162, 4.112783908843994, 4.209041118621826, 4.305298805236816, 4.401556015014648, 4.4978132247924805, 4.594070911407471, 4.690328121185303, 4.786585807800293, 4.882843017578125, 4.979100227355957, 5.075357913970947, 5.171615123748779]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 9.0, 6.0, 6.0, 6.0, 6.0, 13.0, 5.0, 22.0, 15.0, 19.0, 23.0, 19.0, 33.0, 34.0, 57.0, 71.0, 123.0, 132.0, 108.0, 67.0, 38.0, 28.0, 25.0, 18.0, 24.0, 13.0, 12.0, 10.0, 11.0, 9.0, 12.0, 6.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.556845188140869, -2.4864301681518555, -2.416015386581421, -2.3456003665924072, -2.2751855850219727, -2.204770565032959, -2.1343557834625244, -2.0639407634735107, -1.9935258626937866, -1.9231109619140625, -1.8526960611343384, -1.7822811603546143, -1.7118661403656006, -1.641451358795166, -1.5710363388061523, -1.5006214380264282, -1.430206537246704, -1.35979163646698, -1.2893767356872559, -1.2189618349075317, -1.1485469341278076, -1.078131914138794, -1.0077170133590698, -0.9373021125793457, -0.8668872117996216, -0.7964723110198975, -0.7260574102401733, -0.6556424498558044, -0.5852275490760803, -0.5148126482963562, -0.4443977177143097, -0.3739827871322632, -0.30356764793395996, -0.23315273225307465, -0.16273781657218933, -0.09232290089130402, -0.0219079852104187, 0.04850691556930542, 0.11892184615135193, 0.18933677673339844, 0.25975167751312256, 0.3301665782928467, 0.4005815088748932, 0.4709964394569397, 0.5414113402366638, 0.6118262410163879, 0.6822412014007568, 0.752656102180481, 0.8230710029602051, 0.8934859037399292, 0.9639008045196533, 1.0343157052993774, 1.1047306060791016, 1.1751456260681152, 1.2455605268478394, 1.3159754276275635, 1.3863903284072876, 1.4568052291870117, 1.5272201299667358, 1.59763503074646, 1.6680500507354736, 1.7384648323059082, 1.8088798522949219, 1.879294753074646, 1.9497096538543701]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 5.0, 11.0, 10.0, 11.0, 14.0, 14.0, 18.0, 24.0, 23.0, 35.0, 23.0, 22.0, 28.0, 48.0, 64.0, 170.0, 118.0, 59.0, 40.0, 31.0, 25.0, 26.0, 18.0, 21.0, 16.0, 24.0, 12.0, 11.0, 17.0, 10.0, 10.0, 7.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15387916564941406, -0.14833450317382812, -0.1427898406982422, -0.13724517822265625, -0.1317005157470703, -0.12615585327148438, -0.12061119079589844, -0.1150665283203125, -0.10952186584472656, -0.10397720336914062, -0.09843254089355469, -0.09288787841796875, -0.08734321594238281, -0.08179855346679688, -0.07625389099121094, -0.070709228515625, -0.06516456604003906, -0.059619903564453125, -0.05407524108886719, -0.04853057861328125, -0.04298591613769531, -0.037441253662109375, -0.03189659118652344, -0.0263519287109375, -0.020807266235351562, -0.015262603759765625, -0.009717941284179688, -0.00417327880859375, 0.0013713836669921875, 0.006916046142578125, 0.012460708618164062, 0.01800537109375, 0.023550033569335938, 0.029094696044921875, 0.03463935852050781, 0.04018402099609375, 0.04572868347167969, 0.051273345947265625, 0.05681800842285156, 0.0623626708984375, 0.06790733337402344, 0.07345199584960938, 0.07899665832519531, 0.08454132080078125, 0.09008598327636719, 0.09563064575195312, 0.10117530822753906, 0.106719970703125, 0.11226463317871094, 0.11780929565429688, 0.12335395812988281, 0.12889862060546875, 0.1344432830810547, 0.13998794555664062, 0.14553260803222656, 0.1510772705078125, 0.15662193298339844, 0.16216659545898438, 0.1677112579345703, 0.17325592041015625, 0.1788005828857422, 0.18434524536132812, 0.18988990783691406, 0.1954345703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 2.0, 7.0, 9.0, 8.0, 14.0, 24.0, 32.0, 35.0, 42.0, 57.0, 99.0, 166.0, 370.0, 765.0, 2104.0, 6993.0, 63964.0, 8294026.0, 14207.0, 3358.0, 1198.0, 493.0, 231.0, 114.0, 57.0, 45.0, 39.0, 18.0, 9.0, 16.0, 19.0, 10.0, 7.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2476420402526855, -1.2122299671173096, -1.1768180131912231, -1.1414059400558472, -1.1059939861297607, -1.0705819129943848, -1.0351698398590088, -0.9997578263282776, -0.9643458127975464, -0.9289337992668152, -0.893521785736084, -0.858109712600708, -0.8226976990699768, -0.7872856855392456, -0.7518736124038696, -0.7164615988731384, -0.6810495853424072, -0.645637571811676, -0.6102255582809448, -0.5748134851455688, -0.5394014716148376, -0.5039894580841064, -0.46857741475105286, -0.43316537141799927, -0.39775335788726807, -0.36234134435653687, -0.3269293010234833, -0.2915172576904297, -0.2561052441596985, -0.2206932157278061, -0.1852811872959137, -0.1498691588640213, -0.1144571304321289, -0.07904510200023651, -0.043633073568344116, -0.008221045136451721, 0.027190983295440674, 0.06260301172733307, 0.09801504015922546, 0.13342706859111786, 0.16883909702301025, 0.20425112545490265, 0.23966315388679504, 0.27507519721984863, 0.31048721075057983, 0.34589922428131104, 0.3813112676143646, 0.4167233109474182, 0.4521353244781494, 0.4875473380088806, 0.5229593515396118, 0.5583714246749878, 0.593783438205719, 0.6291954517364502, 0.6646075248718262, 0.7000195384025574, 0.7354315519332886, 0.7708435654640198, 0.806255578994751, 0.841667652130127, 0.8770796656608582, 0.9124916791915894, 0.9479037523269653, 0.9833157658576965, 1.0187277793884277]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 2.0, 7.0, 9.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.232407569885254, -1.183804988861084, -1.135202407836914, -1.0865998268127441, -1.0379972457885742, -0.9893946647644043, -0.9407920241355896, -0.8921894431114197, -0.8435868620872498, -0.7949842810630798, -0.7463817000389099, -0.6977790594100952, -0.6491764783859253, -0.6005738973617554, -0.5519713163375854, -0.5033687353134155, -0.4547661542892456, -0.4061635732650757, -0.35756099224090576, -0.30895838141441345, -0.26035580039024353, -0.2117532193660736, -0.1631506085395813, -0.11454802751541138, -0.06594544649124146, -0.017342858016490936, 0.03125973045825958, 0.0798623263835907, 0.12846490740776062, 0.17706748843193054, 0.22567009925842285, 0.2742726802825928, 0.32287514209747314, 0.37147772312164307, 0.420080304145813, 0.4686829149723053, 0.5172854661941528, 0.5658880472183228, 0.6144906878471375, 0.6630932688713074, 0.7116958498954773, 0.7602984309196472, 0.8089010119438171, 0.8575036525726318, 0.9061062335968018, 0.9547088146209717, 1.0033113956451416, 1.0519139766693115, 1.1005165576934814, 1.1491191387176514, 1.1977217197418213, 1.2463243007659912, 1.2949268817901611, 1.343529462814331, 1.392132043838501, 1.440734624862671, 1.4893372058868408, 1.5379397869110107, 1.5865423679351807, 1.6351449489593506, 1.6837475299835205, 1.7323501110076904, 1.7809526920318604, 1.8295552730560303, 1.8781579732894897]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 5.0, 5.0, 8.0, 6.0, 12.0, 10.0, 12.0, 13.0, 27.0, 16.0, 21.0, 31.0, 28.0, 48.0, 63.0, 59.0, 57.0, 66.0, 70.0, 52.0, 63.0, 41.0, 40.0, 41.0, 42.0, 29.0, 25.0, 25.0, 18.0, 17.0, 11.0, 8.0, 11.0, 5.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1424560546875, -0.13739967346191406, -0.13234329223632812, -0.1272869110107422, -0.12223052978515625, -0.11717414855957031, -0.11211776733398438, -0.10706138610839844, -0.1020050048828125, -0.09694862365722656, -0.09189224243164062, -0.08683586120605469, -0.08177947998046875, -0.07672309875488281, -0.07166671752929688, -0.06661033630371094, -0.061553955078125, -0.05649757385253906, -0.051441192626953125, -0.04638481140136719, -0.04132843017578125, -0.03627204895019531, -0.031215667724609375, -0.026159286499023438, -0.0211029052734375, -0.016046524047851562, -0.010990142822265625, -0.0059337615966796875, -0.00087738037109375, 0.0041790008544921875, 0.009235382080078125, 0.014291763305664062, 0.01934814453125, 0.024404525756835938, 0.029460906982421875, 0.03451728820800781, 0.03957366943359375, 0.04463005065917969, 0.049686431884765625, 0.05474281311035156, 0.0597991943359375, 0.06485557556152344, 0.06991195678710938, 0.07496833801269531, 0.08002471923828125, 0.08508110046386719, 0.09013748168945312, 0.09519386291503906, 0.100250244140625, 0.10530662536621094, 0.11036300659179688, 0.11541938781738281, 0.12047576904296875, 0.1255321502685547, 0.13058853149414062, 0.13564491271972656, 0.1407012939453125, 0.14575767517089844, 0.15081405639648438, 0.1558704376220703, 0.16092681884765625, 0.1659832000732422, 0.17103958129882812, 0.17609596252441406, 0.18115234375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 13.0, 21.0, 25.0, 33.0, 73.0, 107.0, 195.0, 296.0, 611.0, 1350.0, 2774.0, 6783.0, 16844.0, 45559.0, 116810.0, 178288.0, 93744.0, 36044.0, 13952.0, 5693.0, 2527.0, 1155.0, 581.0, 322.0, 182.0, 109.0, 60.0, 38.0, 28.0, 11.0, 6.0, 7.0, 1.0, 5.0, 3.0, 0.0, 1.0], "bins": [-1.365234375, -1.3330230712890625, -1.300811767578125, -1.2686004638671875, -1.23638916015625, -1.2041778564453125, -1.171966552734375, -1.1397552490234375, -1.1075439453125, -1.0753326416015625, -1.043121337890625, -1.0109100341796875, -0.97869873046875, -0.9464874267578125, -0.914276123046875, -0.8820648193359375, -0.849853515625, -0.8176422119140625, -0.785430908203125, -0.7532196044921875, -0.72100830078125, -0.6887969970703125, -0.656585693359375, -0.6243743896484375, -0.5921630859375, -0.5599517822265625, -0.527740478515625, -0.4955291748046875, -0.46331787109375, -0.4311065673828125, -0.398895263671875, -0.3666839599609375, -0.33447265625, -0.3022613525390625, -0.270050048828125, -0.2378387451171875, -0.20562744140625, -0.1734161376953125, -0.141204833984375, -0.1089935302734375, -0.0767822265625, -0.0445709228515625, -0.012359619140625, 0.0198516845703125, 0.05206298828125, 0.0842742919921875, 0.116485595703125, 0.1486968994140625, 0.180908203125, 0.2131195068359375, 0.245330810546875, 0.2775421142578125, 0.30975341796875, 0.3419647216796875, 0.374176025390625, 0.4063873291015625, 0.4385986328125, 0.4708099365234375, 0.503021240234375, 0.5352325439453125, 0.56744384765625, 0.5996551513671875, 0.631866455078125, 0.6640777587890625, 0.6962890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 7.0, 8.0, 8.0, 7.0, 16.0, 17.0, 16.0, 20.0, 16.0, 30.0, 39.0, 41.0, 31.0, 58.0, 65.0, 50.0, 60.0, 56.0, 50.0, 54.0, 45.0, 40.0, 38.0, 39.0, 26.0, 24.0, 25.0, 21.0, 11.0, 12.0, 14.0, 8.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.178466796875, -0.17332077026367188, -0.16817474365234375, -0.16302871704101562, -0.1578826904296875, -0.15273666381835938, -0.14759063720703125, -0.14244461059570312, -0.137298583984375, -0.13215255737304688, -0.12700653076171875, -0.12186050415039062, -0.1167144775390625, -0.11156845092773438, -0.10642242431640625, -0.10127639770507812, -0.09613037109375, -0.09098434448242188, -0.08583831787109375, -0.08069229125976562, -0.0755462646484375, -0.07040023803710938, -0.06525421142578125, -0.060108184814453125, -0.054962158203125, -0.049816131591796875, -0.04467010498046875, -0.039524078369140625, -0.0343780517578125, -0.029232025146484375, -0.02408599853515625, -0.018939971923828125, -0.0137939453125, -0.008647918701171875, -0.00350189208984375, 0.001644134521484375, 0.0067901611328125, 0.011936187744140625, 0.01708221435546875, 0.022228240966796875, 0.027374267578125, 0.032520294189453125, 0.03766632080078125, 0.042812347412109375, 0.0479583740234375, 0.053104400634765625, 0.05825042724609375, 0.06339645385742188, 0.06854248046875, 0.07368850708007812, 0.07883453369140625, 0.08398056030273438, 0.0891265869140625, 0.09427261352539062, 0.09941864013671875, 0.10456466674804688, 0.109710693359375, 0.11485671997070312, 0.12000274658203125, 0.12514877319335938, 0.1302947998046875, 0.13544082641601562, 0.14058685302734375, 0.14573287963867188, 0.15087890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 28.0, 54.0, 124.0, 119.0, 66.0, 26.0, 10.0, 9.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3505499362945557, -2.2932605743408203, -2.235971212387085, -2.1786818504333496, -2.1213927268981934, -2.064103364944458, -2.0068140029907227, -1.9495246410369873, -1.892235279083252, -1.8349459171295166, -1.7776566743850708, -1.7203673124313354, -1.6630779504776, -1.6057887077331543, -1.548499345779419, -1.4912099838256836, -1.4339206218719482, -1.376631259918213, -1.319342017173767, -1.2620526552200317, -1.2047632932662964, -1.1474740505218506, -1.0901846885681152, -1.0328953266143799, -0.9756060838699341, -0.9183167815208435, -0.8610274195671082, -0.8037381172180176, -0.7464487552642822, -0.6891594529151917, -0.6318701505661011, -0.5745807886123657, -0.5172914266586304, -0.4600020945072174, -0.40271276235580444, -0.34542346000671387, -0.2881340980529785, -0.23084479570388794, -0.17355546355247498, -0.11626613140106201, -0.05897679924964905, -0.0016874708235263824, 0.05560185760259628, 0.11289118230342865, 0.1701805144548416, 0.22746983170509338, 0.28475916385650635, 0.3420484960079193, 0.3993378281593323, 0.45662716031074524, 0.5139164924621582, 0.5712057948112488, 0.6284951567649841, 0.6857844591140747, 0.7430738210678101, 0.8003631234169006, 0.8576524257659912, 0.9149417281150818, 0.9722310900688171, 1.0295203924179077, 1.086809754371643, 1.1440989971160889, 1.2013883590698242, 1.2586777210235596, 1.315967082977295]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 9.0, 13.0, 23.0, 49.0, 54.0, 78.0, 82.0, 49.0, 33.0, 12.0, 7.0, 7.0, 4.0, 8.0, 1.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9270635843276978, -0.8975524306297302, -0.8680412173271179, -0.8385300636291504, -0.8090188503265381, -0.7795076966285706, -0.749996542930603, -0.7204853296279907, -0.6909741759300232, -0.6614630222320557, -0.6319518089294434, -0.6024406552314758, -0.5729295015335083, -0.543418288230896, -0.5139071345329285, -0.48439595103263855, -0.45488476753234863, -0.4253735840320587, -0.3958624005317688, -0.36635124683380127, -0.33684006333351135, -0.30732887983322144, -0.2778177261352539, -0.248306542634964, -0.21879535913467407, -0.18928417563438416, -0.15977300703525543, -0.1302618384361267, -0.10075065493583679, -0.07123947143554688, -0.04172830283641815, -0.012217134237289429, 0.017294108867645264, 0.046805284917354584, 0.0763164609670639, 0.10582763701677322, 0.13533881306648254, 0.16484999656677246, 0.19436116516590118, 0.2238723337650299, 0.2533835172653198, 0.28289470076560974, 0.31240588426589966, 0.3419170379638672, 0.3714282214641571, 0.400939404964447, 0.43045055866241455, 0.45996174216270447, 0.4894729256629944, 0.5189840793609619, 0.5484952926635742, 0.5780064463615417, 0.6075176000595093, 0.6370288133621216, 0.6665399670600891, 0.6960511207580566, 0.725562334060669, 0.7550734877586365, 0.7845847010612488, 0.8140958547592163, 0.8436070680618286, 0.8731182217597961, 0.9026293754577637, 0.932140588760376, 0.9616517424583435]}, "eval/loss": 0.35239124298095703, "eval/wer": 0.10420468068226894, "eval/runtime": 326.5742, "eval/samples_per_second": 8.09, "eval/steps_per_second": 0.508} \ No newline at end of file